From dd7152d3b56b752ee3a6bf2cb45e1ec1eaad36d7 Mon Sep 17 00:00:00 2001 From: Noah Raynor Date: Tue, 16 Dec 2025 16:53:02 -0800 Subject: [PATCH 01/10] added simulations and quickstart --- fern/docs.yml | 6 + fern/observability/simulations-quickstart.mdx | 627 ++++++++++++++++++ 2 files changed, 633 insertions(+) create mode 100644 fern/observability/simulations-quickstart.mdx diff --git a/fern/docs.yml b/fern/docs.yml index 97e195f56..3c28388e5 100644 --- a/fern/docs.yml +++ b/fern/docs.yml @@ -289,6 +289,12 @@ navigation: - page: Advanced path: observability/evals-advanced.mdx icon: fa-light fa-clipboard-check + - section: Simulations + icon: fa-light fa-flask-vial + contents: + - page: Quickstart + path: observability/simulations-quickstart.mdx + icon: fa-light fa-rocket - page: Boards path: observability/boards-quickstart.mdx icon: fa-light fa-chart-line diff --git a/fern/observability/simulations-quickstart.mdx b/fern/observability/simulations-quickstart.mdx new file mode 100644 index 000000000..c58b5b3c7 --- /dev/null +++ b/fern/observability/simulations-quickstart.mdx @@ -0,0 +1,627 @@ +--- +title: Simulations quickstart +subtitle: Test your AI assistants with realistic AI-powered callers +slug: observability/simulations-quickstart +--- + +## Overview + +This quickstart guide will help you test your AI assistants and squads using realistic, AI-powered callers. In just a few minutes, you'll create test scenarios, define success criteria, and validate your agents work correctly under different conditions. + +### What are Simulations? + +Simulations is Vapi's voice agent testing framework that enables you to systematically test assistants and squads using AI-powered callers that follow defined goals and evaluate outcomes. Instead of relying on manual testing or rigid scripts, Simulations recreate real conversations and measure whether your assistant behaves correctly. Test your agents by: + +1. **Creating personalities** - Define how the AI caller behaves (e.g., decisive, indecisive, impatient) +2. **Defining scenarios** - Specify the caller's goal, constraints, and success criteria +3. **Running simulations** - Pair scenarios with personalities to test your assistant +4. **Monitoring results** - Watch tests in real time and review pass/fail outcomes +5. **Tracking performance** - Analyze historical results to identify trends + +### When are Simulations useful? + +Simulations help you maintain quality and catch issues early: + +- **Pre-deployment testing** - Validate new assistant configurations before going live +- **Regression testing** - Ensure prompt or tool changes don't break existing behaviors +- **Conversation flow validation** - Test multi-turn interactions and complex scenarios +- **Personality-based testing** - Verify your agent handles different caller types appropriately +- **Squad handoff testing** - Ensure smooth transitions between squad members +- **Performance monitoring** - Track success rates over time and identify regressions + +### What you'll build + +A simulation suite for an appointment booking assistant that tests: + +- Different caller personalities (decisive vs. indecisive) +- Goal completion and success criteria validation +- Real-time monitoring of test calls +- Historical performance tracking + +## Prerequisites + + + + Sign up at [dashboard.vapi.ai](https://dashboard.vapi.ai) + + + Get your API key from **API Keys** in sidebar + + + + + You'll also need an existing assistant or squad to test. You can create one in + the Dashboard or use the API. 
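+
+  For example, you can create a minimal assistant with a single API call (a sketch; adjust the model and voice to your setup):
+
+  ```bash
+  curl -X POST "https://api.vapi.ai/assistant" \
+    -H "Authorization: Bearer $VAPI_API_KEY" \
+    -H "Content-Type: application/json" \
+    -d '{
+      "name": "Appointment Booking Assistant",
+      "model": { "provider": "openai", "model": "gpt-4o" },
+      "voice": { "provider": "cartesia", "voiceId": "sonic-english" }
+    }'
+  ```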
+ + +## Step 1: Create a personality (optional) + +Personalities define how the AI caller behaves during a test call. You can use built-in default personalities or create custom ones. + + + + + + 1. Log in to [dashboard.vapi.ai](https://dashboard.vapi.ai) + 2. Click on **Simulations** in the left sidebar + 3. Click the **Personalities** tab + + + + 1. Click **Create Personality** + 2. **Name**: Enter "Impatient Customer" + 3. **Description**: Add "A busy customer who wants quick answers and may interrupt" + 4. **Behavior**: Define the personality traits: + - Speaks quickly and directly + - May interrupt if responses are too long + - Expects immediate solutions + 5. Click **Save** + + + + + Start with the built-in default personalities to get familiar with the system before creating custom ones. + + + + +```bash +curl -X POST "https://api.vapi.ai/simulation/personality" \ + -H "Authorization: Bearer $VAPI_API_KEY" \ + -H "Content-Type: application/json" \ + -d '{ + "name": "Impatient Customer", + "description": "A busy customer who wants quick answers and may interrupt", + "behavior": "Speaks quickly and directly. May interrupt if responses are too long. Expects immediate solutions." + }' +``` + +**Response:** + +```json +{ + "id": "personality-123", + "orgId": "org-456", + "name": "Impatient Customer", + "description": "A busy customer who wants quick answers and may interrupt", + "behavior": "Speaks quickly and directly. May interrupt if responses are too long. Expects immediate solutions.", + "createdAt": "2024-01-15T09:30:00Z", + "updatedAt": "2024-01-15T09:30:00Z" +} +``` + +Save the returned `id` - you'll need it when creating simulations. + + + + + **Personality types:** Consider creating personalities for different customer types you encounter: decisive buyers, hesitant customers, detail-oriented users, or frustrated callers. + + +## Step 2: Create a scenario + +Scenarios define what the test call is trying to accomplish, including the goal and success criteria. + + + + + + 1. In **Simulations**, click the **Scenarios** tab + 2. Click **Create Scenario** + + + + 1. **Name**: Enter "Book Appointment" + 2. **Description**: Add "Test that the assistant can successfully book an appointment" + 3. **Goal**: Define what the caller is trying to accomplish: + - "Schedule an appointment for next Monday at 2pm" + 4. **Constraints** (optional): Add any limitations: + - "Only available on weekdays" + - "Preferred morning appointments" + + + + 1. Click **Add Success Criterion** + 2. Define what must happen for the test to pass: + - "Appointment is confirmed with a specific date and time" + - "Confirmation number is provided" + 3. 
Click **Save Scenario** + + + + + +```bash +curl -X POST "https://api.vapi.ai/simulation/scenario" \ + -H "Authorization: Bearer $VAPI_API_KEY" \ + -H "Content-Type: application/json" \ + -d '{ + "name": "Book Appointment", + "description": "Test that the assistant can successfully book an appointment", + "goal": "Schedule an appointment for next Monday at 2pm", + "constraints": [ + "Only available on weekdays", + "Preferred morning appointments" + ], + "successCriteria": [ + "Appointment is confirmed with a specific date and time", + "Confirmation number is provided" + ] + }' +``` + +**Response:** + +```json +{ + "id": "scenario-789", + "orgId": "org-456", + "name": "Book Appointment", + "description": "Test that the assistant can successfully book an appointment", + "goal": "Schedule an appointment for next Monday at 2pm", + "constraints": [ + "Only available on weekdays", + "Preferred morning appointments" + ], + "successCriteria": [ + "Appointment is confirmed with a specific date and time", + "Confirmation number is provided" + ], + "createdAt": "2024-01-15T09:35:00Z", + "updatedAt": "2024-01-15T09:35:00Z" +} +``` + +Save the returned `id` - you'll need it when creating simulations. + + + + + **Success criteria tips:** Be specific about what constitutes success. Include both the action (appointment booked) and the verification (confirmation provided). + + +## Step 3: Create a simulation + +Simulations pair a scenario with a personality and select the assistant or squad you want to test. + + + + + + 1. In **Simulations**, click the **Simulations** tab + 2. Click **Create Simulation** + + + + 1. **Name**: Enter "Appointment Booking - Impatient Customer" + 2. **Scenario**: Select "Book Appointment" from the dropdown + 3. **Personality**: Select "Impatient Customer" (or use a default) + 4. **Target**: Choose **Assistant** or **Squad** + 5. Select your assistant/squad from the dropdown + 6. Click **Save Simulation** + + + + + +```bash +curl -X POST "https://api.vapi.ai/simulation" \ + -H "Authorization: Bearer $VAPI_API_KEY" \ + -H "Content-Type: application/json" \ + -d '{ + "name": "Appointment Booking - Impatient Customer", + "scenarioId": "scenario-789", + "personalityId": "personality-123", + "target": { + "type": "assistant", + "assistantId": "your-assistant-id" + } + }' +``` + +**Response:** + +```json +{ + "id": "simulation-abc", + "orgId": "org-456", + "name": "Appointment Booking - Impatient Customer", + "scenarioId": "scenario-789", + "personalityId": "personality-123", + "target": { + "type": "assistant", + "assistantId": "your-assistant-id" + }, + "createdAt": "2024-01-15T09:40:00Z", + "updatedAt": "2024-01-15T09:40:00Z" +} +``` + +Save the returned `id` - you'll need it when creating simulation suites. + + + + + **Multiple simulations:** Create several simulations with different personality and scenario combinations to thoroughly test your assistant across various conditions. + + +## Step 4: Create a simulation suite + +Simulation suites group multiple simulations into a single batch that runs together. + + + + + + 1. In **Simulations**, click the **Suites** tab + 2. Click **Create Suite** + + + + 1. **Name**: Enter "Appointment Booking Regression Suite" + 2. **Description**: Add "Tests appointment booking across different customer types" + 3. Click **Add Simulations** + 4. Select the simulations you want to include: + - "Appointment Booking - Impatient Customer" + - "Appointment Booking - Decisive Customer" + - "Appointment Booking - Indecisive Customer" + 5. 
Click **Save Suite** + + + + + +```bash +curl -X POST "https://api.vapi.ai/simulation/suite" \ + -H "Authorization: Bearer $VAPI_API_KEY" \ + -H "Content-Type: application/json" \ + -d '{ + "name": "Appointment Booking Regression Suite", + "description": "Tests appointment booking across different customer types", + "simulationIds": [ + "simulation-abc", + "simulation-def", + "simulation-ghi" + ] + }' +``` + +**Response:** + +```json +{ + "id": "suite-xyz", + "orgId": "org-456", + "name": "Appointment Booking Regression Suite", + "description": "Tests appointment booking across different customer types", + "simulationIds": [ + "simulation-abc", + "simulation-def", + "simulation-ghi" + ], + "createdAt": "2024-01-15T09:45:00Z", + "updatedAt": "2024-01-15T09:45:00Z" +} +``` + +Save the returned `id` - you'll need it to run the suite. + + + + + **Suite organization:** Group related simulations together. For example, create separate suites for "Booking Tests", "Cancellation Tests", and "Rescheduling Tests". + + +## Step 5: Run the suite + +Execute all simulations in your suite and monitor them in real time. + + + + + + 1. Navigate to your suite in the **Suites** tab + 2. Click **Run Suite** + 3. All simulations in the suite will be queued and executed + + + + 1. Click the **Runs** tab to see live status updates + 2. Watch as each simulation progresses: + - **Queued** - Waiting to start + - **Running** - Call in progress + - **Completed** - Test finished + 3. Click **Listen** on any running test to hear the call live + + + + + +**Run the suite:** + +```bash +curl -X POST "https://api.vapi.ai/simulation/suite/suite-xyz/run" \ + -H "Authorization: Bearer $VAPI_API_KEY" +``` + +**Response:** + +```json +{ + "id": "run-123", + "suiteId": "suite-xyz", + "status": "running", + "simulations": [ + { + "simulationId": "simulation-abc", + "status": "queued" + }, + { + "simulationId": "simulation-def", + "status": "queued" + }, + { + "simulationId": "simulation-ghi", + "status": "queued" + } + ], + "createdAt": "2024-01-15T09:50:00Z" +} +``` + +**Check run status:** + +```bash +curl -X GET "https://api.vapi.ai/simulation/run/run-123" \ + -H "Authorization: Bearer $VAPI_API_KEY" +``` + + + + + Running a suite will execute actual voice calls to your assistant. Ensure your assistant is properly configured before running tests. + + +## Step 6: Review results + +Analyze the results of your simulation runs to understand how your assistant performed. 
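+
+If you're scripting against the API, a short polling loop can wait for a run to finish and then pull its summary. Here's a minimal sketch using `curl` and `jq`, built on the run endpoints from Step 5 (the 10-second interval is an arbitrary choice):
+
+```bash
+RUN_ID="run-123" # returned when you started the suite run
+
+# Poll until the run completes.
+while true; do
+  STATUS=$(curl -s "https://api.vapi.ai/simulation/run/$RUN_ID" \
+    -H "Authorization: Bearer $VAPI_API_KEY" | jq -r '.status')
+  if [ "$STATUS" = "completed" ]; then break; fi
+  sleep 10
+done
+
+# Print the pass/fail summary.
+curl -s "https://api.vapi.ai/simulation/run/$RUN_ID" \
+  -H "Authorization: Bearer $VAPI_API_KEY" | jq '.summary'
+```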
+ +### Successful run + +When all simulations pass, you'll see: + +```json +{ + "id": "run-123", + "suiteId": "suite-xyz", + "status": "completed", + "results": [ + { + "simulationId": "simulation-abc", + "status": "pass", + "successCriteria": [ + { + "criterion": "Appointment is confirmed with a specific date and time", + "passed": true + }, + { + "criterion": "Confirmation number is provided", + "passed": true + } + ], + "duration": "45s" + } + ], + "summary": { + "total": 3, + "passed": 3, + "failed": 0 + } +} +``` + +**Pass criteria:** + +- `status` is "completed" +- `results[].status` is "pass" for all simulations +- All `successCriteria` items show `passed: true` + +### Failed run + +When validation fails, you'll see details about what went wrong: + +```json +{ + "id": "run-124", + "suiteId": "suite-xyz", + "status": "completed", + "results": [ + { + "simulationId": "simulation-abc", + "status": "fail", + "successCriteria": [ + { + "criterion": "Appointment is confirmed with a specific date and time", + "passed": true + }, + { + "criterion": "Confirmation number is provided", + "passed": false, + "reason": "No confirmation number was mentioned in the conversation" + } + ], + "duration": "52s" + } + ], + "summary": { + "total": 3, + "passed": 2, + "failed": 1 + } +} +``` + +**Failure indicators:** + +- `results[].status` is "fail" +- `successCriteria[].passed` is `false` with a `reason` explaining the failure + + + + + + 1. Navigate to the **Runs** tab + 2. Click on a completed run to see details + 3. View the summary showing pass/fail counts + + + + 1. Click on any failed simulation + 2. Review the **Timeline** to see the conversation flow + 3. Check which success criteria failed and why + 4. Click **Listen to Recording** to hear the full call + + + + 1. Go to the main **Simulations** page + 2. Filter by **Suites** to see historical runs + 3. Monitor pass rates and identify trends + 4. Compare performance across different suite versions + + + + + +**List all runs:** + +```bash +curl -X GET "https://api.vapi.ai/simulation/run" \ + -H "Authorization: Bearer $VAPI_API_KEY" +``` + +**Get detailed results for a specific run:** + +```bash +curl -X GET "https://api.vapi.ai/simulation/run/run-123" \ + -H "Authorization: Bearer $VAPI_API_KEY" +``` + +**Filter runs by suite:** + +```bash +curl -X GET "https://api.vapi.ai/simulation/run?suiteId=suite-xyz" \ + -H "Authorization: Bearer $VAPI_API_KEY" +``` + + + + + Full conversation recordings are available for all simulation runs, making it easy to understand exactly what happened during each test. 
+ + +## Troubleshooting + +| Issue | Solution | +| --- | --- | +| Simulation always fails | Check that success criteria are achievable with your assistant's current capabilities | +| Run stuck in "running" | Verify your assistant is properly configured and responding to calls | +| Personality not applied | Ensure the personality ID is correctly linked to the simulation | +| Success criteria unclear | Make criteria specific and measurable (e.g., "mentions confirmation number" vs "completes task") | +| No audio in recording | Check that your assistant has voice configuration enabled | +| Suite won't start | Verify all simulations in the suite are valid and have targets assigned | + +### Common errors + +**"assistant-error" status:** + +- Check your assistant configuration (model, voice, tools) +- Verify API keys are valid +- Test the assistant manually before running simulations + +**Success criteria failures:** + +- Review the conversation recording to understand what happened +- Adjust criteria to be more specific or more flexible as needed +- Consider whether the personality is making the test unrealistically difficult + + + If simulations consistently fail, test your assistant manually first to ensure it's working correctly before debugging the simulation configuration. + + +## Next steps + + + + Create and configure assistants to test + + + + Build multi-agent squads and test handoffs + + + + Learn about chat-based testing with mock conversations + + + + Improve your assistant's responses with better prompts + + + +## Tips for success + + + **Best practices for effective simulation testing:** + + - **Start simple** - Begin with straightforward scenarios before testing edge cases + - **Use realistic personalities** - Model your test callers after actual customer types + - **Define clear success criteria** - Specific, measurable criteria lead to reliable tests + - **Group related tests** - Organize suites by feature or user flow + - **Monitor trends** - Track pass rates over time to catch regressions early + - **Test after changes** - Run your simulation suites after updating prompts or tools + - **Listen to recordings** - Audio recordings reveal issues that metrics alone miss + - **Iterate on failures** - Use failed tests to improve both your assistant and test design + + +## Get help + +Need assistance? 
We're here to help: + +- [Discord Community](https://discord.gg/pUFNcf2WmH) +- [Support](mailto:support@vapi.ai) From 2a4735454de51aa510ed589b4f56b26bd2adefda Mon Sep 17 00:00:00 2001 From: Noah Raynor Date: Tue, 3 Feb 2026 15:51:27 -0800 Subject: [PATCH 02/10] fixed simulations description to match v2 and added advanced --- fern/docs.yml | 3 + fern/observability/simulations-advanced.mdx | 846 ++++++++++++++++++ fern/observability/simulations-quickstart.mdx | 625 ++++++++----- 3 files changed, 1261 insertions(+), 213 deletions(-) create mode 100644 fern/observability/simulations-advanced.mdx diff --git a/fern/docs.yml b/fern/docs.yml index 3c28388e5..3e00822db 100644 --- a/fern/docs.yml +++ b/fern/docs.yml @@ -295,6 +295,9 @@ navigation: - page: Quickstart path: observability/simulations-quickstart.mdx icon: fa-light fa-rocket + - page: Advanced + path: observability/simulations-advanced.mdx + icon: fa-light fa-flask-vial - page: Boards path: observability/boards-quickstart.mdx icon: fa-light fa-chart-line diff --git a/fern/observability/simulations-advanced.mdx b/fern/observability/simulations-advanced.mdx new file mode 100644 index 000000000..ac178ad75 --- /dev/null +++ b/fern/observability/simulations-advanced.mdx @@ -0,0 +1,846 @@ +--- +title: Advanced simulation testing +subtitle: Master testing strategies and best practices for AI voice agent simulations +slug: observability/simulations-advanced +--- + +## Overview + +This guide covers advanced simulation strategies, testing patterns, and best practices for building robust test suites that ensure your AI voice agents work reliably in production. + +**You'll learn:** + +- Advanced scenario configuration (tool mocks, hooks) +- Strategic testing approaches (smoke, regression, edge cases) +- Performance optimization techniques +- CI/CD integration strategies +- Maintenance and troubleshooting methods + +## Advanced scenario configuration + +### Tool mocks + +Mock tool call responses at the scenario level to test specific paths without calling real APIs. This is useful for: + +- Testing error handling paths +- Simulating unavailable services +- Deterministic test results +- Faster test execution (no real API calls) + + + + + + 1. Go to **Simulations** → **Scenarios** + 2. Open the scenario you want to configure + + + + 1. Scroll to **Tool Mocks** section + 2. Click **Add Tool Mock** + 3. **Tool Name**: Enter the exact function name (e.g., `bookAppointment`) + 4. **Result**: Enter the JSON response to return: + ```json + {"status": "success", "confirmationId": "MOCK-12345"} + ``` + 5. **Enabled**: Toggle on/off to control when mock is active + 6. 
Click **Save** + + + + + +```bash +curl -X POST "https://api.vapi.ai/eval/simulation/scenario" \ + -H "Authorization: Bearer $VAPI_API_KEY" \ + -H "Content-Type: application/json" \ + -d '{ + "name": "Book Appointment - API Error Path", + "instructions": "Try to book an appointment and handle the error gracefully when the system is unavailable.", + "evaluations": [ + { + "structuredOutput": { + "name": "handled_error_gracefully", + "schema": { + "type": "boolean", + "description": "Whether the assistant apologized and offered alternatives" + } + }, + "comparator": "=", + "value": true + } + ], + "toolMocks": [ + { + "toolName": "bookAppointment", + "result": "{\"error\": \"Service temporarily unavailable\", \"code\": \"503\"}", + "enabled": true + } + ] + }' +``` + + + +**Common tool mock patterns:** + + + + ```json + { + "toolName": "bookAppointment", + "result": "{\"status\": \"success\", \"confirmationId\": \"APT-12345\", \"datetime\": \"2024-01-20T14:00:00Z\"}", + "enabled": true + } + ``` + + + + ```json + { + "toolName": "bookAppointment", + "result": "{\"error\": \"Time slot no longer available\", \"availableSlots\": [\"14:30\", \"15:00\", \"15:30\"]}", + "enabled": true + } + ``` + + + + ```json + { + "toolName": "checkInventory", + "result": "{\"error\": \"Request timeout\", \"code\": \"ETIMEDOUT\"}", + "enabled": true + } + ``` + + + + ```json + { + "toolName": "processOrder", + "result": "{\"status\": \"partial\", \"itemsProcessed\": 2, \"itemsFailed\": 1, \"failedReason\": \"Item out of stock\"}", + "enabled": true + } + ``` + + + + + **Tool mock tips:** + - Mock tool names must exactly match the function name configured in your assistant's tools + - Use realistic error responses that match your actual API error formats + - Create separate scenarios for success paths and error paths + - Disable mocks (`enabled: false`) to test against real APIs + + +### Simulation hooks + +Trigger actions on simulation lifecycle events. Hooks are useful for: + +- Notifying external systems when tests start/end +- Logging test execution to your own systems +- Triggering follow-up workflows +- Custom analytics and reporting + + + **Hooks are only supported in voice mode.** Hooks require `vapi.websocket` transport and will not trigger with `vapi.webchat` (chat mode). + + + + + + + 1. Go to **Simulations** → **Scenarios** + 2. Open your scenario + 3. Scroll to **Hooks** section + 4. Click **Add Hook** + + + + 1. **Event**: Select when to trigger: + - `simulation.run.started` - When simulation run begins + - `simulation.run.ended` - When simulation run ends + 2. **Action Type**: Select `webhook` + 3. **Server URL**: Enter your webhook endpoint + 4. 
Click **Save** + + + + + +```bash +curl -X POST "https://api.vapi.ai/eval/simulation/scenario" \ + -H "Authorization: Bearer $VAPI_API_KEY" \ + -H "Content-Type: application/json" \ + -d '{ + "name": "Test with Lifecycle Hooks", + "instructions": "Complete the booking flow as a standard customer.", + "evaluations": [ + { + "structuredOutput": { + "name": "booking_completed", + "schema": { "type": "boolean" } + }, + "comparator": "=", + "value": true + } + ], + "hooks": [ + { + "on": "simulation.run.started", + "do": [ + { + "type": "webhook", + "server": { + "url": "https://your-server.com/webhooks/simulation-started" + } + } + ] + }, + { + "on": "simulation.run.ended", + "do": [ + { + "type": "webhook", + "server": { + "url": "https://your-server.com/webhooks/simulation-ended" + }, + "include": { + "transcript": true, + "messages": true, + "recordingUrl": true + } + } + ] + } + ] + }' +``` + + + +**Webhook payload examples:** + +```json +// simulation.run.started webhook payload +{ + "event": "simulation.run.started", + "simulationId": "550e8400-e29b-41d4-a716-446655440003", + "runId": "550e8400-e29b-41d4-a716-446655440007", + "timestamp": "2024-01-15T09:50:05Z" +} + +// simulation.run.ended webhook payload +{ + "event": "simulation.run.ended", + "simulationId": "550e8400-e29b-41d4-a716-446655440003", + "runId": "550e8400-e29b-41d4-a716-446655440007", + "timestamp": "2024-01-15T09:52:30Z", + "duration": 145, + "status": "passed", + "transcript": "...", // if include.transcript = true + "messages": [...], // if include.messages = true + "recordingUrl": "https://..." // if include.recordingUrl = true +} +``` + +### Using existing structured outputs + +Instead of defining inline structured outputs in each scenario, you can reference structured outputs you've already created. This provides: + +- Reusability across multiple scenarios +- Centralized management of evaluation criteria +- Consistency in how data is extracted + + + + 1. Go to **Structured Outputs** in the sidebar + 2. Create a new structured output or find an existing one + 3. Copy the **ID** + 4. In your scenario, select **Use Existing** when adding an evaluation + 5. Paste the structured output ID + + + +```bash +# First, create a reusable structured output +curl -X POST "https://api.vapi.ai/structured-output" \ + -H "Authorization: Bearer $VAPI_API_KEY" \ + -H "Content-Type: application/json" \ + -d '{ + "name": "appointment_booked", + "schema": { + "type": "boolean", + "description": "Whether an appointment was successfully booked during the call" + } + }' + +# Response includes the ID +# { "id": "so-abc123", ... } + +# Then reference it in your scenario +curl -X POST "https://api.vapi.ai/eval/simulation/scenario" \ + -H "Authorization: Bearer $VAPI_API_KEY" \ + -H "Content-Type: application/json" \ + -d '{ + "name": "Book Appointment", + "instructions": "Call to book an appointment for next Monday.", + "evaluations": [ + { + "structuredOutputId": "so-abc123", + "comparator": "=", + "value": true + } + ] + }' +``` + + + + + **When to use existing vs inline:** + - **Existing (by ID)**: When the same evaluation criteria is used across multiple scenarios + - **Inline**: For scenario-specific evaluations that won't be reused + + +## Testing strategies + +### Smoke tests + +Quick validation that core functionality works. Run these first to catch obvious issues. + +**Purpose:** Verify your assistant responds and basic conversation flow works before running comprehensive tests. 
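+
+Because smoke tests run often, keep them cheap: wrap a scenario like the one below in a simulation and trigger it in chat mode. Here's a sketch using the run endpoint from the quickstart (`SMOKE_SIM_ID` and `ASSISTANT_ID` are placeholders for your own IDs):
+
+```bash
+# Quick health check: run a single smoke simulation in chat mode (no audio cost).
+curl -X POST "https://api.vapi.ai/eval/simulation/run" \
+  -H "Authorization: Bearer $VAPI_API_KEY" \
+  -H "Content-Type: application/json" \
+  -d '{
+    "simulations": [{"type": "simulation", "simulationId": "'"$SMOKE_SIM_ID"'"}],
+    "target": {"type": "assistant", "assistantId": "'"$ASSISTANT_ID"'"},
+    "transport": {"provider": "vapi.webchat"}
+  }'
+```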
+ +```json +{ + "name": "Smoke Test - Basic Response", + "instructions": "Say hello and ask if the assistant can hear you.", + "evaluations": [ + { + "structuredOutput": { + "name": "assistant_responded", + "schema": { + "type": "boolean", + "description": "Whether the assistant provided any response" + } + }, + "comparator": "=", + "value": true + } + ] +} +``` + +**Characteristics:** +- Minimal evaluation criteria (just check for any response) +- Fast execution (simple instructions) +- Run before detailed tests +- Use chat mode for speed + +**When to use:** +- Before running expensive voice test suites +- After deploying configuration changes +- As health checks in monitoring +- Quick validation during development + +### Regression tests + +Ensure fixes and updates don't break existing functionality. + +**Purpose:** Validate that known issues stay fixed and features keep working. + + + + 1. Name scenarios with "Regression: " prefix + 2. Include issue ticket number in the name + 3. Add the exact scenario that previously failed + 4. Document what was fixed + + Example: + - Name: "Regression: Appointment Parsing Bug #1234" + - Instructions: Scenario that triggered the bug + + + +```bash +curl -X POST "https://api.vapi.ai/eval/simulation/scenario" \ + -H "Authorization: Bearer $VAPI_API_KEY" \ + -H "Content-Type: application/json" \ + -d '{ + "name": "Regression: Date Parsing Bug #1234", + "instructions": "Request an appointment for 3/15. The assistant should correctly parse this as March 15th, not fail or misinterpret the date.", + "evaluations": [ + { + "structuredOutput": { + "name": "date_parsed_correctly", + "schema": { + "type": "boolean", + "description": "Whether the date 3/15 was correctly understood as March 15th" + } + }, + "comparator": "=", + "value": true + } + ] + }' +``` + + + +**Best practices:** +- Name tests after bugs they prevent +- Include ticket/issue numbers +- Add regression tests when fixing bugs +- Run full regression suite before major releases + +### Edge case testing + +Test boundary conditions and unusual inputs your assistant might encounter. + +**Common edge cases to test:** + + + + ```json + { + "name": "Edge Case - Ambiguous Request", + "instructions": "Make a vague, unclear request like 'I need something done' without specifying what you want.", + "evaluations": [ + { + "structuredOutput": { + "name": "asked_for_clarification", + "schema": { + "type": "boolean", + "description": "Whether the assistant asked for more details" + } + }, + "comparator": "=", + "value": true + } + ] + } + ``` + + + + ```json + { + "name": "Edge Case - Topic Switch", + "instructions": "Start asking about booking an appointment, then suddenly switch to asking about cancellation policies mid-conversation.", + "evaluations": [ + { + "structuredOutput": { + "name": "handled_topic_switch", + "schema": { + "type": "boolean", + "description": "Whether the assistant smoothly transitioned to the new topic" + } + }, + "comparator": "=", + "value": true + } + ] + } + ``` + + + + ```json + { + "name": "Edge Case - Interruption Handling", + "instructions": "Interrupt the assistant mid-sentence with a new question. 
See if it handles the interruption gracefully.", + "evaluations": [ + { + "structuredOutput": { + "name": "handled_interruption", + "schema": { + "type": "boolean", + "description": "Whether the assistant stopped and addressed the interruption" + } + }, + "comparator": "=", + "value": true + } + ] + } + ``` + + This edge case requires voice mode (`vapi.websocket`) to test actual audio interruptions. + + + + ```json + { + "name": "Edge Case - Invalid Date", + "instructions": "Try to book an appointment for 'the 45th of Octember' - an obviously invalid date.", + "evaluations": [ + { + "structuredOutput": { + "name": "handled_invalid_date", + "schema": { + "type": "boolean", + "description": "Whether the assistant politely asked for a valid date" + } + }, + "comparator": "=", + "value": true + } + ] + } + ``` + + + +**Edge case categories to cover:** +- **Input boundaries:** Empty, maximum length, special characters +- **Data formats:** Invalid dates, malformed phone numbers, unusual names +- **Conversation patterns:** Interruptions, topic changes, contradictions +- **Emotional scenarios:** Frustrated caller, confused caller, impatient caller + +## Best practices + +### Evaluation design principles + + + + Each evaluation should test one specific outcome. + + ✅ **Good:** "Was the appointment booked?" + + ❌ **Bad:** "Was the appointment booked, confirmed, and email sent?" + + + + Use descriptive names that explain what's being tested. + + ✅ **Good:** "Booking - Handles Unavailable Slot" + + ❌ **Bad:** "Test 1" or "Scenario ABC" + + + + Model test personalities after actual customer types. + + Consider: decisive, confused, impatient, detail-oriented, non-native speakers + + + + Use boolean or numeric structured outputs that produce clear pass/fail results. + + Avoid subjective criteria that are hard to evaluate consistently. + + + +### Choosing voice vs chat mode + +| Scenario | Recommended Mode | Reason | +| --- | --- | --- | +| Rapid iteration during development | Chat (`vapi.webchat`) | Faster, cheaper | +| Testing speech recognition accuracy | Voice (`vapi.websocket`) | Tests actual STT | +| Testing voice/TTS quality | Voice (`vapi.websocket`) | Tests actual TTS | +| Testing interruption handling | Voice (`vapi.websocket`) | Requires audio | +| CI/CD pipeline tests | Chat (`vapi.webchat`) | Speed and cost | +| Pre-production validation | Voice (`vapi.websocket`) | Full end-to-end | +| Testing hooks/webhooks | Voice (`vapi.websocket`) | Hooks require voice | + +### Performance optimization + +**Minimize test execution time:** + +1. **Use chat mode for initial development:** + - `vapi.webchat` runs faster than voice + - Switch to voice for final validation + +2. **Keep instructions focused:** + - Clear, specific instructions complete faster + - Avoid overly complex multi-step scenarios + +3. **Batch related tests:** + - Group similar simulations in suites + - Run suites instead of individual simulations + +4. **Use iterations strategically:** + - `iterations: 1` for deterministic scenarios + - Higher iterations for testing consistency + +**Cost optimization:** +- Chat mode costs less (no STT/TTS) +- Simple personalities (smaller models) cost less +- Shorter conversations cost less + +## CI/CD integration + +Automate simulation runs in your deployment pipeline. 
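+
+All of the patterns in this section share one core loop: create a run, poll until its `status` is `ended`, then gate on `itemCounts.failed`. The basic workflow below inlines that loop with `curl` and `jq`; the advanced patterns call it through a `run-simulation-suite.sh` helper, which is a script you maintain yourself rather than part of the Vapi API. A minimal sketch of such a helper (flag names are illustrative):
+
+```bash
+#!/usr/bin/env bash
+# run-simulation-suite.sh: create a run, wait for it to end, fail on any failed item.
+# Extend with flags like --iterations as needed.
+set -euo pipefail
+
+TRANSPORT="vapi.webchat"
+while [ $# -gt 0 ]; do
+  case "$1" in
+    --suite-id)         SUITE_ID="$2"; shift 2 ;;
+    --target-assistant) ASSISTANT_ID="$2"; shift 2 ;;
+    --transport)        TRANSPORT="$2"; shift 2 ;;
+    *) echo "Unknown flag: $1" >&2; exit 2 ;;
+  esac
+done
+
+# Create the run for the whole suite.
+RUN_ID=$(curl -s -X POST "https://api.vapi.ai/eval/simulation/run" \
+  -H "Authorization: Bearer $VAPI_API_KEY" \
+  -H "Content-Type: application/json" \
+  -d "{
+    \"simulations\": [{\"type\": \"simulationSuite\", \"simulationSuiteId\": \"$SUITE_ID\"}],
+    \"target\": {\"type\": \"assistant\", \"assistantId\": \"$ASSISTANT_ID\"},
+    \"transport\": {\"provider\": \"$TRANSPORT\"}
+  }" | jq -r '.id')
+
+# Poll until the run ends.
+while true; do
+  STATUS=$(curl -s "https://api.vapi.ai/eval/simulation/run/$RUN_ID" \
+    -H "Authorization: Bearer $VAPI_API_KEY" | jq -r '.status')
+  if [ "$STATUS" = "ended" ]; then break; fi
+  sleep 10
+done
+
+# Gate on failures.
+FAILED=$(curl -s "https://api.vapi.ai/eval/simulation/run/$RUN_ID" \
+  -H "Authorization: Bearer $VAPI_API_KEY" | jq '.itemCounts.failed')
+if [ "$FAILED" -gt 0 ]; then
+  echo "Simulations failed: $FAILED" >&2
+  exit 1
+fi
+echo "All simulations passed."
+```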
+ +### Basic workflow + +```yaml +# .github/workflows/test-assistant.yml +name: Test Assistant Changes + +on: + pull_request: + paths: + - 'assistants/**' + - 'prompts/**' + +jobs: + run-simulations: + runs-on: ubuntu-latest + steps: + - name: Run smoke tests (chat mode) + run: | + # Create a simulation run + RUN_ID=$(curl -s -X POST "https://api.vapi.ai/eval/simulation/run" \ + -H "Authorization: Bearer ${{ secrets.VAPI_API_KEY }}" \ + -H "Content-Type: application/json" \ + -d '{ + "simulations": [{"type": "simulationSuite", "simulationSuiteId": "${{ vars.SMOKE_TEST_SUITE_ID }}"}], + "target": {"type": "assistant", "assistantId": "${{ vars.STAGING_ASSISTANT_ID }}"}, + "transport": {"provider": "vapi.webchat"} + }' | jq -r '.id') + + echo "Run ID: $RUN_ID" + + # Poll for completion + while true; do + STATUS=$(curl -s "https://api.vapi.ai/eval/simulation/run/$RUN_ID" \ + -H "Authorization: Bearer ${{ secrets.VAPI_API_KEY }}" | jq -r '.status') + + if [ "$STATUS" = "ended" ]; then + break + fi + + sleep 10 + done + + # Check results + RESULT=$(curl -s "https://api.vapi.ai/eval/simulation/run/$RUN_ID" \ + -H "Authorization: Bearer ${{ secrets.VAPI_API_KEY }}") + + PASSED=$(echo $RESULT | jq '.itemCounts.passed') + FAILED=$(echo $RESULT | jq '.itemCounts.failed') + + if [ "$FAILED" -gt 0 ]; then + echo "Simulations failed: $FAILED" + exit 1 + fi + + echo "All simulations passed: $PASSED" +``` + +### Advanced patterns + + + + Run full simulation suite against staging before promoting to production: + + ```bash + # Run comprehensive tests against staging + ./scripts/run-simulation-suite.sh \ + --suite-id "$REGRESSION_SUITE_ID" \ + --target-assistant "$STAGING_ASSISTANT_ID" \ + --transport "vapi.websocket" \ + --iterations 3 + + # Only deploy to production if all pass + if [ $? -eq 0 ]; then + ./scripts/deploy-to-production.sh + fi + ``` + + + + Run full regression suite nightly: + + ```yaml + # .github/workflows/nightly-regression.yml + on: + schedule: + - cron: '0 2 * * *' # 2 AM daily + + jobs: + regression-suite: + runs-on: ubuntu-latest + steps: + - name: Run full regression (voice mode) + run: ./scripts/run-simulation-suite.sh --full-regression + + - name: Notify on failures + if: failure() + run: | + # Send Slack notification + curl -X POST $SLACK_WEBHOOK_URL \ + -d '{"text": "Nightly simulation regression failed!"}' + ``` + + + + Block deployment if pass rate falls below threshold: + + ```bash + RESULT=$(curl -s "https://api.vapi.ai/eval/simulation/run/$RUN_ID" \ + -H "Authorization: Bearer $VAPI_API_KEY") + + TOTAL=$(echo $RESULT | jq '.itemCounts.total') + PASSED=$(echo $RESULT | jq '.itemCounts.passed') + + PASS_RATE=$((PASSED * 100 / TOTAL)) + + if [ $PASS_RATE -lt 95 ]; then + echo "Pass rate $PASS_RATE% below threshold 95%" + exit 1 + fi + ``` + + + +## Maintenance strategies + +### Regular review cycle + + + + Investigate all failures. Update tests if requirements changed, or fix assistant if behavior regressed. + + + + Review simulation suite completeness: + - All critical user flows covered? + - New features have tests? + - Deprecated features removed? 
+ + + + - Remove duplicate simulations + - Update outdated scenarios + - Optimize personalities for cost + - Document test rationale + + + +### When to update simulations + +| Trigger | Action | +| --- | --- | +| Assistant prompt changes | Review affected simulations | +| New feature added | Create simulations for new feature | +| Bug fixed | Add regression test | +| User feedback reveals edge case | Add edge case simulation | +| Business requirements change | Update evaluation criteria | + +## Troubleshooting + +### Common issues + +| Issue | Cause | Solution | +| --- | --- | --- | +| Simulation always fails | Evaluation criteria too strict | Review structured output schema and expected values | +| Run stuck in "running" | Assistant not responding | Check assistant configuration, verify credentials | +| Inconsistent results | Non-deterministic behavior | Increase iterations, use more specific instructions | +| No audio in recording | Using chat mode | Switch to `vapi.websocket` transport | +| Hooks not triggering | Using chat mode | Hooks require `vapi.websocket` transport | +| Tool mocks not working | Wrong tool name | Verify tool name matches exactly | + +### Debugging tips + + + + ```bash + curl "https://api.vapi.ai/eval/simulation/run/$RUN_ID" \ + -H "Authorization: Bearer $VAPI_API_KEY" | jq '.status, .endedReason' + ``` + + + + ```bash + curl "https://api.vapi.ai/eval/simulation/run/$RUN_ID/item" \ + -H "Authorization: Bearer $VAPI_API_KEY" | jq '.[].status' + ``` + + + + In the Dashboard, click on a failed run item to see the full conversation transcript and evaluation results. + + + + If simulations consistently fail, test your assistant manually in the Dashboard to verify it's working correctly. + + + +### Getting help + +**Include these details when reporting issues:** +- Simulation run ID +- Scenario and personality IDs +- Transport mode used (voice/chat) +- Expected vs actual behavior +- Assistant configuration + +**Resources:** +- [Simulations Quickstart](/observability/simulations-quickstart) +- [Discord Community](https://discord.gg/pUFNcf2WmH) +- [Support](mailto:support@vapi.ai) + +## Next steps + + + + Return to quickstart guide for basic setup + + + + Learn about chat-based testing with mock conversations + + + + Learn how to define structured outputs for evaluations + + + + Create and configure assistants to test + + + +## Summary + + + **Key takeaways for advanced simulation testing:** + + **Configuration:** + - Use tool mocks to test error paths without real API calls + - Use hooks for external notifications (voice mode only) + - Reference existing structured outputs for consistency + + **Testing strategy:** + - Start with smoke tests, then regression, then edge cases + - Use chat mode for speed, voice mode for final validation + - Create personalities based on real customer types + + **CI/CD:** + - Automate smoke tests in PR pipelines + - Run full regression before production deploys + - Set quality gate thresholds + + **Maintenance:** + - Review failures weekly + - Audit coverage monthly + - Add regression tests when fixing bugs + diff --git a/fern/observability/simulations-quickstart.mdx b/fern/observability/simulations-quickstart.mdx index c58b5b3c7..38c6d98f8 100644 --- a/fern/observability/simulations-quickstart.mdx +++ b/fern/observability/simulations-quickstart.mdx @@ -6,17 +6,17 @@ slug: observability/simulations-quickstart ## Overview -This quickstart guide will help you test your AI assistants and squads using realistic, AI-powered callers. 
In just a few minutes, you'll create test scenarios, define success criteria, and validate your agents work correctly under different conditions. +This quickstart guide will help you test your AI assistants and squads using realistic, AI-powered callers. In just a few minutes, you'll create test scenarios, define evaluation criteria, and validate your agents work correctly under different conditions. ### What are Simulations? -Simulations is Vapi's voice agent testing framework that enables you to systematically test assistants and squads using AI-powered callers that follow defined goals and evaluate outcomes. Instead of relying on manual testing or rigid scripts, Simulations recreate real conversations and measure whether your assistant behaves correctly. Test your agents by: +Simulations is Vapi's voice agent testing framework that enables you to systematically test assistants and squads using AI-powered callers that follow defined instructions and evaluate outcomes using structured outputs. Instead of relying on manual testing or rigid scripts, Simulations recreate real conversations and measure whether your assistant behaves correctly. Test your agents by: -1. **Creating personalities** - Define how the AI caller behaves (e.g., decisive, indecisive, impatient) -2. **Defining scenarios** - Specify the caller's goal, constraints, and success criteria -3. **Running simulations** - Pair scenarios with personalities to test your assistant -4. **Monitoring results** - Watch tests in real time and review pass/fail outcomes -5. **Tracking performance** - Analyze historical results to identify trends +1. **Creating personalities** - Define a full assistant configuration for the AI tester (voice, model, system prompt) +2. **Defining scenarios** - Specify instructions for the tester and evaluations using structured outputs +3. **Creating simulations** - Pair scenarios with personalities +4. **Running simulations** - Execute tests against your assistant or squad in voice or chat mode +5. **Reviewing results** - Analyze pass/fail outcomes based on structured output evaluations ### When are Simulations useful? @@ -29,14 +29,39 @@ Simulations help you maintain quality and catch issues early: - **Squad handoff testing** - Ensure smooth transitions between squad members - **Performance monitoring** - Track success rates over time and identify regressions +### Voice vs Chat mode + +Simulations support two transport modes: + + + + **`vapi.websocket`** - Full voice simulation with audio + + - Realistic end-to-end testing + - Tests speech recognition and synthesis + - Produces call recordings + + + **`vapi.webchat`** - Text-based chat simulation + + - Faster execution + - Lower cost (no audio processing) + - Ideal for rapid iteration + + + + + Use **chat mode** during development for quick iteration, then switch to **voice mode** for final validation before deployment. + + ### What you'll build A simulation suite for an appointment booking assistant that tests: -- Different caller personalities (decisive vs. indecisive) -- Goal completion and success criteria validation -- Real-time monitoring of test calls -- Historical performance tracking +- Different caller personalities (confused user, impatient customer) +- Evaluation criteria using structured outputs with comparators +- Real-time monitoring of test runs +- Both voice and chat mode execution ## Prerequisites @@ -54,9 +79,9 @@ A simulation suite for an appointment booking assistant that tests: the Dashboard or use the API. 
-## Step 1: Create a personality (optional) +## Step 1: Create a personality -Personalities define how the AI caller behaves during a test call. You can use built-in default personalities or create custom ones. +Personalities define how the AI tester behaves during a simulation. A personality is a full assistant configuration that controls the tester's voice, model, and behavior via system prompt. @@ -70,12 +95,16 @@ Personalities define how the AI caller behaves during a test call. You can use b 1. Click **Create Personality** 2. **Name**: Enter "Impatient Customer" - 3. **Description**: Add "A busy customer who wants quick answers and may interrupt" - 4. **Behavior**: Define the personality traits: - - Speaks quickly and directly - - May interrupt if responses are too long - - Expects immediate solutions - 5. Click **Save** + 3. **Assistant Configuration**: Configure the tester assistant: + - **Model**: Select your preferred LLM (e.g., GPT-4o) + - **System Prompt**: Define the personality behavior: + ``` + You are an impatient customer who wants quick answers. + Speak directly and may interrupt if responses are too long. + You expect immediate solutions to your problems. + ``` + - **Voice**: Select a voice for the tester (optional for chat mode) + 4. Click **Save** @@ -86,13 +115,27 @@ Personalities define how the AI caller behaves during a test call. You can use b ```bash -curl -X POST "https://api.vapi.ai/simulation/personality" \ +curl -X POST "https://api.vapi.ai/eval/simulation/personality" \ -H "Authorization: Bearer $VAPI_API_KEY" \ -H "Content-Type: application/json" \ -d '{ "name": "Impatient Customer", - "description": "A busy customer who wants quick answers and may interrupt", - "behavior": "Speaks quickly and directly. May interrupt if responses are too long. Expects immediate solutions." + "assistant": { + "model": { + "provider": "openai", + "model": "gpt-4o", + "messages": [ + { + "role": "system", + "content": "You are an impatient customer who wants quick answers. Speak directly and may interrupt if responses are too long. You expect immediate solutions to your problems." + } + ] + }, + "voice": { + "provider": "cartesia", + "voiceId": "sonic-english" + } + } }' ``` @@ -100,11 +143,20 @@ curl -X POST "https://api.vapi.ai/simulation/personality" \ ```json { - "id": "personality-123", + "id": "550e8400-e29b-41d4-a716-446655440001", "orgId": "org-456", "name": "Impatient Customer", - "description": "A busy customer who wants quick answers and may interrupt", - "behavior": "Speaks quickly and directly. May interrupt if responses are too long. Expects immediate solutions.", + "assistant": { + "model": { + "provider": "openai", + "model": "gpt-4o", + "messages": [...] + }, + "voice": { + "provider": "cartesia", + "voiceId": "sonic-english" + } + }, "createdAt": "2024-01-15T09:30:00Z", "updatedAt": "2024-01-15T09:30:00Z" } @@ -115,12 +167,14 @@ Save the returned `id` - you'll need it when creating simulations. - **Personality types:** Consider creating personalities for different customer types you encounter: decisive buyers, hesitant customers, detail-oriented users, or frustrated callers. + **Personality types:** Consider creating personalities for different customer types you encounter: decisive buyers, confused users, detail-oriented customers, or frustrated callers. ## Step 2: Create a scenario -Scenarios define what the test call is trying to accomplish, including the goal and success criteria. +Scenarios define what the test is evaluating. 
A scenario contains: +- **Instructions**: What the tester should do during the call +- **Evaluations**: Structured outputs with expected values to validate outcomes @@ -132,40 +186,67 @@ Scenarios define what the test call is trying to accomplish, including the goal 1. **Name**: Enter "Book Appointment" - 2. **Description**: Add "Test that the assistant can successfully book an appointment" - 3. **Goal**: Define what the caller is trying to accomplish: - - "Schedule an appointment for next Monday at 2pm" - 4. **Constraints** (optional): Add any limitations: - - "Only available on weekdays" - - "Preferred morning appointments" + 2. **Instructions**: Define what the tester should do: + ``` + You are calling to book an appointment for next Monday at 2pm. + Confirm your identity when asked and provide any required information. + End the call once you receive a confirmation number. + ``` - - 1. Click **Add Success Criterion** - 2. Define what must happen for the test to pass: - - "Appointment is confirmed with a specific date and time" - - "Confirmation number is provided" - 3. Click **Save Scenario** + + Evaluations use structured outputs to extract data from the conversation and compare against expected values. + + 1. Click **Add Evaluation** + 2. Create or select a structured output: + - **Name**: "appointment_booked" + - **Schema Type**: boolean + 3. Set the **Comparator**: `=` + 4. Set the **Expected Value**: `true` + 5. Mark as **Required**: Yes + 6. Add another evaluation for confirmation number: + - **Name**: "confirmation_provided" + - **Schema Type**: boolean + - **Comparator**: `=` + - **Expected Value**: `true` + 7. Click **Save Scenario** ```bash -curl -X POST "https://api.vapi.ai/simulation/scenario" \ +curl -X POST "https://api.vapi.ai/eval/simulation/scenario" \ -H "Authorization: Bearer $VAPI_API_KEY" \ -H "Content-Type: application/json" \ -d '{ "name": "Book Appointment", - "description": "Test that the assistant can successfully book an appointment", - "goal": "Schedule an appointment for next Monday at 2pm", - "constraints": [ - "Only available on weekdays", - "Preferred morning appointments" - ], - "successCriteria": [ - "Appointment is confirmed with a specific date and time", - "Confirmation number is provided" + "instructions": "You are calling to book an appointment for next Monday at 2pm. Confirm your identity when asked and provide any required information. 
End the call once you receive a confirmation number.", + "evaluations": [ + { + "structuredOutput": { + "name": "appointment_booked", + "schema": { + "type": "boolean", + "description": "Whether an appointment was successfully booked" + } + }, + "comparator": "=", + "value": true, + "required": true + }, + { + "structuredOutput": { + "name": "confirmation_provided", + "schema": { + "type": "boolean", + "description": "Whether a confirmation number was provided" + } + }, + "comparator": "=", + "value": true, + "required": true + } ] }' ``` @@ -174,18 +255,29 @@ curl -X POST "https://api.vapi.ai/simulation/scenario" \ ```json { - "id": "scenario-789", + "id": "550e8400-e29b-41d4-a716-446655440002", "orgId": "org-456", "name": "Book Appointment", - "description": "Test that the assistant can successfully book an appointment", - "goal": "Schedule an appointment for next Monday at 2pm", - "constraints": [ - "Only available on weekdays", - "Preferred morning appointments" - ], - "successCriteria": [ - "Appointment is confirmed with a specific date and time", - "Confirmation number is provided" + "instructions": "You are calling to book an appointment for next Monday at 2pm...", + "evaluations": [ + { + "structuredOutput": { + "name": "appointment_booked", + "schema": { "type": "boolean", "description": "..." } + }, + "comparator": "=", + "value": true, + "required": true + }, + { + "structuredOutput": { + "name": "confirmation_provided", + "schema": { "type": "boolean", "description": "..." } + }, + "comparator": "=", + "value": true, + "required": true + } ], "createdAt": "2024-01-15T09:35:00Z", "updatedAt": "2024-01-15T09:35:00Z" @@ -196,13 +288,40 @@ Save the returned `id` - you'll need it when creating simulations. +### Evaluation structure + +Each evaluation consists of: + +| Field | Description | +| --- | --- | +| `structuredOutputId` | Reference to an existing structured output (mutually exclusive with `structuredOutput`) | +| `structuredOutput` | Inline structured output definition (mutually exclusive with `structuredOutputId`) | +| `comparator` | Comparison operator: `=`, `!=`, `>`, `<`, `>=`, `<=` | +| `value` | Expected value (string, number, or boolean) | +| `required` | Whether this evaluation must pass for the simulation to pass (default: `true`) | + + + **Schema type restrictions:** Evaluations only support primitive schema types: `string`, `number`, `integer`, `boolean`. Objects and arrays are not supported. + + +### Comparator options + +| Comparator | Description | Supported Types | +| --- | --- | --- | +| `=` | Equals | string, number, integer, boolean | +| `!=` | Not equals | string, number, integer, boolean | +| `>` | Greater than | number, integer | +| `<` | Less than | number, integer | +| `>=` | Greater than or equal | number, integer | +| `<=` | Less than or equal | number, integer | + - **Success criteria tips:** Be specific about what constitutes success. Include both the action (appointment booked) and the verification (confirmation provided). + **Evaluation tips:** Use boolean structured outputs for pass/fail checks like "appointment_booked" or "issue_resolved". Use numeric outputs with comparators for metrics like "satisfaction_score >= 4". ## Step 3: Create a simulation -Simulations pair a scenario with a personality and select the assistant or squad you want to test. +Simulations pair a scenario with a personality. The target assistant or squad is specified when you run the simulation. 
@@ -213,29 +332,23 @@ Simulations pair a scenario with a personality and select the assistant or squad - 1. **Name**: Enter "Appointment Booking - Impatient Customer" + 1. **Name**: Enter "Appointment Booking - Impatient Customer" (optional) 2. **Scenario**: Select "Book Appointment" from the dropdown - 3. **Personality**: Select "Impatient Customer" (or use a default) - 4. **Target**: Choose **Assistant** or **Squad** - 5. Select your assistant/squad from the dropdown - 6. Click **Save Simulation** + 3. **Personality**: Select "Impatient Customer" from the dropdown + 4. Click **Save Simulation** ```bash -curl -X POST "https://api.vapi.ai/simulation" \ +curl -X POST "https://api.vapi.ai/eval/simulation" \ -H "Authorization: Bearer $VAPI_API_KEY" \ -H "Content-Type: application/json" \ -d '{ "name": "Appointment Booking - Impatient Customer", - "scenarioId": "scenario-789", - "personalityId": "personality-123", - "target": { - "type": "assistant", - "assistantId": "your-assistant-id" - } + "scenarioId": "550e8400-e29b-41d4-a716-446655440002", + "personalityId": "550e8400-e29b-41d4-a716-446655440001" }' ``` @@ -243,21 +356,17 @@ curl -X POST "https://api.vapi.ai/simulation" \ ```json { - "id": "simulation-abc", + "id": "550e8400-e29b-41d4-a716-446655440003", "orgId": "org-456", "name": "Appointment Booking - Impatient Customer", - "scenarioId": "scenario-789", - "personalityId": "personality-123", - "target": { - "type": "assistant", - "assistantId": "your-assistant-id" - }, + "scenarioId": "550e8400-e29b-41d4-a716-446655440002", + "personalityId": "550e8400-e29b-41d4-a716-446655440001", "createdAt": "2024-01-15T09:40:00Z", "updatedAt": "2024-01-15T09:40:00Z" } ``` -Save the returned `id` - you'll need it when creating simulation suites. +Save the returned `id` - you'll need it when running simulations. @@ -265,7 +374,7 @@ Save the returned `id` - you'll need it when creating simulation suites. **Multiple simulations:** Create several simulations with different personality and scenario combinations to thoroughly test your assistant across various conditions. -## Step 4: Create a simulation suite +## Step 4: Create a simulation suite (optional) Simulation suites group multiple simulations into a single batch that runs together. @@ -279,29 +388,27 @@ Simulation suites group multiple simulations into a single batch that runs toget 1. **Name**: Enter "Appointment Booking Regression Suite" - 2. **Description**: Add "Tests appointment booking across different customer types" - 3. Click **Add Simulations** - 4. Select the simulations you want to include: + 2. Click **Add Simulations** + 3. Select the simulations you want to include: - "Appointment Booking - Impatient Customer" + - "Appointment Booking - Confused User" - "Appointment Booking - Decisive Customer" - - "Appointment Booking - Indecisive Customer" - 5. Click **Save Suite** + 4. 
Click **Save Suite** ```bash -curl -X POST "https://api.vapi.ai/simulation/suite" \ +curl -X POST "https://api.vapi.ai/eval/simulation/suite" \ -H "Authorization: Bearer $VAPI_API_KEY" \ -H "Content-Type: application/json" \ -d '{ "name": "Appointment Booking Regression Suite", - "description": "Tests appointment booking across different customer types", "simulationIds": [ - "simulation-abc", - "simulation-def", - "simulation-ghi" + "550e8400-e29b-41d4-a716-446655440003", + "550e8400-e29b-41d4-a716-446655440004", + "550e8400-e29b-41d4-a716-446655440005" ] }' ``` @@ -310,14 +417,13 @@ curl -X POST "https://api.vapi.ai/simulation/suite" \ ```json { - "id": "suite-xyz", + "id": "550e8400-e29b-41d4-a716-446655440006", "orgId": "org-456", "name": "Appointment Booking Regression Suite", - "description": "Tests appointment booking across different customer types", "simulationIds": [ - "simulation-abc", - "simulation-def", - "simulation-ghi" + "550e8400-e29b-41d4-a716-446655440003", + "550e8400-e29b-41d4-a716-446655440004", + "550e8400-e29b-41d4-a716-446655440005" ], "createdAt": "2024-01-15T09:45:00Z", "updatedAt": "2024-01-15T09:45:00Z" @@ -332,74 +438,149 @@ Save the returned `id` - you'll need it to run the suite. **Suite organization:** Group related simulations together. For example, create separate suites for "Booking Tests", "Cancellation Tests", and "Rescheduling Tests". -## Step 5: Run the suite +## Step 5: Run a simulation -Execute all simulations in your suite and monitor them in real time. +Execute simulations against your assistant or squad. You can run individual simulations or entire suites. - - 1. Navigate to your suite in the **Suites** tab - 2. Click **Run Suite** - 3. All simulations in the suite will be queued and executed + + 1. Navigate to your simulation or suite + 2. Click **Run** + 3. Select the **Target**: + - Choose **Assistant** or **Squad** + - Select from the dropdown + 4. Configure **Transport** (optional): + - **Voice**: `vapi.websocket` (default) + - **Chat**: `vapi.webchat` (faster, no audio) + 5. Set **Iterations** (optional): Number of times to run each simulation + 6. Click **Start Run** - + 1. Click the **Runs** tab to see live status updates 2. Watch as each simulation progresses: - **Queued** - Waiting to start - - **Running** - Call in progress - - **Completed** - Test finished - 3. Click **Listen** on any running test to hear the call live + - **Running** - Test in progress + - **Ended** - Test finished + 3. 
For voice mode, click **Listen** on any running test to hear the call live -**Run the suite:** +**Run a single simulation in voice mode:** ```bash -curl -X POST "https://api.vapi.ai/simulation/suite/suite-xyz/run" \ - -H "Authorization: Bearer $VAPI_API_KEY" +curl -X POST "https://api.vapi.ai/eval/simulation/run" \ + -H "Authorization: Bearer $VAPI_API_KEY" \ + -H "Content-Type: application/json" \ + -d '{ + "simulations": [ + { + "type": "simulation", + "simulationId": "550e8400-e29b-41d4-a716-446655440003" + } + ], + "target": { + "type": "assistant", + "assistantId": "your-assistant-id" + }, + "transport": { + "provider": "vapi.websocket" + } + }' +``` + +**Run a simulation in chat mode (faster, no audio):** + +```bash +curl -X POST "https://api.vapi.ai/eval/simulation/run" \ + -H "Authorization: Bearer $VAPI_API_KEY" \ + -H "Content-Type: application/json" \ + -d '{ + "simulations": [ + { + "type": "simulation", + "simulationId": "550e8400-e29b-41d4-a716-446655440003" + } + ], + "target": { + "type": "assistant", + "assistantId": "your-assistant-id" + }, + "transport": { + "provider": "vapi.webchat" + } + }' +``` + +**Run a suite with multiple iterations:** + +```bash +curl -X POST "https://api.vapi.ai/eval/simulation/run" \ + -H "Authorization: Bearer $VAPI_API_KEY" \ + -H "Content-Type: application/json" \ + -d '{ + "simulations": [ + { + "type": "simulationSuite", + "simulationSuiteId": "550e8400-e29b-41d4-a716-446655440006" + } + ], + "target": { + "type": "assistant", + "assistantId": "your-assistant-id" + }, + "iterations": 3 + }' ``` **Response:** ```json { - "id": "run-123", - "suiteId": "suite-xyz", - "status": "running", + "id": "550e8400-e29b-41d4-a716-446655440007", + "orgId": "org-456", + "status": "queued", "simulations": [ { - "simulationId": "simulation-abc", - "status": "queued" - }, - { - "simulationId": "simulation-def", - "status": "queued" - }, - { - "simulationId": "simulation-ghi", - "status": "queued" + "type": "simulation", + "simulationId": "550e8400-e29b-41d4-a716-446655440003" } ], - "createdAt": "2024-01-15T09:50:00Z" + "target": { + "type": "assistant", + "assistantId": "your-assistant-id" + }, + "transport": { + "provider": "vapi.websocket" + }, + "queuedAt": "2024-01-15T09:50:00Z", + "createdAt": "2024-01-15T09:50:00Z", + "updatedAt": "2024-01-15T09:50:00Z" } ``` **Check run status:** ```bash -curl -X GET "https://api.vapi.ai/simulation/run/run-123" \ +curl -X GET "https://api.vapi.ai/eval/simulation/run/550e8400-e29b-41d4-a716-446655440007" \ -H "Authorization: Bearer $VAPI_API_KEY" ``` +### Transport options + +| Provider | Description | Use Case | +| --- | --- | --- | +| `vapi.websocket` | Full voice simulation with audio bridge | Production validation, end-to-end testing | +| `vapi.webchat` | Text-based chat simulation | Rapid iteration, development testing | + - Running a suite will execute actual voice calls to your assistant. Ensure your assistant is properly configured before running tests. + **Hooks are only supported in voice mode.** If your scenario uses hooks (like `call.started` or `call.ended`), you must use `vapi.websocket` transport. 
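
Runs execute asynchronously, so scripts typically poll until the run reaches a terminal status before reading results. Here's a minimal polling sketch against the status endpoint above — it assumes `jq` is installed and, inferring from the `itemCounts` fields, that `canceled` is the other terminal state:

```bash
# Poll the run until it leaves the queued/running states.
RUN_ID="550e8400-e29b-41d4-a716-446655440007"

while true; do
  STATUS=$(curl -s "https://api.vapi.ai/eval/simulation/run/$RUN_ID" \
    -H "Authorization: Bearer $VAPI_API_KEY" | jq -r '.status')
  echo "Run status: $STATUS"

  # "ended" is the documented terminal state; "canceled" is assumed from itemCounts.
  if [ "$STATUS" = "ended" ] || [ "$STATUS" = "canceled" ]; then
    break
  fi
  sleep 10
done
```

Chat-mode runs usually finish much faster than voice runs, since voice runs last as long as the underlying calls.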
## Step 6: Review results @@ -408,83 +589,54 @@ Analyze the results of your simulation runs to understand how your assistant per ### Successful run -When all simulations pass, you'll see: +When all evaluations pass, you'll see: ```json { - "id": "run-123", - "suiteId": "suite-xyz", - "status": "completed", - "results": [ - { - "simulationId": "simulation-abc", - "status": "pass", - "successCriteria": [ - { - "criterion": "Appointment is confirmed with a specific date and time", - "passed": true - }, - { - "criterion": "Confirmation number is provided", - "passed": true - } - ], - "duration": "45s" - } - ], - "summary": { + "id": "550e8400-e29b-41d4-a716-446655440007", + "status": "ended", + "itemCounts": { "total": 3, "passed": 3, - "failed": 0 - } + "failed": 0, + "running": 0, + "queued": 0, + "canceled": 0 + }, + "startedAt": "2024-01-15T09:50:05Z", + "endedAt": "2024-01-15T09:52:30Z" } ``` **Pass criteria:** -- `status` is "completed" -- `results[].status` is "pass" for all simulations -- All `successCriteria` items show `passed: true` +- `status` is "ended" +- `itemCounts.passed` equals `itemCounts.total` +- All required evaluations show `passed: true` ### Failed run -When validation fails, you'll see details about what went wrong: +When evaluation fails, you'll see details about what went wrong: ```json { - "id": "run-124", - "suiteId": "suite-xyz", - "status": "completed", - "results": [ - { - "simulationId": "simulation-abc", - "status": "fail", - "successCriteria": [ - { - "criterion": "Appointment is confirmed with a specific date and time", - "passed": true - }, - { - "criterion": "Confirmation number is provided", - "passed": false, - "reason": "No confirmation number was mentioned in the conversation" - } - ], - "duration": "52s" - } - ], - "summary": { + "id": "550e8400-e29b-41d4-a716-446655440008", + "status": "ended", + "itemCounts": { "total": 3, "passed": 2, - "failed": 1 + "failed": 1, + "running": 0, + "queued": 0, + "canceled": 0 } } ``` **Failure indicators:** -- `results[].status` is "fail" -- `successCriteria[].passed` is `false` with a `reason` explaining the failure +- `itemCounts.failed` > 0 +- Individual run items show which evaluations failed and why @@ -497,16 +649,15 @@ When validation fails, you'll see details about what went wrong: 1. Click on any failed simulation - 2. Review the **Timeline** to see the conversation flow - 3. Check which success criteria failed and why - 4. Click **Listen to Recording** to hear the full call + 2. Review the **Conversation** to see the full transcript + 3. Check which evaluations failed and their actual vs expected values + 4. For voice mode, click **Listen to Recording** to hear the full call 1. Go to the main **Simulations** page - 2. Filter by **Suites** to see historical runs - 3. Monitor pass rates and identify trends - 4. Compare performance across different suite versions + 2. View historical runs and their pass rates + 3. 
Monitor trends to identify regressions @@ -515,40 +666,40 @@ When validation fails, you'll see details about what went wrong: **List all runs:** ```bash -curl -X GET "https://api.vapi.ai/simulation/run" \ +curl -X GET "https://api.vapi.ai/eval/simulation/run" \ -H "Authorization: Bearer $VAPI_API_KEY" ``` **Get detailed results for a specific run:** ```bash -curl -X GET "https://api.vapi.ai/simulation/run/run-123" \ +curl -X GET "https://api.vapi.ai/eval/simulation/run/550e8400-e29b-41d4-a716-446655440007" \ -H "Authorization: Bearer $VAPI_API_KEY" ``` -**Filter runs by suite:** +**Filter runs by status:** ```bash -curl -X GET "https://api.vapi.ai/simulation/run?suiteId=suite-xyz" \ +curl -X GET "https://api.vapi.ai/eval/simulation/run?status=ended" \ -H "Authorization: Bearer $VAPI_API_KEY" ``` - Full conversation recordings are available for all simulation runs, making it easy to understand exactly what happened during each test. + Full conversation transcripts are available for all simulation runs, making it easy to understand exactly what happened during each test. ## Troubleshooting | Issue | Solution | | --- | --- | -| Simulation always fails | Check that success criteria are achievable with your assistant's current capabilities | -| Run stuck in "running" | Verify your assistant is properly configured and responding to calls | -| Personality not applied | Ensure the personality ID is correctly linked to the simulation | -| Success criteria unclear | Make criteria specific and measurable (e.g., "mentions confirmation number" vs "completes task") | -| No audio in recording | Check that your assistant has voice configuration enabled | -| Suite won't start | Verify all simulations in the suite are valid and have targets assigned | +| Simulation always fails | Check that evaluations are achievable with your assistant's current capabilities | +| Run stuck in "running" | Verify your assistant is properly configured and responding | +| Evaluations not extracting data | Ensure structured output schemas match what your assistant can provide | +| No audio in recording | Check that you're using `vapi.websocket` transport, not `vapi.webchat` | +| Hooks not triggering | Hooks only work with `vapi.websocket` transport | +| Suite won't start | Verify all simulations in the suite exist and have valid scenarios/personalities | ### Common errors @@ -558,33 +709,61 @@ curl -X GET "https://api.vapi.ai/simulation/run?suiteId=suite-xyz" \ - Verify API keys are valid - Test the assistant manually before running simulations -**Success criteria failures:** +**Evaluation failures:** -- Review the conversation recording to understand what happened -- Adjust criteria to be more specific or more flexible as needed +- Review the conversation transcript to understand what happened +- Adjust structured output schemas to better match expected responses - Consider whether the personality is making the test unrealistically difficult If simulations consistently fail, test your assistant manually first to ensure it's working correctly before debugging the simulation configuration. 
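
To script this triage, you can combine the list endpoint with `jq`. The sketch below flags ended runs containing failures — it assumes the list endpoint returns an array of run objects with the `itemCounts` shape shown in Step 6 (if the response wraps them in a field such as `results`, adjust the filter accordingly):

```bash
# Print the id and failure ratio for every ended run that has failures.
curl -s "https://api.vapi.ai/eval/simulation/run?status=ended" \
  -H "Authorization: Bearer $VAPI_API_KEY" |
  jq -r '.[]
         | select(.itemCounts.failed > 0)
         | "\(.id): \(.itemCounts.failed)/\(.itemCounts.total) failed"'
```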
+## API reference + +| Endpoint | Method | Description | +| --- | --- | --- | +| `/eval/simulation/personality` | POST | Create a personality | +| `/eval/simulation/personality` | GET | List personalities | +| `/eval/simulation/personality/:id` | GET | Get a personality | +| `/eval/simulation/personality/:id` | PATCH | Update a personality | +| `/eval/simulation/personality/:id` | DELETE | Delete a personality | +| `/eval/simulation/scenario` | POST | Create a scenario | +| `/eval/simulation/scenario` | GET | List scenarios | +| `/eval/simulation/scenario/:id` | GET | Get a scenario | +| `/eval/simulation/scenario/:id` | PATCH | Update a scenario | +| `/eval/simulation/scenario/:id` | DELETE | Delete a scenario | +| `/eval/simulation` | POST | Create a simulation | +| `/eval/simulation` | GET | List simulations | +| `/eval/simulation/:id` | GET | Get a simulation | +| `/eval/simulation/:id` | PATCH | Update a simulation | +| `/eval/simulation/:id` | DELETE | Delete a simulation | +| `/eval/simulation/suite` | POST | Create a suite | +| `/eval/simulation/suite` | GET | List suites | +| `/eval/simulation/suite/:id` | GET | Get a suite | +| `/eval/simulation/suite/:id` | PATCH | Update a suite | +| `/eval/simulation/suite/:id` | DELETE | Delete a suite | +| `/eval/simulation/run` | POST | Start a simulation run | +| `/eval/simulation/run` | GET | List runs | +| `/eval/simulation/run/:id` | GET | Get run details | + ## Next steps - Create and configure assistants to test + Learn about tool mocks, hooks, CI/CD integration, and testing strategies - Build multi-agent squads and test handoffs + Create and configure assistants to test - Improve your assistant's responses with better prompts + Learn how to define structured outputs for evaluations @@ -609,9 +788,9 @@ curl -X GET "https://api.vapi.ai/simulation/run?suiteId=suite-xyz" \ **Best practices for effective simulation testing:** - - **Start simple** - Begin with straightforward scenarios before testing edge cases + - **Start with chat mode** - Use `vapi.webchat` for rapid iteration, then validate with voice - **Use realistic personalities** - Model your test callers after actual customer types - - **Define clear success criteria** - Specific, measurable criteria lead to reliable tests + - **Define clear evaluations** - Use specific, measurable structured outputs - **Group related tests** - Organize suites by feature or user flow - **Monitor trends** - Track pass rates over time to catch regressions early - **Test after changes** - Run your simulation suites after updating prompts or tools @@ -619,6 +798,26 @@ curl -X GET "https://api.vapi.ai/simulation/run?suiteId=suite-xyz" \ - **Iterate on failures** - Use failed tests to improve both your assistant and test design +## Frequently asked questions + + + + No, simulations cost the same as regular calls. Both the tester and target assistants are charged normally for LLM, TTS, and STT usage. Chat mode (`vapi.webchat`) is typically cheaper since it doesn't use voice processing. + + + + **Simulations** use AI-powered testers that have actual conversations with your assistant, producing real call recordings and transcripts. **Evals** use mock conversations with predefined messages and judge the responses. Use Simulations for realistic end-to-end testing; use Evals for faster, more controlled validation. + + + + Yes! You can either define inline structured outputs in your scenario evaluations, or reference existing structured outputs by ID using the `structuredOutputId` field. 
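
    As an illustration, updating a scenario to reference an existing structured output might look like the sketch below. The `evaluations` nesting and field names are assumptions for illustration — this guide doesn't show the full scenario payload — and `your-structured-output-id` is a placeholder:

    ```bash
    curl -X PATCH "https://api.vapi.ai/eval/simulation/scenario/550e8400-e29b-41d4-a716-446655440002" \
      -H "Authorization: Bearer $VAPI_API_KEY" \
      -H "Content-Type: application/json" \
      -d '{
        "evaluations": [
          { "structuredOutputId": "your-structured-output-id" }
        ]
      }'
    ```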
+ + + + Create a simulation that targets a squad instead of an assistant. Use the `target.type: "squad"` and `target.squadId` fields when creating a run. + + + ## Get help Need assistance? We're here to help: From 3690422e8d0c18f1ba6c28c26a3537610548f366 Mon Sep 17 00:00:00 2001 From: Noah Raynor Date: Tue, 3 Feb 2026 20:23:58 -0800 Subject: [PATCH 03/10] a few fixes --- fern/observability/simulations-advanced.mdx | 25 ------- fern/observability/simulations-quickstart.mdx | 74 +------------------ 2 files changed, 2 insertions(+), 97 deletions(-) diff --git a/fern/observability/simulations-advanced.mdx b/fern/observability/simulations-advanced.mdx index ac178ad75..4ab5a0e95 100644 --- a/fern/observability/simulations-advanced.mdx +++ b/fern/observability/simulations-advanced.mdx @@ -544,31 +544,6 @@ Test boundary conditions and unusual inputs your assistant might encounter. | Pre-production validation | Voice (`vapi.websocket`) | Full end-to-end | | Testing hooks/webhooks | Voice (`vapi.websocket`) | Hooks require voice | -### Performance optimization - -**Minimize test execution time:** - -1. **Use chat mode for initial development:** - - `vapi.webchat` runs faster than voice - - Switch to voice for final validation - -2. **Keep instructions focused:** - - Clear, specific instructions complete faster - - Avoid overly complex multi-step scenarios - -3. **Batch related tests:** - - Group similar simulations in suites - - Run suites instead of individual simulations - -4. **Use iterations strategically:** - - `iterations: 1` for deterministic scenarios - - Higher iterations for testing consistency - -**Cost optimization:** -- Chat mode costs less (no STT/TTS) -- Simple personalities (smaller models) cost less -- Shorter conversations cost less - ## CI/CD integration Automate simulation runs in your deployment pipeline. diff --git a/fern/observability/simulations-quickstart.mdx b/fern/observability/simulations-quickstart.mdx index 38c6d98f8..ce35a2d46 100644 --- a/fern/observability/simulations-quickstart.mdx +++ b/fern/observability/simulations-quickstart.mdx @@ -35,15 +35,13 @@ Simulations support two transport modes: - **`vapi.websocket`** - Full voice simulation with audio - + - Full voice simulation with audio - Realistic end-to-end testing - Tests speech recognition and synthesis - Produces call recordings - **`vapi.webchat`** - Text-based chat simulation - + - Text-based chat simulation - Faster execution - Lower cost (no audio processing) - Ideal for rapid iteration @@ -572,17 +570,6 @@ curl -X GET "https://api.vapi.ai/eval/simulation/run/550e8400-e29b-41d4-a716-446 -### Transport options - -| Provider | Description | Use Case | -| --- | --- | --- | -| `vapi.websocket` | Full voice simulation with audio bridge | Production validation, end-to-end testing | -| `vapi.webchat` | Text-based chat simulation | Rapid iteration, development testing | - - - **Hooks are only supported in voice mode.** If your scenario uses hooks (like `call.started` or `call.ended`), you must use `vapi.websocket` transport. - - ## Step 6: Review results Analyze the results of your simulation runs to understand how your assistant performed. @@ -690,63 +677,6 @@ curl -X GET "https://api.vapi.ai/eval/simulation/run?status=ended" \ Full conversation transcripts are available for all simulation runs, making it easy to understand exactly what happened during each test. 
-## Troubleshooting - -| Issue | Solution | -| --- | --- | -| Simulation always fails | Check that evaluations are achievable with your assistant's current capabilities | -| Run stuck in "running" | Verify your assistant is properly configured and responding | -| Evaluations not extracting data | Ensure structured output schemas match what your assistant can provide | -| No audio in recording | Check that you're using `vapi.websocket` transport, not `vapi.webchat` | -| Hooks not triggering | Hooks only work with `vapi.websocket` transport | -| Suite won't start | Verify all simulations in the suite exist and have valid scenarios/personalities | - -### Common errors - -**"assistant-error" status:** - -- Check your assistant configuration (model, voice, tools) -- Verify API keys are valid -- Test the assistant manually before running simulations - -**Evaluation failures:** - -- Review the conversation transcript to understand what happened -- Adjust structured output schemas to better match expected responses -- Consider whether the personality is making the test unrealistically difficult - - - If simulations consistently fail, test your assistant manually first to ensure it's working correctly before debugging the simulation configuration. - - -## API reference - -| Endpoint | Method | Description | -| --- | --- | --- | -| `/eval/simulation/personality` | POST | Create a personality | -| `/eval/simulation/personality` | GET | List personalities | -| `/eval/simulation/personality/:id` | GET | Get a personality | -| `/eval/simulation/personality/:id` | PATCH | Update a personality | -| `/eval/simulation/personality/:id` | DELETE | Delete a personality | -| `/eval/simulation/scenario` | POST | Create a scenario | -| `/eval/simulation/scenario` | GET | List scenarios | -| `/eval/simulation/scenario/:id` | GET | Get a scenario | -| `/eval/simulation/scenario/:id` | PATCH | Update a scenario | -| `/eval/simulation/scenario/:id` | DELETE | Delete a scenario | -| `/eval/simulation` | POST | Create a simulation | -| `/eval/simulation` | GET | List simulations | -| `/eval/simulation/:id` | GET | Get a simulation | -| `/eval/simulation/:id` | PATCH | Update a simulation | -| `/eval/simulation/:id` | DELETE | Delete a simulation | -| `/eval/simulation/suite` | POST | Create a suite | -| `/eval/simulation/suite` | GET | List suites | -| `/eval/simulation/suite/:id` | GET | Get a suite | -| `/eval/simulation/suite/:id` | PATCH | Update a suite | -| `/eval/simulation/suite/:id` | DELETE | Delete a suite | -| `/eval/simulation/run` | POST | Start a simulation run | -| `/eval/simulation/run` | GET | List runs | -| `/eval/simulation/run/:id` | GET | Get run details | - ## Next steps From aafb19d62123d197e7648433a49f9cc2fbb51eb9 Mon Sep 17 00:00:00 2001 From: Noah Raynor Date: Tue, 3 Feb 2026 20:30:15 -0800 Subject: [PATCH 04/10] alpha badges --- fern/assets/styles.css | 13 +++++++++++++ fern/observability/simulations-advanced.mdx | 2 ++ fern/observability/simulations-quickstart.mdx | 2 ++ 3 files changed, 17 insertions(+) diff --git a/fern/assets/styles.css b/fern/assets/styles.css index ebec09075..170103053 100644 --- a/fern/assets/styles.css +++ b/fern/assets/styles.css @@ -38,6 +38,13 @@ border: 1px solid #C7D2FE; } +/* Alpha badge - purple to match dashboard */ +.vapi-badge-alpha { + background-color: rgba(168, 85, 247, 0.2); + color: #A78BFA; + border: 1px solid rgba(168, 85, 247, 0.4); +} + /* Dark mode adjustments */ :is(.dark) .vapi-badge-assistant { background-color: #134E4A; @@ -57,6 +64,12 @@ 
border: 1px solid #6366F1; } +:is(.dark) .vapi-badge-alpha { + background-color: rgba(168, 85, 247, 0.2); + color: #C4B5FD; + border: 1px solid rgba(168, 85, 247, 0.4); +} + /* for a grid of videos */ .video-grid { diff --git a/fern/observability/simulations-advanced.mdx b/fern/observability/simulations-advanced.mdx index 4ab5a0e95..698aa57cf 100644 --- a/fern/observability/simulations-advanced.mdx +++ b/fern/observability/simulations-advanced.mdx @@ -4,6 +4,8 @@ subtitle: Master testing strategies and best practices for AI voice agent simula slug: observability/simulations-advanced --- +
<div className="vapi-badge-alpha">Alpha</div>
+ ## Overview This guide covers advanced simulation strategies, testing patterns, and best practices for building robust test suites that ensure your AI voice agents work reliably in production. diff --git a/fern/observability/simulations-quickstart.mdx b/fern/observability/simulations-quickstart.mdx index ce35a2d46..cf58c8e1c 100644 --- a/fern/observability/simulations-quickstart.mdx +++ b/fern/observability/simulations-quickstart.mdx @@ -4,6 +4,8 @@ subtitle: Test your AI assistants with realistic AI-powered callers slug: observability/simulations-quickstart --- +
<div className="vapi-badge-alpha">Alpha</div>
+ ## Overview This quickstart guide will help you test your AI assistants and squads using realistic, AI-powered callers. In just a few minutes, you'll create test scenarios, define evaluation criteria, and validate your agents work correctly under different conditions. From 5c5a154167d69699e960b155ee1787197d325d8c Mon Sep 17 00:00:00 2001 From: Noah Raynor Date: Tue, 3 Feb 2026 21:25:36 -0800 Subject: [PATCH 05/10] adjusting alpha badge --- fern/assets/styles.css | 19 +++++++++++++++++++ fern/docs.yml | 1 + fern/observability/simulations-advanced.mdx | 3 +-- fern/observability/simulations-quickstart.mdx | 3 +-- 4 files changed, 22 insertions(+), 4 deletions(-) diff --git a/fern/assets/styles.css b/fern/assets/styles.css index 170103053..06103ba24 100644 --- a/fern/assets/styles.css +++ b/fern/assets/styles.css @@ -70,6 +70,25 @@ border: 1px solid rgba(168, 85, 247, 0.4); } +/* Override Fern's pre-release availability badge to show "Alpha" with purple styling */ +.fern-docs-badge[title="Pre-release"] { + background-color: rgba(168, 85, 247, 0.2) !important; + color: #A78BFA !important; + border-color: rgba(168, 85, 247, 0.4) !important; + font-size: 0 !important; +} + +.fern-docs-badge[title="Pre-release"]::after { + content: "Alpha"; + font-size: 0.75rem; +} + +:is(.dark) .fern-docs-badge[title="Pre-release"] { + background-color: rgba(168, 85, 247, 0.2) !important; + color: #C4B5FD !important; + border-color: rgba(168, 85, 247, 0.4) !important; +} + /* for a grid of videos */ .video-grid { diff --git a/fern/docs.yml b/fern/docs.yml index 3e00822db..762f9844c 100644 --- a/fern/docs.yml +++ b/fern/docs.yml @@ -291,6 +291,7 @@ navigation: icon: fa-light fa-clipboard-check - section: Simulations icon: fa-light fa-flask-vial + availability: pre-release contents: - page: Quickstart path: observability/simulations-quickstart.mdx diff --git a/fern/observability/simulations-advanced.mdx b/fern/observability/simulations-advanced.mdx index 698aa57cf..414f1cfec 100644 --- a/fern/observability/simulations-advanced.mdx +++ b/fern/observability/simulations-advanced.mdx @@ -2,10 +2,9 @@ title: Advanced simulation testing subtitle: Master testing strategies and best practices for AI voice agent simulations slug: observability/simulations-advanced +availability: pre-release --- -
<div className="vapi-badge-alpha">Alpha</div>
- ## Overview This guide covers advanced simulation strategies, testing patterns, and best practices for building robust test suites that ensure your AI voice agents work reliably in production. diff --git a/fern/observability/simulations-quickstart.mdx b/fern/observability/simulations-quickstart.mdx index cf58c8e1c..306f2684d 100644 --- a/fern/observability/simulations-quickstart.mdx +++ b/fern/observability/simulations-quickstart.mdx @@ -2,10 +2,9 @@ title: Simulations quickstart subtitle: Test your AI assistants with realistic AI-powered callers slug: observability/simulations-quickstart +availability: pre-release --- -
<div className="vapi-badge-alpha">Alpha</div>
- ## Overview This quickstart guide will help you test your AI assistants and squads using realistic, AI-powered callers. In just a few minutes, you'll create test scenarios, define evaluation criteria, and validate your agents work correctly under different conditions. From 6834d11d9d731c88f34bd3737900b5dadabafe18 Mon Sep 17 00:00:00 2001 From: Noah Raynor Date: Tue, 3 Feb 2026 21:57:13 -0800 Subject: [PATCH 06/10] formatting alpha badge --- fern/assets/styles.css | 26 +++++++++++++++------ fern/observability/simulations-advanced.mdx | 2 +- 2 files changed, 20 insertions(+), 8 deletions(-) diff --git a/fern/assets/styles.css b/fern/assets/styles.css index 06103ba24..7b3a8d378 100644 --- a/fern/assets/styles.css +++ b/fern/assets/styles.css @@ -40,9 +40,10 @@ /* Alpha badge - purple to match dashboard */ .vapi-badge-alpha { - background-color: rgba(168, 85, 247, 0.2); - color: #A78BFA; - border: 1px solid rgba(168, 85, 247, 0.4); + background-color: rgba(168, 85, 247, 0.2) !important; + color: #A78BFA !important; + border: 1px solid rgba(168, 85, 247, 0.4) !important; + border-color: rgba(168, 85, 247, 0.4) !important; } /* Dark mode adjustments */ @@ -65,22 +66,33 @@ } :is(.dark) .vapi-badge-alpha { - background-color: rgba(168, 85, 247, 0.2); - color: #C4B5FD; - border: 1px solid rgba(168, 85, 247, 0.4); + background-color: rgba(168, 85, 247, 0.2) !important; + color: #C4B5FD !important; + border: 1px solid rgba(168, 85, 247, 0.4) !important; + border-color: rgba(168, 85, 247, 0.4) !important; } /* Override Fern's pre-release availability badge to show "Alpha" with purple styling */ .fern-docs-badge[title="Pre-release"] { background-color: rgba(168, 85, 247, 0.2) !important; - color: #A78BFA !important; border-color: rgba(168, 85, 247, 0.4) !important; font-size: 0 !important; + position: relative !important; + min-width: 52px !important; + min-height: 24px !important; + display: inline-flex !important; } .fern-docs-badge[title="Pre-release"]::after { content: "Alpha"; + position: absolute; + top: 50%; + left: 50%; + transform: translate(-50%, -50%); + color: #A78BFA; font-size: 0.75rem; + line-height: 1; + white-space: nowrap; } :is(.dark) .fern-docs-badge[title="Pre-release"] { diff --git a/fern/observability/simulations-advanced.mdx b/fern/observability/simulations-advanced.mdx index 414f1cfec..cdafbf808 100644 --- a/fern/observability/simulations-advanced.mdx +++ b/fern/observability/simulations-advanced.mdx @@ -1,5 +1,5 @@ --- -title: Advanced simulation testing +title: Simulations advanced subtitle: Master testing strategies and best practices for AI voice agent simulations slug: observability/simulations-advanced availability: pre-release From 66e31f129e9cfc7feae21ecd15a1c9fb3241c2bc Mon Sep 17 00:00:00 2001 From: Noah Raynor Date: Tue, 3 Feb 2026 22:12:13 -0800 Subject: [PATCH 07/10] fix subheader and make it white --- fern/assets/styles.css | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/fern/assets/styles.css b/fern/assets/styles.css index 7b3a8d378..a029c31a7 100644 --- a/fern/assets/styles.css +++ b/fern/assets/styles.css @@ -277,4 +277,9 @@ html.dark button[data-highlighted] .fern-api-property-meta { .light .fern-theme-default.fern-container { background-color: #fff !important; +} + +/* Fix: Make subtitle white on pages with availability badges in dark mode */ +:is(.dark) .prose-p\:text-\(color\:--grayscale-a11\) :where(p):not(:where([class~=not-prose],[class~=not-prose] *)) { + color: var(--grayscale-12) !important; } \ No newline at end of file From 
67ff69138691d59d4d23df5b70d30c946b789388 Mon Sep 17 00:00:00 2001 From: Noah Raynor Date: Tue, 3 Feb 2026 22:14:50 -0800 Subject: [PATCH 08/10] scope white text for subtitle only to this page --- fern/assets/styles.css | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/fern/assets/styles.css b/fern/assets/styles.css index a029c31a7..8f1df1b39 100644 --- a/fern/assets/styles.css +++ b/fern/assets/styles.css @@ -279,7 +279,7 @@ html.dark button[data-highlighted] .fern-api-property-meta { background-color: #fff !important; } -/* Fix: Make subtitle white on pages with availability badges in dark mode */ -:is(.dark) .prose-p\:text-\(color\:--grayscale-a11\) :where(p):not(:where([class~=not-prose],[class~=not-prose] *)) { +/* Fix: Make subtitle white on Simulations pages in dark mode */ +:is(.dark) [id*="simulations"] .prose-p\:text-\(color\:--grayscale-a11\) :where(p):not(:where([class~=not-prose],[class~=not-prose] *)) { color: var(--grayscale-12) !important; } \ No newline at end of file From e454051ff80d8f5128573d50a5c16675d9730d66 Mon Sep 17 00:00:00 2001 From: Noah Raynor Date: Tue, 3 Feb 2026 22:33:21 -0800 Subject: [PATCH 09/10] fixed faq --- fern/observability/simulations-quickstart.mdx | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/fern/observability/simulations-quickstart.mdx b/fern/observability/simulations-quickstart.mdx index 306f2684d..5941b1479 100644 --- a/fern/observability/simulations-quickstart.mdx +++ b/fern/observability/simulations-quickstart.mdx @@ -732,8 +732,8 @@ curl -X GET "https://api.vapi.ai/eval/simulation/run?status=ended" \ ## Frequently asked questions - - No, simulations cost the same as regular calls. Both the tester and target assistants are charged normally for LLM, TTS, and STT usage. Chat mode (`vapi.webchat`) is typically cheaper since it doesn't use voice processing. + + Simulation concurrency follows your organization's call concurrency limits. Each **voice simulation** uses **2 concurrent call slots** (one for the AI tester, one for your assistant being tested). **Chat mode** simulations are more efficient since they don't require audio processing. If you need higher concurrency limits, contact support. From 7588a5853bef94d0607bfc46bf2340132d7cbb86 Mon Sep 17 00:00:00 2001 From: Noah Raynor Date: Tue, 3 Feb 2026 22:38:45 -0800 Subject: [PATCH 10/10] more faq fixes --- fern/observability/simulations-quickstart.mdx | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/fern/observability/simulations-quickstart.mdx b/fern/observability/simulations-quickstart.mdx index 5941b1479..6416004d1 100644 --- a/fern/observability/simulations-quickstart.mdx +++ b/fern/observability/simulations-quickstart.mdx @@ -733,11 +733,11 @@ curl -X GET "https://api.vapi.ai/eval/simulation/run?status=ended" \ - Simulation concurrency follows your organization's call concurrency limits. Each **voice simulation** uses **2 concurrent call slots** (one for the AI tester, one for your assistant being tested). **Chat mode** simulations are more efficient since they don't require audio processing. If you need higher concurrency limits, contact support. + Simulation concurrency follows your organization's call concurrency limits. Each voice simulation uses 2 concurrent call slots (one for the AI tester, one for your assistant being tested). Chat mode simulations are more efficient since they don't require audio processing. If you need higher concurrency limits, contact support. 
- **Simulations** use AI-powered testers that have actual conversations with your assistant, producing real call recordings and transcripts. **Evals** use mock conversations with predefined messages and judge the responses. Use Simulations for realistic end-to-end testing; use Evals for faster, more controlled validation. + Simulations use AI-powered testers that have actual conversations with your assistant, producing real call recordings and transcripts. Evals use mock conversations with predefined messages and judge the responses. Use Simulations for realistic end-to-end testing; use Evals for faster, more controlled validation.