From 65a738c39419c1440da9e4f9f3360565e8508078 Mon Sep 17 00:00:00 2001
From: Howie Leung <howieleung@microsoft.com>
Date: Mon, 29 Dec 2025 11:32:47 -0800
Subject: [PATCH 01/11] code clean up and  added readme

---
 .../azure-ai-projects/tests/samples/README.md | 109 +++++
 .../tests/samples/sample_executor.py          | 383 ++++++++++++++++++
 .../tests/samples/sample_executor_helpers.py  | 206 ----------
 .../tests/samples/test_samples.py             |  88 +---
 .../tests/samples/test_samples_async.py       |  91 +----
 .../tests/samples/test_samples_helpers.py     |  54 +++
 sdk/ai/azure-ai-projects/tests/test_base.py   |   8 +
 7 files changed, 567 insertions(+), 372 deletions(-)
 create mode 100644 sdk/ai/azure-ai-projects/tests/samples/README.md
 create mode 100644 sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
 delete mode 100644 sdk/ai/azure-ai-projects/tests/samples/sample_executor_helpers.py
 create mode 100644 sdk/ai/azure-ai-projects/tests/samples/test_samples_helpers.py

diff --git a/sdk/ai/azure-ai-projects/tests/samples/README.md b/sdk/ai/azure-ai-projects/tests/samples/README.md
new file mode 100644
index 000000000000..604dfddb63f3
--- /dev/null
+++ b/sdk/ai/azure-ai-projects/tests/samples/README.md
@@ -0,0 +1,109 @@
+## Recorded sample tests
+
+Use recorded tests to validate samples with `SyncSampleExecutor` and `AsyncSampleExecutor`. Tests run the sample code, fail on exceptions, and can optionally validate captured `print` output through LLM instructions.
+
+### Prerequisites
+- In `.env`, set the variables required by your samples plus `AZURE_TEST_RUN_LIVE=true` and `AZURE_SKIP_LIVE_RECORDING=false` when capturing recordings. CI playback typically uses `AZURE_TEST_RUN_LIVE=false` and `AZURE_SKIP_LIVE_RECORDING=true`.
+- Provide sanitized defaults via `servicePreparer` so recordings do not leak secrets.
+
+### Sync example
+```python
+import pytest
+import os
+from devtools_testutils import recorded_by_proxy, AzureRecordedTestCase, RecordedTransport
+from test_base import servicePreparer
+from sample_executor import SyncSampleExecutor, get_sample_paths, SamplePathPasser
+from test_samples_helpers import agent_tools_instructions, get_sample_environment_variables_map
+
+class TestSamples(AzureRecordedTestCase):
+    @servicePreparer()
+    @pytest.mark.parametrize(
+        "sample_path",
+        get_sample_paths(
+            "agents/tools",
+            samples_to_skip=[
+                "sample_agent_bing_custom_search.py",
+                "sample_agent_bing_grounding.py",
+                "sample_agent_browser_automation.py",
+                "sample_agent_fabric.py",
+                "sample_agent_mcp_with_project_connection.py",
+                "sample_agent_openapi_with_project_connection.py",
+                "sample_agent_to_agent.py",
+            ],
+        ),
+    )
+    @SamplePathPasser()
+    @recorded_by_proxy(RecordedTransport.AZURE_CORE, RecordedTransport.HTTPX)
+    def test_agent_tools_samples(self, sample_path: str, **kwargs) -> None:
+        env_var_mapping = get_sample_environment_variables_map()
+        executor = SyncSampleExecutor(self, sample_path, env_var_mapping, **kwargs)
+        executor.execute()
+        executor.validate_print_calls_by_llm(
+            instructions=agent_tools_instructions,
+            project_endpoint=os.environ["AZURE_AI_PROJECT_ENDPOINT"],
+        )        
+```
+
+### Async example
+```python
+import pytest
+from devtools_testutils.aio import recorded_by_proxy_async
+import os
+from devtools_testutils import AzureRecordedTestCase, RecordedTransport
+from test_base import servicePreparer
+from sample_executor import AsyncSampleExecutor, get_async_sample_paths, SamplePathPasser
+from test_samples_helpers import agent_tools_instructions, get_sample_environment_variables_map
+
+class TestSamplesAsync(AzureRecordedTestCase):
+
+    @servicePreparer()
+    @pytest.mark.parametrize(
+        "sample_path",
+        get_async_sample_paths(
+            "agents/tools",
+            samples_to_skip=[
+                "sample_agent_mcp_with_project_connection_async.py",
+            ],
+        ),
+    )
+    @SamplePathPasser()
+    @recorded_by_proxy_async(RecordedTransport.AZURE_CORE, RecordedTransport.HTTPX)
+    async def test_agent_tools_samples_async(self, sample_path: str, **kwargs) -> None:
+        env_var_mapping = get_sample_environment_variables_map()
+        executor = AsyncSampleExecutor(self, sample_path, env_var_mapping, **kwargs)
+        await executor.execute_async()
+        await executor.validate_print_calls_by_llm(
+            instructions=agent_tools_instructions,
+            project_endpoint=os.environ["AZURE_AI_PROJECT_ENDPOINT"],
+        )
+```
+
+### Key pieces
+- `@servicePreparer()`: Supplies sanitized environment variables for playback (often via `EnvironmentVariableLoader`). Use an empty string as the prefix if your variables do not share one.
+- Example:
+```python
+import functools
+from devtools_testutils import EnvironmentVariableLoader
+
+servicePreparer = functools.partial(
+    EnvironmentVariableLoader,
+    "azure_ai_projects_tests",
+    azure_ai_projects_tests_project_endpoint="https://sanitized-account-name.services.ai.azure.com/api/projects/sanitized-project-name",
+    azure_ai_projects_tests_model_deployment_name="gpt-4o",
+    # add other sanitized vars here
+)
+```
+- `@pytest.mark.parametrize`: Drives one test per sample file. Use `samples_to_test` or `samples_to_skip` with `get_sample_paths` / `get_async_sample_paths`.
+- `@SamplePathPasser`: Forwards the sample path to the recorder decorators.
+- `recorded_by_proxy` / `recorded_by_proxy_async`: Wrap tests for recording/playback. Include `RecordedTransport.HTTPX` when samples use httpx in addition to the default `RecordedTransport.AZURE_CORE`.
+- `get_sample_environment_variables_map`: Map test env vars to the names expected by samples. Pass `{}` if you already export the sample variables directly. Example:
+```python
+def get_sample_environment_variables_map(operation_group: str | None = None) -> dict[str, str]:
+    return {
+        "AZURE_AI_PROJECT_ENDPOINT":  "azure_ai_projects_tests_project_endpoint",
+        "AZURE_AI_MODEL_DEPLOYMENT_NAME": "azure_ai_projects_tests_model_deployment_name",
+        # add other mappings as needed
+    }
+```
+- `execute` / `execute_async`: Run the sample; any exception fails the test.
+- `validate_print_calls_by_llm`: Optionally validate captured print output with LLM instructions and an explicit `project_endpoint` (and optional `model`).
diff --git a/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
new file mode 100644
index 000000000000..0788356daa7f
--- /dev/null
+++ b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
@@ -0,0 +1,383 @@
+# pylint: disable=line-too-long,useless-suppression
+# ------------------------------------
+# Copyright (c) Microsoft Corporation.
+# Licensed under the MIT License.
+# ------------------------------------
+"""Shared base code for sample tests - sync dependencies only."""
+import os
+import sys
+import pytest
+import inspect
+import importlib.util
+from typing import overload, Union
+from pydantic import BaseModel
+
+import json
+import unittest.mock as mock
+from typing import cast
+import pytest
+from azure.core.credentials import TokenCredential
+from azure.core.credentials_async import AsyncTokenCredential
+from devtools_testutils.fake_credentials import FakeTokenCredential
+from devtools_testutils.fake_credentials_async import AsyncFakeCredential
+from devtools_testutils import recorded_by_proxy, AzureRecordedTestCase, RecordedTransport
+from azure.ai.projects import AIProjectClient
+from pytest import MonkeyPatch
+from azure.ai.projects.aio import AIProjectClient as AsyncAIProjectClient
+
+
+@overload
+def get_sample_paths(sub_folder: str, *, samples_to_test: list[str]) -> list:
+    """Get sample paths for testing (whitelist mode).
+
+    Args:
+        sub_folder: Relative path to the samples subfolder (e.g., "agents/tools")
+        samples_to_test: Whitelist of sample filenames to include
+
+    Returns:
+        List of pytest.param objects with sample paths and test IDs
+    """
+    ...
+
+
+@overload
+def get_sample_paths(sub_folder: str, *, samples_to_skip: list[str]) -> list:
+    """Get sample paths for testing (blacklist mode).
+
+    Args:
+        sub_folder: Relative path to the samples subfolder (e.g., "agents/tools")
+        samples_to_skip: Blacklist of sample filenames to exclude (auto-discovers all samples)
+
+    Returns:
+        List of pytest.param objects with sample paths and test IDs
+    """
+    ...
+
+
+def get_sample_paths(
+    sub_folder: str,
+    *,
+    samples_to_skip: Union[list[str], None] = None,
+    samples_to_test: Union[list[str], None] = None,
+) -> list:
+    return _get_sample_paths(
+        sub_folder, samples_to_skip=samples_to_skip, samples_to_test=samples_to_test, is_async=False
+    )
+
+
+@overload
+def get_async_sample_paths(sub_folder: str, *, samples_to_test: list[str]) -> list:
+    """Get async sample paths for testing (whitelist mode).
+
+    Args:
+        sub_folder: Relative path to the samples subfolder (e.g., "agents/tools")
+        samples_to_test: Whitelist of sample filenames to include
+
+    Returns:
+        List of pytest.param objects with sample paths and test IDs
+    """
+    ...
+
+
+@overload
+def get_async_sample_paths(sub_folder: str, *, samples_to_skip: list[str]) -> list:
+    """Get async sample paths for testing (blacklist mode).
+
+    Args:
+        sub_folder: Relative path to the samples subfolder (e.g., "agents/tools")
+        samples_to_skip: Blacklist of sample filenames to exclude (auto-discovers all samples)
+        is_async: Whether to filter for async samples (_async.py suffix)
+
+    Returns:
+        List of pytest.param objects with sample paths and test IDs
+    """
+    ...
+
+
+def get_async_sample_paths(
+    sub_folder: str,
+    *,
+    samples_to_skip: Union[list[str], None] = None,
+    samples_to_test: Union[list[str], None] = None,
+) -> list:
+    return _get_sample_paths(
+        sub_folder, samples_to_skip=samples_to_skip, samples_to_test=samples_to_test, is_async=True
+    )
+
+
+def _get_sample_paths(
+    sub_folder: str,
+    *,
+    samples_to_skip: Union[list[str], None] = None,
+    is_async: Union[bool, None] = None,
+    samples_to_test: Union[list[str], None] = None,
+) -> list:
+    # Get the path to the samples folder
+    current_dir = os.path.dirname(os.path.abspath(__file__))
+    samples_folder_path = os.path.normpath(os.path.join(current_dir, os.pardir, os.pardir))
+    target_folder = os.path.join(samples_folder_path, "samples", *sub_folder.split("/"))
+
+    if not os.path.exists(target_folder):
+        raise ValueError(f"Target folder does not exist: {target_folder}")
+
+    # Discover all sample files in the folder
+    all_files = [f for f in os.listdir(target_folder) if f.startswith("sample_") and f.endswith(".py")]
+
+    # Filter by async suffix only when using samples_to_skip
+    if samples_to_skip is not None and is_async is not None:
+        if is_async:
+            all_files = [f for f in all_files if f.endswith("_async.py")]
+        else:
+            all_files = [f for f in all_files if not f.endswith("_async.py")]
+
+    # Apply whitelist or blacklist
+    if samples_to_test is not None:
+        files_to_test = [f for f in all_files if f in samples_to_test]
+    else:  # samples_to_skip is not None
+        assert samples_to_skip is not None
+        files_to_test = [f for f in all_files if f not in samples_to_skip]
+
+    # Create pytest.param objects
+    samples = []
+    for filename in sorted(files_to_test):
+        sample_path = os.path.join(target_folder, filename)
+        test_id = filename.replace(".py", "")
+        samples.append(pytest.param(sample_path, id=test_id))
+
+    return samples
+
+
+class BaseSampleExecutor:
+    """Base helper class for executing sample files with proper environment setup.
+
+    This class contains all shared logic that doesn't require async/aio imports.
+    Subclasses implement sync/async specific credential and execution logic.
+    """
+
+    class TestReport(BaseModel):
+        """Schema for validation test report."""
+
+        model_config = {"extra": "forbid"}
+        correct: bool
+        reason: str
+
+    def __init__(self, test_instance, sample_path: str, env_var_mapping: dict[str, str], **kwargs):
+        self.test_instance = test_instance
+        self.sample_path = sample_path
+        self.print_calls: list[str] = []
+        self._original_print = print
+
+        # Prepare environment variables
+        self.env_vars = {}
+        for sample_var, test_var in env_var_mapping.items():
+            value = kwargs.pop(test_var, None)
+            if value is not None:
+                self.env_vars[sample_var] = value
+
+        # Add the sample's directory to sys.path so it can import local modules
+        self.sample_dir = os.path.dirname(sample_path)
+        if self.sample_dir not in sys.path:
+            sys.path.insert(0, self.sample_dir)
+
+        # Create module spec for dynamic import
+        module_name = os.path.splitext(os.path.basename(self.sample_path))[0]
+        spec = importlib.util.spec_from_file_location(module_name, self.sample_path)
+        if spec is None or spec.loader is None:
+            raise ImportError(f"Could not load module {module_name} from {self.sample_path}")
+
+        self.module = importlib.util.module_from_spec(spec)
+        self.spec = spec
+
+    def _capture_print(self, *args, **kwargs):
+        """Capture print calls while still outputting to console."""
+        self.print_calls.append(" ".join(str(arg) for arg in args))
+        self._original_print(*args, **kwargs)
+
+    def _get_validation_request_params(self, instructions: str, model: str = "gpt-4o") -> dict:
+        """Get common parameters for validation request."""
+        return {
+            "model": model,
+            "instructions": instructions,
+            "text": {
+                "format": {
+                    "type": "json_schema",
+                    "name": "TestReport",
+                    "schema": self.TestReport.model_json_schema(),
+                }
+            },
+            # The input field is sanitized in recordings (see conftest.py) by matching the unique prefix
+            # "print contents array = ". This allows sample print statements to change without breaking playback.
+            # The instructions field is preserved as-is in recordings. If you modify the instructions,
+            # you must re-record the tests.
+            "input": f"print contents array = {self.print_calls}",
+        }
+
+    def _assert_validation_result(self, test_report: dict) -> None:
+        """Assert validation result and print reason."""
+        if not test_report["correct"]:
+            # Write print statements to log file in temp folder for debugging
+            import tempfile
+            from datetime import datetime
+
+            timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
+            log_file = os.path.join(tempfile.gettempdir(), f"sample_validation_error_{timestamp}.log")
+            with open(log_file, "w") as f:
+                f.write(f"Sample: {self.sample_path}\n")
+                f.write(f"Validation Error: {test_report['reason']}\n\n")
+                f.write("Print Statements:\n")
+                f.write("=" * 80 + "\n")
+                for i, print_call in enumerate(self.print_calls, 1):
+                    f.write(f"{i}. {print_call}\n")
+            print(f"\nValidation failed! Print statements logged to: {log_file}")
+        assert test_report["correct"], f"Error is identified: {test_report['reason']}"
+        print(f"Reason: {test_report['reason']}")
+
+
+class SamplePathPasser:
+    """Decorator for passing sample path to test functions."""
+
+    def __call__(self, fn):
+        if inspect.iscoroutinefunction(fn):
+
+            async def _wrapper_async(test_class, sample_path, **kwargs):
+                return await fn(test_class, sample_path, **kwargs)
+
+            return _wrapper_async
+        else:
+
+            def _wrapper_sync(test_class, sample_path, **kwargs):
+                return fn(test_class, sample_path, **kwargs)
+
+            return _wrapper_sync
+
+
+class SyncSampleExecutor(BaseSampleExecutor):
+    """Synchronous sample executor that only uses sync credentials."""
+
+    def __init__(self, test_instance, sample_path: str, env_var_mapping: dict[str, str], **kwargs):
+        super().__init__(test_instance, sample_path, env_var_mapping, **kwargs)
+        self.tokenCredential: TokenCredential | FakeTokenCredential | None = None
+
+    def _get_mock_credential(self):
+        """Get a mock credential that supports context manager protocol."""
+        self.tokenCredential = self.test_instance.get_credential(AIProjectClient, is_async=False)
+        patch_target = "azure.identity.DefaultAzureCredential"
+
+        # Create a mock that returns a context manager wrapping the credential
+        mock_credential_class = mock.MagicMock()
+        mock_credential_class.return_value.__enter__ = mock.MagicMock(return_value=self.tokenCredential)
+        mock_credential_class.return_value.__exit__ = mock.MagicMock(return_value=None)
+
+        return mock.patch(patch_target, new=mock_credential_class)
+
+    def execute(self):
+        """Execute a synchronous sample with proper mocking and environment setup."""
+        from test_base import patched_open_crlf_to_lf
+
+        with (
+            MonkeyPatch.context() as mp,
+            self._get_mock_credential(),
+        ):
+            for var_name, var_value in self.env_vars.items():
+                mp.setenv(var_name, var_value)
+            if self.spec.loader is None:
+                raise ImportError(f"Could not load module {self.spec.name} from {self.sample_path}")
+
+            with (
+                mock.patch("builtins.print", side_effect=self._capture_print),
+                mock.patch("builtins.open", side_effect=patched_open_crlf_to_lf),
+            ):
+                self.spec.loader.exec_module(self.module)
+
+    def validate_print_calls_by_llm(
+        self,
+        *,
+        instructions: str,
+        project_endpoint: str,
+        model: str = "gpt-4o",
+    ):
+        """Validate captured print output using synchronous OpenAI client."""
+        if not instructions or not instructions.strip():
+            raise ValueError("instructions must be a non-empty string")
+        if not project_endpoint:
+            raise ValueError("project_endpoint must be provided")
+        endpoint = project_endpoint
+        print(f"For validating console output, creating AIProjectClient with endpoint: {endpoint}")
+        assert isinstance(self.tokenCredential, TokenCredential) or isinstance(
+            self.tokenCredential, FakeTokenCredential
+        )
+        with (
+            AIProjectClient(
+                endpoint=endpoint, credential=cast(TokenCredential, self.tokenCredential)
+            ) as project_client,
+            project_client.get_openai_client() as openai_client,
+        ):
+            response = openai_client.responses.create(**self._get_validation_request_params(instructions, model=model))
+            test_report = json.loads(response.output_text)
+            self._assert_validation_result(test_report)
+
+
+class AsyncSampleExecutor(BaseSampleExecutor):
+    """Asynchronous sample executor that uses async credentials."""
+
+    def __init__(self, test_instance, sample_path: str, env_var_mapping: dict[str, str], **kwargs):
+        super().__init__(test_instance, sample_path, env_var_mapping, **kwargs)
+        self.tokenCredential: AsyncTokenCredential | AsyncFakeCredential | None = None
+
+    def _get_mock_credential(self):
+        """Get a mock credential that supports async context manager protocol."""
+        self.tokenCredential = self.test_instance.get_credential(AsyncAIProjectClient, is_async=True)
+        patch_target = "azure.identity.aio.DefaultAzureCredential"
+
+        # Create a mock that returns an async context manager wrapping the credential
+        mock_credential_class = mock.MagicMock()
+        mock_credential_class.return_value.__aenter__ = mock.AsyncMock(return_value=self.tokenCredential)
+        mock_credential_class.return_value.__aexit__ = mock.AsyncMock(return_value=None)
+
+        return mock.patch(patch_target, new=mock_credential_class)
+
+    async def execute_async(self):
+        """Execute an asynchronous sample with proper mocking and environment setup."""
+        from test_base import patched_open_crlf_to_lf
+
+        with (
+            MonkeyPatch.context() as mp,
+            self._get_mock_credential(),
+            mock.patch("builtins.print", side_effect=self._capture_print),
+            mock.patch("builtins.open", side_effect=patched_open_crlf_to_lf),
+        ):
+            for var_name, var_value in self.env_vars.items():
+                mp.setenv(var_name, var_value)
+            if self.spec.loader is None:
+                raise ImportError(f"Could not load module {self.spec.name} from {self.sample_path}")
+            self.spec.loader.exec_module(self.module)
+            await self.module.main()
+
+    async def validate_print_calls_by_llm(
+        self,
+        *,
+        instructions: str,
+        project_endpoint: str,
+        model: str = "gpt-4o",
+    ):
+        """Validate captured print output using asynchronous OpenAI client."""
+        if not instructions or not instructions.strip():
+            raise ValueError("instructions must be a non-empty string")
+        if not project_endpoint:
+            raise ValueError("project_endpoint must be provided")
+        endpoint = project_endpoint
+        print(f"For validating console output, creating AIProjectClient with endpoint: {endpoint}")
+        assert isinstance(self.tokenCredential, AsyncTokenCredential) or isinstance(
+            self.tokenCredential, AsyncFakeCredential
+        )
+        async with (
+            AsyncAIProjectClient(
+                endpoint=endpoint, credential=cast(AsyncTokenCredential, self.tokenCredential)
+            ) as project_client,
+        ):
+            async with project_client.get_openai_client() as openai_client:
+                response = await openai_client.responses.create(
+                    **self._get_validation_request_params(instructions, model=model)
+                )
+                test_report = json.loads(response.output_text)
+                self._assert_validation_result(test_report)
diff --git a/sdk/ai/azure-ai-projects/tests/samples/sample_executor_helpers.py b/sdk/ai/azure-ai-projects/tests/samples/sample_executor_helpers.py
deleted file mode 100644
index 8697362b1631..000000000000
--- a/sdk/ai/azure-ai-projects/tests/samples/sample_executor_helpers.py
+++ /dev/null
@@ -1,206 +0,0 @@
-# pylint: disable=line-too-long,useless-suppression
-# ------------------------------------
-# Copyright (c) Microsoft Corporation.
-# Licensed under the MIT License.
-# ------------------------------------
-"""Shared base code for sample tests - sync dependencies only."""
-import os
-import sys
-import pytest
-import inspect
-import importlib.util
-from typing import Optional
-from pydantic import BaseModel
-
-
-class BaseSampleExecutor:
-    """Base helper class for executing sample files with proper environment setup.
-
-    This class contains all shared logic that doesn't require async/aio imports.
-    Subclasses implement sync/async specific credential and execution logic.
-    """
-
-    class TestReport(BaseModel):
-        """Schema for validation test report."""
-
-        model_config = {"extra": "forbid"}
-        correct: bool
-        reason: str
-
-    def __init__(self, test_instance, sample_path: str, env_var_mapping: dict[str, str], **kwargs):
-        self.test_instance = test_instance
-        self.sample_path = sample_path
-        self.print_calls: list[str] = []
-        self._original_print = print
-
-        # Prepare environment variables
-        self.env_vars = {}
-        for sample_var, test_var in env_var_mapping.items():
-            value = kwargs.pop(test_var, None)
-            if value is not None:
-                self.env_vars[sample_var] = value
-
-        # Add the sample's directory to sys.path so it can import local modules
-        self.sample_dir = os.path.dirname(sample_path)
-        if self.sample_dir not in sys.path:
-            sys.path.insert(0, self.sample_dir)
-
-        # Create module spec for dynamic import
-        module_name = os.path.splitext(os.path.basename(self.sample_path))[0]
-        spec = importlib.util.spec_from_file_location(module_name, self.sample_path)
-        if spec is None or spec.loader is None:
-            raise ImportError(f"Could not load module {module_name} from {self.sample_path}")
-
-        self.module = importlib.util.module_from_spec(spec)
-        self.spec = spec
-
-    def _capture_print(self, *args, **kwargs):
-        """Capture print calls while still outputting to console."""
-        self.print_calls.append(" ".join(str(arg) for arg in args))
-        self._original_print(*args, **kwargs)
-
-    def _get_validation_request_params(self) -> dict:
-        """Get common parameters for validation request."""
-        return {
-            "model": "gpt-4o",
-            "instructions": """We just run Python code and captured a Python array of print statements.
-Validating the printed content to determine if correct or not:
-Respond false if any entries show:
-- Error messages or exception text
-- Empty or null results where data is expected
-- Malformed or corrupted data
-- Timeout or connection errors
-- Warning messages indicating failures
-- Failure to retrieve or process data
-- Statements saying documents/information didn't provide relevant data
-- Statements saying unable to find/retrieve information
-- Asking the user to specify, clarify, or provide more details
-- Suggesting to use other tools or sources
-- Asking follow-up questions to complete the task
-- Indicating lack of knowledge or missing information
-- Responses that defer answering or redirect the question
-Respond with true only if the result provides a complete, substantive answer with actual data/information.
-Always respond with `reason` indicating the reason for the response.""",
-            "text": {
-                "format": {
-                    "type": "json_schema",
-                    "name": "TestReport",
-                    "schema": self.TestReport.model_json_schema(),
-                }
-            },
-            # The input field is sanitized in recordings (see conftest.py) by matching the unique prefix
-            # "print contents array = ". This allows sample print statements to change without breaking playback.
-            # The instructions field is preserved as-is in recordings. If you modify the instructions,
-            # you must re-record the tests.
-            "input": f"print contents array = {self.print_calls}",
-        }
-
-    def _assert_validation_result(self, test_report: dict) -> None:
-        """Assert validation result and print reason."""
-        if not test_report["correct"]:
-            # Write print statements to log file in temp folder for debugging
-            import tempfile
-            from datetime import datetime
-
-            timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
-            log_file = os.path.join(tempfile.gettempdir(), f"sample_validation_error_{timestamp}.log")
-            with open(log_file, "w") as f:
-                f.write(f"Sample: {self.sample_path}\n")
-                f.write(f"Validation Error: {test_report['reason']}\n\n")
-                f.write("Print Statements:\n")
-                f.write("=" * 80 + "\n")
-                for i, print_call in enumerate(self.print_calls, 1):
-                    f.write(f"{i}. {print_call}\n")
-            print(f"\nValidation failed! Print statements logged to: {log_file}")
-        assert test_report["correct"], f"Error is identified: {test_report['reason']}"
-        print(f"Reason: {test_report['reason']}")
-
-
-class SamplePathPasser:
-    """Decorator for passing sample path to test functions."""
-
-    def __call__(self, fn):
-        if inspect.iscoroutinefunction(fn):
-
-            async def _wrapper_async(test_class, sample_path, **kwargs):
-                return await fn(test_class, sample_path, **kwargs)
-
-            return _wrapper_async
-        else:
-
-            def _wrapper_sync(test_class, sample_path, **kwargs):
-                return fn(test_class, sample_path, **kwargs)
-
-            return _wrapper_sync
-
-
-def get_sample_paths(
-    sub_folder: str,
-    *,
-    samples_to_skip: Optional[list[str]] = None,
-    is_async: Optional[bool] = False,
-) -> list:
-    """Get list of sample paths for testing."""
-    # Get the path to the samples folder
-    current_dir = os.path.dirname(os.path.abspath(__file__))
-    samples_folder_path = os.path.normpath(os.path.join(current_dir, os.pardir, os.pardir))
-    target_folder = os.path.join(samples_folder_path, "samples", *sub_folder.split("/"))
-
-    if not os.path.exists(target_folder):
-        raise ValueError(f"Target folder does not exist: {target_folder}")
-
-    print("Target folder for samples:", target_folder)
-    print("is_async:", is_async)
-    print("samples_to_skip:", samples_to_skip)
-    # Discover all sync or async sample files in the folder
-    all_files = [
-        f
-        for f in os.listdir(target_folder)
-        if (
-            f.startswith("sample_")
-            and (f.endswith("_async.py") if is_async else (f.endswith(".py") and not f.endswith("_async.py")))
-        )
-    ]
-
-    if samples_to_skip:
-        files_to_test = [f for f in all_files if f not in samples_to_skip]
-    else:
-        files_to_test = all_files
-
-    print(f"Running the following samples as test:\n{files_to_test}")
-
-    # Create pytest.param objects
-    samples = []
-    for filename in sorted(files_to_test):
-        sample_path = os.path.join(target_folder, filename)
-        test_id = filename.replace(".py", "")
-        samples.append(pytest.param(sample_path, id=test_id))
-
-    return samples
-
-
-def get_sample_environment_variables_map(operation_group: Optional[str] = None) -> dict[str, str]:
-    """Get the mapping of sample environment variables to test environment variables.
-
-    Args:
-        operation_group: Optional operation group name (e.g., "agents") to scope the endpoint variable.
-
-    Returns:
-        Dictionary mapping sample env var names to test env var names.
-    """
-    return {
-        "AZURE_AI_PROJECT_ENDPOINT": (
-            "azure_ai_projects_tests_project_endpoint"
-            if operation_group is None
-            else f"azure_ai_projects_tests_{operation_group}_project_endpoint"
-        ),
-        "AZURE_AI_MODEL_DEPLOYMENT_NAME": "azure_ai_projects_tests_model_deployment_name",
-        "IMAGE_GENERATION_MODEL_DEPLOYMENT_NAME": "azure_ai_projects_tests_image_generation_model_deployment_name",
-        "AI_SEARCH_PROJECT_CONNECTION_ID": "azure_ai_projects_tests_ai_search_project_connection_id",
-        "AI_SEARCH_INDEX_NAME": "azure_ai_projects_tests_ai_search_index_name",
-        "AI_SEARCH_USER_INPUT": "azure_ai_projects_tests_ai_search_user_input",
-        "SHAREPOINT_USER_INPUT": "azure_ai_projects_tests_sharepoint_user_input",
-        "SHAREPOINT_PROJECT_CONNECTION_ID": "azure_ai_projects_tests_sharepoint_project_connection_id",
-        "MEMORY_STORE_CHAT_MODEL_DEPLOYMENT_NAME": "azure_ai_projects_tests_memory_store_chat_model_deployment_name",
-        "MEMORY_STORE_EMBEDDING_MODEL_DEPLOYMENT_NAME": "azure_ai_projects_tests_memory_store_embedding_model_deployment_name",
-    }
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
index f606368a3b12..1c34cffb44c1 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
@@ -4,90 +4,11 @@
 # Licensed under the MIT License.
 # ------------------------------------
 import os
-import json
-import unittest.mock as mock
-from typing import cast
 import pytest
-from azure.core.credentials import TokenCredential
-from devtools_testutils.fake_credentials import FakeTokenCredential
 from devtools_testutils import recorded_by_proxy, AzureRecordedTestCase, RecordedTransport
-from azure.ai.projects import AIProjectClient
-from pytest import MonkeyPatch
 from test_base import servicePreparer
-from sample_executor_helpers import (
-    BaseSampleExecutor,
-    SamplePathPasser,
-    get_sample_paths,
-    get_sample_environment_variables_map,
-)
-
-
-class SyncSampleExecutor(BaseSampleExecutor):
-    """Synchronous sample executor that only uses sync credentials."""
-
-    def __init__(self, test_instance, sample_path: str, env_var_mapping: dict[str, str], **kwargs):
-        super().__init__(test_instance, sample_path, env_var_mapping, **kwargs)
-        self.tokenCredential: TokenCredential | FakeTokenCredential | None = None
-
-    def _get_mock_credential(self):
-        """Get a mock credential that supports context manager protocol."""
-        self.tokenCredential = self.test_instance.get_credential(AIProjectClient, is_async=False)
-        patch_target = "azure.identity.DefaultAzureCredential"
-
-        # Create a mock that returns a context manager wrapping the credential
-        mock_credential_class = mock.MagicMock()
-        mock_credential_class.return_value.__enter__ = mock.MagicMock(return_value=self.tokenCredential)
-        mock_credential_class.return_value.__exit__ = mock.MagicMock(return_value=None)
-
-        return mock.patch(patch_target, new=mock_credential_class)
-
-    def execute(self, enable_llm_validation: bool = True, patched_open_fn=None):
-        """Execute a synchronous sample with proper mocking and environment setup."""
-        # Import patched_open_crlf_to_lf here to avoid circular import
-        if patched_open_fn is None:
-            from test_base import patched_open_crlf_to_lf
-
-            patched_open_fn = patched_open_crlf_to_lf
-
-        with (
-            MonkeyPatch.context() as mp,
-            self._get_mock_credential(),
-        ):
-            for var_name, var_value in self.env_vars.items():
-                mp.setenv(var_name, var_value)
-
-            self._execute_module(patched_open_fn)
-
-            if enable_llm_validation:
-                self._validate_output()
-
-    def _execute_module(self, patched_open_fn):
-        """Execute the module with environment setup and mocking."""
-        if self.spec.loader is None:
-            raise ImportError(f"Could not load module {self.spec.name} from {self.sample_path}")
-
-        with (
-            mock.patch("builtins.print", side_effect=self._capture_print),
-            mock.patch("builtins.open", side_effect=patched_open_fn),
-        ):
-            self.spec.loader.exec_module(self.module)
-
-    def _validate_output(self):
-        """Validate sample output using synchronous OpenAI client."""
-        endpoint = os.environ["AZURE_AI_PROJECT_ENDPOINT"]
-        print(f"For validating console output, creating AIProjectClient with endpoint: {endpoint}")
-        assert isinstance(self.tokenCredential, TokenCredential) or isinstance(
-            self.tokenCredential, FakeTokenCredential
-        )
-        with (
-            AIProjectClient(
-                endpoint=endpoint, credential=cast(TokenCredential, self.tokenCredential)
-            ) as project_client,
-            project_client.get_openai_client() as openai_client,
-        ):
-            response = openai_client.responses.create(**self._get_validation_request_params())
-            test_report = json.loads(response.output_text)
-            self._assert_validation_result(test_report)
+from sample_executor import SyncSampleExecutor, get_sample_paths, SamplePathPasser
+from test_samples_helpers import agent_tools_instructions, get_sample_environment_variables_map
 
 
 class TestSamples(AzureRecordedTestCase):
@@ -108,7 +29,6 @@ class TestSamples(AzureRecordedTestCase):
                 "sample_agent_openapi_with_project_connection.py",
                 "sample_agent_to_agent.py",
             ],
-            is_async=False,
         ),
     )
     @SamplePathPasser()
@@ -117,3 +37,7 @@ def test_agent_tools_samples(self, sample_path: str, **kwargs) -> None:
         env_var_mapping = get_sample_environment_variables_map(operation_group="agents")
         executor = SyncSampleExecutor(self, sample_path, env_var_mapping, **kwargs)
         executor.execute()
+        executor.validate_print_calls_by_llm(
+            instructions=agent_tools_instructions,
+            project_endpoint=os.environ["AZURE_AI_PROJECT_ENDPOINT"],
+        )
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
index 72e0ba9b7f33..276918b37207 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
@@ -4,93 +4,12 @@
 # Licensed under the MIT License.
 # ------------------------------------
 import os
-import json
-import unittest.mock as mock
-from typing import cast
 import pytest
-from azure.core.credentials_async import AsyncTokenCredential
-from devtools_testutils.fake_credentials_async import AsyncFakeCredential
 from devtools_testutils.aio import recorded_by_proxy_async
 from devtools_testutils import AzureRecordedTestCase, RecordedTransport
-from azure.ai.projects.aio import AIProjectClient as AsyncAIProjectClient
-from pytest import MonkeyPatch
 from test_base import servicePreparer
-from sample_executor_helpers import (
-    BaseSampleExecutor,
-    SamplePathPasser,
-    get_sample_paths,
-    get_sample_environment_variables_map,
-)
-
-
-class AsyncSampleExecutor(BaseSampleExecutor):
-    """Asynchronous sample executor that uses async credentials."""
-
-    def __init__(self, test_instance, sample_path: str, env_var_mapping: dict[str, str], **kwargs):
-        super().__init__(test_instance, sample_path, env_var_mapping, **kwargs)
-        self.tokenCredential: AsyncTokenCredential | AsyncFakeCredential | None = None
-
-    def _get_mock_credential(self):
-        """Get a mock credential that supports async context manager protocol."""
-        self.tokenCredential = self.test_instance.get_credential(AsyncAIProjectClient, is_async=True)
-        patch_target = "azure.identity.aio.DefaultAzureCredential"
-
-        # Create a mock that returns an async context manager wrapping the credential
-        mock_credential_class = mock.MagicMock()
-        mock_credential_class.return_value.__aenter__ = mock.AsyncMock(return_value=self.tokenCredential)
-        mock_credential_class.return_value.__aexit__ = mock.AsyncMock(return_value=None)
-
-        return mock.patch(patch_target, new=mock_credential_class)
-
-    async def execute_async(self, enable_llm_validation: bool = True, patched_open_fn=None):
-        """Execute an asynchronous sample with proper mocking and environment setup."""
-        # Import patched_open_crlf_to_lf here to avoid circular import
-        if patched_open_fn is None:
-            from test_base import patched_open_crlf_to_lf
-
-            patched_open_fn = patched_open_crlf_to_lf
-
-        with (
-            MonkeyPatch.context() as mp,
-            self._get_mock_credential(),
-            mock.patch("builtins.print", side_effect=self._capture_print),
-            mock.patch("builtins.open", side_effect=patched_open_fn),
-        ):
-            for var_name, var_value in self.env_vars.items():
-                mp.setenv(var_name, var_value)
-
-            self._execute_module()
-            await self.module.main()
-
-            if enable_llm_validation:
-                await self._validate_output_async()
-
-    def _execute_module(self):
-        """Execute the module without applying patches (patches applied at caller level)."""
-        if self.spec.loader is None:
-            raise ImportError(f"Could not load module {self.spec.name} from {self.sample_path}")
-        self.spec.loader.exec_module(self.module)
-
-    async def _validate_output_async(self):
-        """Validate sample output using asynchronous OpenAI client."""
-        endpoint = os.environ["AZURE_AI_PROJECT_ENDPOINT"]
-        print(f"For validating console output, creating AIProjectClient with endpoint: {endpoint}")
-        assert isinstance(self.tokenCredential, AsyncTokenCredential) or isinstance(
-            self.tokenCredential, AsyncFakeCredential
-        )
-        async with (
-            AsyncAIProjectClient(
-                endpoint=endpoint, credential=cast(AsyncTokenCredential, self.tokenCredential)
-            ) as project_client,
-        ):
-            async with project_client.get_openai_client() as openai_client:
-                response = await openai_client.responses.create(**self._get_validation_request_params())
-                test_report = json.loads(response.output_text)
-                self._assert_validation_result(test_report)
-
-
-def _get_async_sample_paths(sub_folder: str, *, samples_to_skip: list[str]) -> list:
-    return get_sample_paths(sub_folder, samples_to_skip=samples_to_skip, is_async=True)
+from sample_executor import AsyncSampleExecutor, get_async_sample_paths, SamplePathPasser
+from test_samples_helpers import agent_tools_instructions, get_sample_environment_variables_map
 
 
 class TestSamplesAsync(AzureRecordedTestCase):
@@ -101,7 +20,7 @@ class TestSamplesAsync(AzureRecordedTestCase):
     @servicePreparer()
     @pytest.mark.parametrize(
         "sample_path",
-        _get_async_sample_paths(
+        get_async_sample_paths(
             "agents/tools",
             samples_to_skip=[
                 "sample_agent_mcp_with_project_connection_async.py",
@@ -114,3 +33,7 @@ async def test_agent_tools_samples_async(self, sample_path: str, **kwargs) -> No
         env_var_mapping = get_sample_environment_variables_map(operation_group="agents")
         executor = AsyncSampleExecutor(self, sample_path, env_var_mapping, **kwargs)
         await executor.execute_async()
+        await executor.validate_print_calls_by_llm(
+            instructions=agent_tools_instructions,
+            project_endpoint=os.environ["AZURE_AI_PROJECT_ENDPOINT"],
+        )
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples_helpers.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples_helpers.py
new file mode 100644
index 000000000000..04ab548f57ab
--- /dev/null
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples_helpers.py
@@ -0,0 +1,54 @@
+# pylint: disable=line-too-long,useless-suppression
+# ------------------------------------
+# Copyright (c) Microsoft Corporation.
+# Licensed under the MIT License.
+# ------------------------------------
+"""Shared base code for sample tests - sync dependencies only."""
+from typing import Optional
+
+
+agent_tools_instructions = """We just run Python code and captured a Python array of print statements.
+Validating the printed content to determine if correct or not:
+Respond false if any entries show:
+- Error messages or exception text
+- Empty or null results where data is expected
+- Malformed or corrupted data
+- Timeout or connection errors
+- Warning messages indicating failures
+- Failure to retrieve or process data
+- Statements saying documents/information didn't provide relevant data
+- Statements saying unable to find/retrieve information
+- Asking the user to specify, clarify, or provide more details
+- Suggesting to use other tools or sources
+- Asking follow-up questions to complete the task
+- Indicating lack of knowledge or missing information
+- Responses that defer answering or redirect the question
+Respond with true only if the result provides a complete, substantive answer with actual data/information.
+Always respond with `reason` indicating the reason for the response."""
+
+
+def get_sample_environment_variables_map(operation_group: Optional[str] = None) -> dict[str, str]:
+    """Get the mapping of sample environment variables to test environment variables.
+
+    Args:
+        operation_group: Optional operation group name (e.g., "agents") to scope the endpoint variable.
+
+    Returns:
+        Dictionary mapping sample env var names to test env var names.
+    """
+    return {
+        "AZURE_AI_PROJECT_ENDPOINT": (
+            "azure_ai_projects_tests_project_endpoint"
+            if operation_group is None
+            else f"azure_ai_projects_tests_{operation_group}_project_endpoint"
+        ),
+        "AZURE_AI_MODEL_DEPLOYMENT_NAME": "azure_ai_projects_tests_model_deployment_name",
+        "IMAGE_GENERATION_MODEL_DEPLOYMENT_NAME": "azure_ai_projects_tests_image_generation_model_deployment_name",
+        "AI_SEARCH_PROJECT_CONNECTION_ID": "azure_ai_projects_tests_ai_search_project_connection_id",
+        "AI_SEARCH_INDEX_NAME": "azure_ai_projects_tests_ai_search_index_name",
+        "AI_SEARCH_USER_INPUT": "azure_ai_projects_tests_ai_search_user_input",
+        "SHAREPOINT_USER_INPUT": "azure_ai_projects_tests_sharepoint_user_input",
+        "SHAREPOINT_PROJECT_CONNECTION_ID": "azure_ai_projects_tests_sharepoint_project_connection_id",
+        "MEMORY_STORE_CHAT_MODEL_DEPLOYMENT_NAME": "azure_ai_projects_tests_memory_store_chat_model_deployment_name",
+        "MEMORY_STORE_EMBEDDING_MODEL_DEPLOYMENT_NAME": "azure_ai_projects_tests_memory_store_embedding_model_deployment_name",
+    }
diff --git a/sdk/ai/azure-ai-projects/tests/test_base.py b/sdk/ai/azure-ai-projects/tests/test_base.py
index 3395505f2965..06f8f68ec195 100644
--- a/sdk/ai/azure-ai-projects/tests/test_base.py
+++ b/sdk/ai/azure-ai-projects/tests/test_base.py
@@ -70,6 +70,14 @@
     azure_ai_projects_tests_memory_store_embedding_model_deployment_name="text-embedding-ada-002",
 )
 
+# Load secrets from environment variables
+originalServicePreparer = functools.partial(
+    EnvironmentVariableLoader,
+    "",
+    azure_ai_project_endpoint="https://sanitized-account-name.services.ai.azure.com/api/projects/sanitized-project-name",
+    azure_ai_model_deployment_name="gpt-4o",
+)
+
 # Fine-tuning job type constants
 SFT_JOB_TYPE: Final[str] = "sft"
 DPO_JOB_TYPE: Final[str] = "dpo"

From a4afb39d07382fd400a5c2c826c010b6562c6c69 Mon Sep 17 00:00:00 2001
From: Howie Leung <howieleung@microsoft.com>
Date: Mon, 29 Dec 2025 11:39:41 -0800
Subject: [PATCH 02/11] restore patched_open_fn

---
 .../tests/samples/sample_executor.py          | 22 +++++++++++++------
 1 file changed, 15 insertions(+), 7 deletions(-)

diff --git a/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
index 0788356daa7f..de95e6212006 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
@@ -270,9 +270,13 @@ def _get_mock_credential(self):
 
         return mock.patch(patch_target, new=mock_credential_class)
 
-    def execute(self):
+    def execute(self, patched_open_fn=None):
         """Execute a synchronous sample with proper mocking and environment setup."""
-        from test_base import patched_open_crlf_to_lf
+        # Import patched_open_crlf_to_lf here to avoid circular import
+        if patched_open_fn is None:
+            from test_base import patched_open_crlf_to_lf
+
+            patched_open_fn = patched_open_crlf_to_lf
 
         with (
             MonkeyPatch.context() as mp,
@@ -285,7 +289,7 @@ def execute(self):
 
             with (
                 mock.patch("builtins.print", side_effect=self._capture_print),
-                mock.patch("builtins.open", side_effect=patched_open_crlf_to_lf),
+                mock.patch("builtins.open", side_effect=patched_open_fn),
             ):
                 self.spec.loader.exec_module(self.module)
 
@@ -336,15 +340,19 @@ def _get_mock_credential(self):
 
         return mock.patch(patch_target, new=mock_credential_class)
 
-    async def execute_async(self):
-        """Execute an asynchronous sample with proper mocking and environment setup."""
-        from test_base import patched_open_crlf_to_lf
+    async def execute(self, patched_open_fn=None):
+        """Execute a synchronous sample with proper mocking and environment setup."""
+        # Import patched_open_crlf_to_lf here to avoid circular import
+        if patched_open_fn is None:
+            from test_base import patched_open_crlf_to_lf
+
+            patched_open_fn = patched_open_crlf_to_lf
 
         with (
             MonkeyPatch.context() as mp,
             self._get_mock_credential(),
             mock.patch("builtins.print", side_effect=self._capture_print),
-            mock.patch("builtins.open", side_effect=patched_open_crlf_to_lf),
+            mock.patch("builtins.open", side_effect=patched_open_fn),
         ):
             for var_name, var_value in self.env_vars.items():
                 mp.setenv(var_name, var_value)

From 4e0636f791b6988d0ec14ef42e60437b5062af20 Mon Sep 17 00:00:00 2001
From: Howie Leung <howieleung@microsoft.com>
Date: Mon, 29 Dec 2025 13:13:45 -0800
Subject: [PATCH 03/11] fix bugs and resolved comment

---
 sdk/ai/azure-ai-projects/tests/samples/sample_executor.py | 7 ++-----
 sdk/ai/azure-ai-projects/tests/samples/test_samples.py    | 2 +-
 .../azure-ai-projects/tests/samples/test_samples_async.py | 2 +-
 sdk/ai/azure-ai-projects/tests/test_base.py               | 8 --------
 4 files changed, 4 insertions(+), 15 deletions(-)

diff --git a/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
index de95e6212006..ac3ab7ceaa11 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
@@ -15,12 +15,10 @@
 import json
 import unittest.mock as mock
 from typing import cast
-import pytest
 from azure.core.credentials import TokenCredential
 from azure.core.credentials_async import AsyncTokenCredential
 from devtools_testutils.fake_credentials import FakeTokenCredential
 from devtools_testutils.fake_credentials_async import AsyncFakeCredential
-from devtools_testutils import recorded_by_proxy, AzureRecordedTestCase, RecordedTransport
 from azure.ai.projects import AIProjectClient
 from pytest import MonkeyPatch
 from azure.ai.projects.aio import AIProjectClient as AsyncAIProjectClient
@@ -86,7 +84,6 @@ def get_async_sample_paths(sub_folder: str, *, samples_to_skip: list[str]) -> li
     Args:
         sub_folder: Relative path to the samples subfolder (e.g., "agents/tools")
         samples_to_skip: Blacklist of sample filenames to exclude (auto-discovers all samples)
-        is_async: Whether to filter for async samples (_async.py suffix)
 
     Returns:
         List of pytest.param objects with sample paths and test IDs
@@ -340,8 +337,8 @@ def _get_mock_credential(self):
 
         return mock.patch(patch_target, new=mock_credential_class)
 
-    async def execute(self, patched_open_fn=None):
-        """Execute a synchronous sample with proper mocking and environment setup."""
+    async def execute_async(self, patched_open_fn=None):
+        """Execute an asynchronous sample with proper mocking and environment setup."""
         # Import patched_open_crlf_to_lf here to avoid circular import
         if patched_open_fn is None:
             from test_base import patched_open_crlf_to_lf
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
index 1c34cffb44c1..8597d4f9289e 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
@@ -39,5 +39,5 @@ def test_agent_tools_samples(self, sample_path: str, **kwargs) -> None:
         executor.execute()
         executor.validate_print_calls_by_llm(
             instructions=agent_tools_instructions,
-            project_endpoint=os.environ["AZURE_AI_PROJECT_ENDPOINT"],
+            project_endpoint=os.environ["azure_ai_projects_agents_project_endpoint"],
         )
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
index 276918b37207..46ed99daee12 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
@@ -35,5 +35,5 @@ async def test_agent_tools_samples_async(self, sample_path: str, **kwargs) -> No
         await executor.execute_async()
         await executor.validate_print_calls_by_llm(
             instructions=agent_tools_instructions,
-            project_endpoint=os.environ["AZURE_AI_PROJECT_ENDPOINT"],
+            project_endpoint=os.environ["azure_ai_projects_agents_project_endpoint"],
         )
diff --git a/sdk/ai/azure-ai-projects/tests/test_base.py b/sdk/ai/azure-ai-projects/tests/test_base.py
index 06f8f68ec195..3395505f2965 100644
--- a/sdk/ai/azure-ai-projects/tests/test_base.py
+++ b/sdk/ai/azure-ai-projects/tests/test_base.py
@@ -70,14 +70,6 @@
     azure_ai_projects_tests_memory_store_embedding_model_deployment_name="text-embedding-ada-002",
 )
 
-# Load secrets from environment variables
-originalServicePreparer = functools.partial(
-    EnvironmentVariableLoader,
-    "",
-    azure_ai_project_endpoint="https://sanitized-account-name.services.ai.azure.com/api/projects/sanitized-project-name",
-    azure_ai_model_deployment_name="gpt-4o",
-)
-
 # Fine-tuning job type constants
 SFT_JOB_TYPE: Final[str] = "sft"
 DPO_JOB_TYPE: Final[str] = "dpo"

From 3d6966f66a2f1b22451f209babf10e9f703fb58e Mon Sep 17 00:00:00 2001
From: Howie Leung <howieleung@microsoft.com>
Date: Mon, 29 Dec 2025 13:24:44 -0800
Subject: [PATCH 04/11] clean up

---
 sdk/ai/azure-ai-projects/tests/samples/README.md   |  8 ++++----
 .../tests/samples/sample_executor.py               | 14 +++++++-------
 .../tests/samples/test_samples_async.py            |  2 +-
 3 files changed, 12 insertions(+), 12 deletions(-)

diff --git a/sdk/ai/azure-ai-projects/tests/samples/README.md b/sdk/ai/azure-ai-projects/tests/samples/README.md
index 604dfddb63f3..5e60c062cc41 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/README.md
+++ b/sdk/ai/azure-ai-projects/tests/samples/README.md
@@ -40,7 +40,7 @@ class TestSamples(AzureRecordedTestCase):
         executor.execute()
         executor.validate_print_calls_by_llm(
             instructions=agent_tools_instructions,
-            project_endpoint=os.environ["AZURE_AI_PROJECT_ENDPOINT"],
+            project_endpoint=os.environ["azure_ai_projects_tests_project_endpoint"],
         )        
 ```
 
@@ -72,9 +72,9 @@ class TestSamplesAsync(AzureRecordedTestCase):
         env_var_mapping = get_sample_environment_variables_map()
         executor = AsyncSampleExecutor(self, sample_path, env_var_mapping, **kwargs)
         await executor.execute_async()
-        await executor.validate_print_calls_by_llm(
+        await executor.validate_print_calls_by_llm_async(
             instructions=agent_tools_instructions,
-            project_endpoint=os.environ["AZURE_AI_PROJECT_ENDPOINT"],
+            project_endpoint=os.environ["azure_ai_projects_tests_project_endpoint"],
         )
 ```
 
@@ -106,4 +106,4 @@ def get_sample_environment_variables_map(operation_group: str | None = None) ->
     }
 ```
 - `execute` / `execute_async`: Run the sample; any exception fails the test.
-- `validate_print_calls_by_llm`: Optionally validate captured print output with LLM instructions and an explicit `project_endpoint` (and optional `model`).
+- `validate_print_calls_by_llm` / `validate_print_calls_by_llm_async`: Optionally validate captured print output with LLM instructions and an explicit `project_endpoint` (and optional `model`).
diff --git a/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
index ac3ab7ceaa11..5d2ad0e45d10 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
@@ -358,7 +358,7 @@ async def execute_async(self, patched_open_fn=None):
             self.spec.loader.exec_module(self.module)
             await self.module.main()
 
-    async def validate_print_calls_by_llm(
+    async def validate_print_calls_by_llm_async(
         self,
         *,
         instructions: str,
@@ -379,10 +379,10 @@ async def validate_print_calls_by_llm(
             AsyncAIProjectClient(
                 endpoint=endpoint, credential=cast(AsyncTokenCredential, self.tokenCredential)
             ) as project_client,
+            project_client.get_openai_client() as openai_client,
         ):
-            async with project_client.get_openai_client() as openai_client:
-                response = await openai_client.responses.create(
-                    **self._get_validation_request_params(instructions, model=model)
-                )
-                test_report = json.loads(response.output_text)
-                self._assert_validation_result(test_report)
+            response = await openai_client.responses.create(
+                **self._get_validation_request_params(instructions, model=model)
+            )
+            test_report = json.loads(response.output_text)
+            self._assert_validation_result(test_report)
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
index 46ed99daee12..afebfc9ffa11 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
@@ -33,7 +33,7 @@ async def test_agent_tools_samples_async(self, sample_path: str, **kwargs) -> No
         env_var_mapping = get_sample_environment_variables_map(operation_group="agents")
         executor = AsyncSampleExecutor(self, sample_path, env_var_mapping, **kwargs)
         await executor.execute_async()
-        await executor.validate_print_calls_by_llm(
+        await executor.validate_print_calls_by_llm_async(
             instructions=agent_tools_instructions,
             project_endpoint=os.environ["azure_ai_projects_agents_project_endpoint"],
         )

From 2fd02c093f2408c1a6127c03e029eeb82480e748 Mon Sep 17 00:00:00 2001
From: Howie Leung <howieleung@microsoft.com>
Date: Mon, 29 Dec 2025 23:16:25 -0800
Subject: [PATCH 05/11] update test endpoint

---
 sdk/ai/azure-ai-projects/tests/samples/test_samples.py       | 2 +-
 sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
index 8597d4f9289e..bf1e697dfbc1 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
@@ -39,5 +39,5 @@ def test_agent_tools_samples(self, sample_path: str, **kwargs) -> None:
         executor.execute()
         executor.validate_print_calls_by_llm(
             instructions=agent_tools_instructions,
-            project_endpoint=os.environ["azure_ai_projects_agents_project_endpoint"],
+            project_endpoint=os.environ["azure_ai_projects_tests_agents_project_endpoint"],
         )
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
index afebfc9ffa11..a221f673ee41 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
@@ -35,5 +35,5 @@ async def test_agent_tools_samples_async(self, sample_path: str, **kwargs) -> No
         await executor.execute_async()
         await executor.validate_print_calls_by_llm_async(
             instructions=agent_tools_instructions,
-            project_endpoint=os.environ["azure_ai_projects_agents_project_endpoint"],
+            project_endpoint=os.environ["azure_ai_projects_tests_agents_project_endpoint"],
         )

From 98cca73d21bdda62251bb78f16e5c9355c95dfea Mon Sep 17 00:00:00 2001
From: Howie Leung <howieleung@microsoft.com>
Date: Tue, 30 Dec 2025 09:36:06 -0800
Subject: [PATCH 06/11] update

---
 sdk/ai/azure-ai-projects/tests/samples/README.md             | 5 +++--
 sdk/ai/azure-ai-projects/tests/samples/test_samples.py       | 2 +-
 sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py | 2 +-
 3 files changed, 5 insertions(+), 4 deletions(-)

diff --git a/sdk/ai/azure-ai-projects/tests/samples/README.md b/sdk/ai/azure-ai-projects/tests/samples/README.md
index 5e60c062cc41..df265c7147c5 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/README.md
+++ b/sdk/ai/azure-ai-projects/tests/samples/README.md
@@ -40,7 +40,7 @@ class TestSamples(AzureRecordedTestCase):
         executor.execute()
         executor.validate_print_calls_by_llm(
             instructions=agent_tools_instructions,
-            project_endpoint=os.environ["azure_ai_projects_tests_project_endpoint"],
+            project_endpoint=kwargs["azure_ai_projects_tests_project_endpoint"],
         )        
 ```
 
@@ -74,7 +74,7 @@ class TestSamplesAsync(AzureRecordedTestCase):
         await executor.execute_async()
         await executor.validate_print_calls_by_llm_async(
             instructions=agent_tools_instructions,
-            project_endpoint=os.environ["azure_ai_projects_tests_project_endpoint"],
+            project_endpoint=kwargs["azure_ai_projects_tests_project_endpoint"],
         )
 ```
 
@@ -107,3 +107,4 @@ def get_sample_environment_variables_map(operation_group: str | None = None) ->
 ```
 - `execute` / `execute_async`: Run the sample; any exception fails the test.
 - `validate_print_calls_by_llm` / `validate_print_calls_by_llm_async`: Optionally validate captured print output with LLM instructions and an explicit `project_endpoint` (and optional `model`).
+- `kwargs` in the test function: A dictionary with environment variables in key and value pairs.
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
index bf1e697dfbc1..c6401da64375 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
@@ -39,5 +39,5 @@ def test_agent_tools_samples(self, sample_path: str, **kwargs) -> None:
         executor.execute()
         executor.validate_print_calls_by_llm(
             instructions=agent_tools_instructions,
-            project_endpoint=os.environ["azure_ai_projects_tests_agents_project_endpoint"],
+            project_endpoint=kwargs["azure_ai_projects_tests_agents_project_endpoint"],
         )
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
index a221f673ee41..6f24368c576a 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
@@ -35,5 +35,5 @@ async def test_agent_tools_samples_async(self, sample_path: str, **kwargs) -> No
         await executor.execute_async()
         await executor.validate_print_calls_by_llm_async(
             instructions=agent_tools_instructions,
-            project_endpoint=os.environ["azure_ai_projects_tests_agents_project_endpoint"],
+            project_endpoint=kwargs["azure_ai_projects_tests_agents_project_endpoint"],
         )

From ccb7f91d5160f7994421df705b17dfa6d557c40f Mon Sep 17 00:00:00 2001
From: Howie Leung <howieleung@microsoft.com>
Date: Tue, 30 Dec 2025 15:32:00 -0800
Subject: [PATCH 07/11] added feature to test samples with optional env vars

---
 .../azure-ai-projects/tests/samples/README.md |  41 ++-
 .../tests/samples/sample_executor.py          | 235 +++++++++++++++++-
 .../tests/samples/test_samples_async.py       |  26 +-
 3 files changed, 294 insertions(+), 8 deletions(-)

diff --git a/sdk/ai/azure-ai-projects/tests/samples/README.md b/sdk/ai/azure-ai-projects/tests/samples/README.md
index df265c7147c5..33d155d58f94 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/README.md
+++ b/sdk/ai/azure-ai-projects/tests/samples/README.md
@@ -4,7 +4,7 @@ Use recorded tests to validate samples with `SyncSampleExecutor` and `AsyncSampl
 
 ### Prerequisites
 - In `.env`, set the variables required by your samples plus `AZURE_TEST_RUN_LIVE=true` and `AZURE_SKIP_LIVE_RECORDING=false` when capturing recordings. CI playback typically uses `AZURE_TEST_RUN_LIVE=false` and `AZURE_SKIP_LIVE_RECORDING=true`.
-- Provide sanitized defaults via `servicePreparer` so recordings do not leak secrets.
+- Provide sanitized defaults via `servicePreparer` so recordings do not leak secrets. All mandatory environment variables used by the tests/samples must be specified in `servicePreparer` (as sanitized values) so playback can run without access to real secrets.
 
 ### Sync example
 ```python
@@ -79,7 +79,7 @@ class TestSamplesAsync(AzureRecordedTestCase):
 ```
 
 ### Key pieces
-- `@servicePreparer()`: Supplies sanitized environment variables for playback (often via `EnvironmentVariableLoader`). Use an empty string as the prefix if your variables do not share one.
+- `@servicePreparer()`: A custom helper you create for your test suite. It supplies sanitized environment variables for playback (often via `EnvironmentVariableLoader`). The name is up to you; these examples call it `servicePreparer` by convention.
 - Example:
 ```python
 import functools
@@ -108,3 +108,40 @@ def get_sample_environment_variables_map(operation_group: str | None = None) ->
 - `execute` / `execute_async`: Run the sample; any exception fails the test.
 - `validate_print_calls_by_llm` / `validate_print_calls_by_llm_async`: Optionally validate captured print output with LLM instructions and an explicit `project_endpoint` (and optional `model`).
 - `kwargs` in the test function: A dictionary with environment variables in key and value pairs.
+
+### Optional environment variables
+To run the “hero path” of a sample, your `@servicePreparer` should provide all mandatory environment variables.
+If a sample supports optional environment variables (for optional features/paths), use `@AdditionalTestsWithEnvironmentVariables` to generate additional recorded test cases with those optional variables set.
+
+```python
+@servicePreparer()
+@AdditionalTestsWithEnvironmentVariables(
+    [
+        (
+            "sample_agent_computer_use.py",
+            {"COMPUTER_USE_MODEL_DEPLOYMENT_NAME": "sanitized_model"},
+        ),
+        (
+            "sample_agent_computer_use.py",
+            {"COMPUTER_USE_MODEL_DEPLOYMENT_NAME": "sanitized_model", "SOME_FLAG": "true"},
+        )
+    ]
+)
+@pytest.mark.parametrize(
+    "sample_path",
+    get_sample_paths(
+        "agents/tools",
+        samples_to_skip=[],
+    ),
+)
+@SamplePathPasser()
+@recorded_by_proxy(RecordedTransport.AZURE_CORE, RecordedTransport.HTTPX)
+def test_agent_tools_samples(self, sample_path: str, **kwargs) -> None:
+    ...
+```
+
+In the example above, `sample_agent_computer_use.py` is executed multiple times with different optional environment variable sets.
+- Each tuple entry is one scenario. If you want multiple scenarios for the same sample file, add multiple entries with the same filename.
+- Live/recording: the value is read from your environment (for example, from `.env`).
+- Playback: the value is set to the provided sanitized value (`sanitized_model`).
+ 
diff --git a/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
index 5d2ad0e45d10..1cdc90fcffcd 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
@@ -6,9 +6,11 @@
 """Shared base code for sample tests - sync dependencies only."""
 import os
 import sys
+import re
 import pytest
 import inspect
 import importlib.util
+import functools
 from typing import overload, Union
 from pydantic import BaseModel
 
@@ -158,7 +160,13 @@ class TestReport(BaseModel):
         correct: bool
         reason: str
 
-    def __init__(self, test_instance, sample_path: str, env_var_mapping: dict[str, str], **kwargs):
+    def __init__(
+        self,
+        test_instance,
+        sample_path: str,
+        env_var_mapping: dict[str, str],
+        **kwargs,
+    ):
         self.test_instance = test_instance
         self.sample_path = sample_path
         self.print_calls: list[str] = []
@@ -171,6 +179,17 @@ def __init__(self, test_instance, sample_path: str, env_var_mapping: dict[str, s
             if value is not None:
                 self.env_vars[sample_var] = value
 
+        # Any remaining ALL_CAPS string kwargs are treated as env vars for the sample.
+        # This supports decorators/tests passing env-var overrides via **kwargs.
+        env_var_overrides: dict[str, str] = {}
+        for key, value in list(kwargs.items()):
+            if isinstance(key, str) and key.isupper() and isinstance(value, str):
+                env_var_overrides[key] = value
+                kwargs.pop(key, None)
+        if env_var_overrides:
+            # Allow overrides to win over mapped ones if needed.
+            self.env_vars.update(env_var_overrides)
+
         # Add the sample's directory to sys.path so it can import local modules
         self.sample_dir = os.path.dirname(sample_path)
         if self.sample_dir not in sys.path:
@@ -386,3 +405,217 @@ async def validate_print_calls_by_llm_async(
             )
             test_report = json.loads(response.output_text)
             self._assert_validation_result(test_report)
+
+
+def _is_live_mode() -> bool:
+    return os.environ.get("AZURE_TEST_RUN_LIVE") == "true"
+
+
+def _normalize_sample_filename(sample_file: str) -> str:
+    return os.path.basename(sample_file)
+
+
+def _resolve_additional_env_vars(
+    *,
+    sample_path: str,
+    playback_values: dict[str, str],
+) -> dict[str, str] | None:
+    sample_filename = os.path.basename(sample_path)
+
+    resolved: dict[str, str] = {}
+    if _is_live_mode():
+        for env_key, playback_value in playback_values.items():
+            live_value = os.environ.get(env_key)
+            if not live_value:
+                raise ValueError(
+                    f"Missing required environment variable '{env_key}' for live recording of sample '{sample_filename}'. "
+                    "Either set it in your environment/.env file or run in playback mode."
+                )
+            resolved[env_key] = live_value
+    else:
+        resolved.update(playback_values)
+
+    return resolved
+
+
+def _register_env_var_sanitizers(
+    *,
+    resolved_env_vars: dict[str, str],
+    playback_values: dict[str, str],
+) -> None:
+    """Register function-scoped sanitizers to replace live env-var values with playback values."""
+    if not _is_live_mode():
+        return
+
+    from devtools_testutils import add_general_string_sanitizer
+
+    for env_key, live_value in resolved_env_vars.items():
+        playback_value = playback_values.get(env_key)
+        if not playback_value:
+            continue
+        if live_value == playback_value:
+            continue
+
+        add_general_string_sanitizer(function_scoped=True, target=live_value, value=playback_value)
+
+
+class AdditionalTestsWithEnvironmentVariables:
+    """Decorator that injects per-sample additional env vars for record/playback.
+
+    Args:
+        samples_with_env_vars: List of tuples: (sample_filename, {ENV_KEY: playback_sanitized_value}).
+            - In live mode (AZURE_TEST_RUN_LIVE=true): reads actual values from the environment for ENV_KEY,
+              and registers function-scoped sanitizers to replace them with the provided playback values.
+            - In playback mode: sets ENV_KEY to the provided playback value.
+
+    The decorator also appends env-var keys to the pytest id for the matching sample.
+    """
+
+    def __init__(self, samples_with_env_vars: list[tuple[str, dict[str, str]]]):
+        # Allow multiple env-var sets per sample (e.g. same sample file listed multiple times)
+        self._env_var_playback_values_by_sample: dict[str, list[dict[str, str]]] = {}
+        for sample_file, playback_values in samples_with_env_vars:
+            key = _normalize_sample_filename(sample_file)
+            self._env_var_playback_values_by_sample.setdefault(key, []).append(playback_values)
+
+        # Mapping from param-id (request.node.callspec.id) -> playback values dict.
+        # Populated when we expand parametrize ids.
+        self._playback_values_by_param_id: dict[str, dict[str, str]] = {}
+
+    def __call__(self, fn):
+        # Expand the existing sample_path parametrization:
+        # - keep the original case (no extra env vars)
+        # - add one extra case per env-var set, with a stable id suffix
+        marks = getattr(fn, "pytestmark", [])
+        for mark in marks:
+            if getattr(mark, "name", None) != "parametrize":
+                continue
+            if not getattr(mark, "args", None) or len(mark.args) < 2:
+                continue
+
+            def _split_argnames(argnames) -> list[str]:
+                if isinstance(argnames, str):
+                    return [a.strip() for a in argnames.split(",") if a.strip()]
+                try:
+                    return list(argnames)
+                except TypeError:
+                    return [str(argnames)]
+
+            argnames = _split_argnames(mark.args[0])
+            if "sample_path" not in argnames:
+                continue
+            sample_path_index = argnames.index("sample_path")
+            argvalues = mark.args[1]
+            if not isinstance(argvalues, list):
+                continue
+
+            expanded: list = []
+
+            inferred_sample_dir: str | None = None
+            template_values: tuple | None = None
+            template_marks: tuple = ()
+            seen_sample_filenames: set[str] = set()
+
+            for parameter_set in list(argvalues):
+                values = getattr(parameter_set, "values", None)
+                if values is None:
+                    continue
+
+                if template_values is None:
+                    if isinstance(values, tuple):
+                        template_values = values
+                    elif isinstance(values, list):
+                        template_values = tuple(values)
+
+                    if template_values is not None:
+                        template_marks = tuple(getattr(parameter_set, "marks", ()))
+
+                expanded.append(parameter_set)  # baseline / original
+
+                if not isinstance(values, (list, tuple)):
+                    continue
+                if sample_path_index >= len(values):
+                    continue
+
+                sample_path = values[sample_path_index]
+
+                sample_filename = os.path.basename(str(sample_path))
+                seen_sample_filenames.add(sample_filename)
+
+                if inferred_sample_dir is None:
+                    inferred_sample_dir = os.path.dirname(str(sample_path))
+
+                playback_sets = self._env_var_playback_values_by_sample.get(sample_filename)
+                if not playback_sets:
+                    continue
+
+                base_id = getattr(parameter_set, "id", None) or os.path.splitext(sample_filename)[0]
+                marks_for_param = getattr(parameter_set, "marks", ())
+                for playback_values in playback_sets:
+                    keys_suffix = "+".join(sorted(playback_values.keys()))
+                    new_id = f"{base_id}[{keys_suffix}]"
+                    expanded.append(pytest.param(*values, marks=marks_for_param, id=new_id))
+                    self._playback_values_by_param_id[new_id] = playback_values
+
+            # If a sample was excluded from discovery (e.g., via samples_to_skip), it won't appear in argvalues.
+            # In that case, still synthesize *variant-only* cases for any configured env-var sets.
+            if inferred_sample_dir and template_values is not None:
+                for sample_filename, playback_sets in self._env_var_playback_values_by_sample.items():
+                    if sample_filename in seen_sample_filenames:
+                        continue
+
+                    synthetic_sample_path = os.path.join(inferred_sample_dir, sample_filename)
+                    synthetic_values = list(template_values)
+                    synthetic_values[sample_path_index] = synthetic_sample_path
+                    base_id = os.path.splitext(sample_filename)[0]
+
+                    for playback_values in playback_sets:
+                        keys_suffix = "+".join(sorted(playback_values.keys()))
+                        new_id = f"{base_id}[{keys_suffix}]"
+                        expanded.append(pytest.param(*synthetic_values, marks=template_marks, id=new_id))
+                        self._playback_values_by_param_id[new_id] = playback_values
+
+            # Keep a stable, deterministic order for test ids.
+            expanded.sort(key=lambda p: str(getattr(p, "id", "") or ""))
+
+            # Mutate the existing list in-place so pytest sees the expanded cases.
+            argvalues[:] = expanded
+
+        def _inject_env_vars(*, sample_path: str, kwargs: dict) -> None:
+            # Determine which env-var set applies for this specific parametrized case.
+            # Can't rely on the `request` fixture here because outer decorators may hide it from pytest.
+            current_test = os.environ.get("PYTEST_CURRENT_TEST", "")
+            nodeid = current_test.split(" ")[0]  # drop " (call)" / " (setup)" / etc.
+
+            # Capture everything between the first '[' and the last ']' in the nodeid.
+            # This works even if the callspec id itself contains nested brackets like base_id[ENV1|ENV2].
+            match = re.search(r"\[(?P<id>.*)\]", nodeid)
+            case_id = match.group("id") if match else None
+            playback_values = self._playback_values_by_param_id.get(case_id) if case_id else None
+
+            if not playback_values:
+                return
+
+            resolved = _resolve_additional_env_vars(sample_path=sample_path, playback_values=playback_values)
+            if not resolved:
+                return
+
+            _register_env_var_sanitizers(resolved_env_vars=resolved, playback_values=playback_values)
+            for env_key, env_value in resolved.items():
+                kwargs.setdefault(env_key, env_value)
+
+        if inspect.iscoroutinefunction(fn):
+
+            @functools.wraps(fn)
+            async def _wrapper_async(test_class, sample_path: str, *args, **kwargs):
+                _inject_env_vars(sample_path=sample_path, kwargs=kwargs)
+                return await fn(test_class, sample_path, *args, **kwargs)
+
+            return _wrapper_async
+
+        @functools.wraps(fn)
+        def _wrapper_sync(test_class, sample_path: str, *args, **kwargs):
+            _inject_env_vars(sample_path=sample_path, kwargs=kwargs)
+            return fn(test_class, sample_path, *args, **kwargs)
+
+        return _wrapper_sync
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
index 6f24368c576a..a0b367ed54a5 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
@@ -8,7 +8,12 @@
 from devtools_testutils.aio import recorded_by_proxy_async
 from devtools_testutils import AzureRecordedTestCase, RecordedTransport
 from test_base import servicePreparer
-from sample_executor import AsyncSampleExecutor, get_async_sample_paths, SamplePathPasser
+from sample_executor import (
+    AdditionalTestsWithEnvironmentVariables,
+    AsyncSampleExecutor,
+    SamplePathPasser,
+    get_async_sample_paths,
+)
 from test_samples_helpers import agent_tools_instructions, get_sample_environment_variables_map
 
 
@@ -18,20 +23,31 @@ class TestSamplesAsync(AzureRecordedTestCase):
     # To run this test with a specific sample, use:
     # pytest tests/samples/test_samples_async.py::TestSamplesAsync::test_agent_tools_samples_async[sample_agent_memory_search_async]
     @servicePreparer()
+    @AdditionalTestsWithEnvironmentVariables(
+        [
+            (
+                "sample_agent_computer_use_async.py",
+                {"COMPUTER_USE_MODEL_DEPLOYMENT_NAME": "sanitized_model"},
+            ),
+        ]
+    )
     @pytest.mark.parametrize(
         "sample_path",
         get_async_sample_paths(
             "agents/tools",
-            samples_to_skip=[
-                "sample_agent_mcp_with_project_connection_async.py",
-            ],
+            samples_to_skip=["sample_agent_mcp_with_project_connection_async.py"],
         ),
     )
     @SamplePathPasser()
     @recorded_by_proxy_async(RecordedTransport.AZURE_CORE, RecordedTransport.HTTPX)
     async def test_agent_tools_samples_async(self, sample_path: str, **kwargs) -> None:
         env_var_mapping = get_sample_environment_variables_map(operation_group="agents")
-        executor = AsyncSampleExecutor(self, sample_path, env_var_mapping, **kwargs)
+        executor = AsyncSampleExecutor(
+            self,
+            sample_path,
+            env_var_mapping,
+            **kwargs,
+        )
         await executor.execute_async()
         await executor.validate_print_calls_by_llm_async(
             instructions=agent_tools_instructions,

From 1ebd16a4a5334feb04bb1529fea438944a848c1e Mon Sep 17 00:00:00 2001
From: Howie Leung <howieleung@microsoft.com>
Date: Tue, 30 Dec 2025 16:11:40 -0800
Subject: [PATCH 08/11] resovled comment and recording

---
 sdk/ai/azure-ai-projects/assets.json                         | 2 +-
 sdk/ai/azure-ai-projects/tests/samples/README.md             | 2 +-
 sdk/ai/azure-ai-projects/tests/samples/test_samples.py       | 1 -
 sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py | 1 -
 4 files changed, 2 insertions(+), 4 deletions(-)

diff --git a/sdk/ai/azure-ai-projects/assets.json b/sdk/ai/azure-ai-projects/assets.json
index 153709b54f73..f9bbdec2b463 100644
--- a/sdk/ai/azure-ai-projects/assets.json
+++ b/sdk/ai/azure-ai-projects/assets.json
@@ -2,5 +2,5 @@
   "AssetsRepo": "Azure/azure-sdk-assets",
   "AssetsRepoPrefixPath": "python",
   "TagPrefix": "python/ai/azure-ai-projects",
-  "Tag": "python/ai/azure-ai-projects_53529b753b"
+  "Tag": "python/ai/azure-ai-projects_b0201f3422"
 }
diff --git a/sdk/ai/azure-ai-projects/tests/samples/README.md b/sdk/ai/azure-ai-projects/tests/samples/README.md
index 33d155d58f94..d8b3129d1398 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/README.md
+++ b/sdk/ai/azure-ai-projects/tests/samples/README.md
@@ -144,4 +144,4 @@ In the example above, `sample_agent_computer_use.py` is executed multiple times
 - Each tuple entry is one scenario. If you want multiple scenarios for the same sample file, add multiple entries with the same filename.
 - Live/recording: the value is read from your environment (for example, from `.env`).
 - Playback: the value is set to the provided sanitized value (`sanitized_model`).
- 
+
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
index c6401da64375..a8e677c95d47 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
@@ -3,7 +3,6 @@
 # Copyright (c) Microsoft Corporation.
 # Licensed under the MIT License.
 # ------------------------------------
-import os
 import pytest
 from devtools_testutils import recorded_by_proxy, AzureRecordedTestCase, RecordedTransport
 from test_base import servicePreparer
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
index a0b367ed54a5..70759f7e1b61 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
@@ -3,7 +3,6 @@
 # Copyright (c) Microsoft Corporation.
 # Licensed under the MIT License.
 # ------------------------------------
-import os
 import pytest
 from devtools_testutils.aio import recorded_by_proxy_async
 from devtools_testutils import AzureRecordedTestCase, RecordedTransport

From e809149535e57fe14a81f9d049aaf71e50e978ce Mon Sep 17 00:00:00 2001
From: Howie Leung <howieleung@microsoft.com>
Date: Tue, 30 Dec 2025 16:56:45 -0800
Subject: [PATCH 09/11] recording again

---
 sdk/ai/azure-ai-projects/assets.json | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/sdk/ai/azure-ai-projects/assets.json b/sdk/ai/azure-ai-projects/assets.json
index f9bbdec2b463..f9f75fbad26b 100644
--- a/sdk/ai/azure-ai-projects/assets.json
+++ b/sdk/ai/azure-ai-projects/assets.json
@@ -2,5 +2,5 @@
   "AssetsRepo": "Azure/azure-sdk-assets",
   "AssetsRepoPrefixPath": "python",
   "TagPrefix": "python/ai/azure-ai-projects",
-  "Tag": "python/ai/azure-ai-projects_b0201f3422"
+  "Tag": "python/ai/azure-ai-projects_7928349686"
 }

From b0117d5440e6e39021427301617ea5a1039aa230 Mon Sep 17 00:00:00 2001
From: Howie Leung <howieleung@microsoft.com>
Date: Tue, 30 Dec 2025 17:47:47 -0800
Subject: [PATCH 10/11] fix

---
 sdk/ai/azure-ai-projects/tests/samples/sample_executor.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
index 1cdc90fcffcd..dea43216f12e 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
@@ -419,12 +419,12 @@ def _resolve_additional_env_vars(
     *,
     sample_path: str,
     playback_values: dict[str, str],
-) -> dict[str, str] | None:
+) -> dict[str, str]:
     sample_filename = os.path.basename(sample_path)
 
     resolved: dict[str, str] = {}
     if _is_live_mode():
-        for env_key, playback_value in playback_values.items():
+        for env_key, _ in playback_values.items():
             live_value = os.environ.get(env_key)
             if not live_value:
                 raise ValueError(

From ee53c3dec79945f9aca198d9da38b2d45530a579 Mon Sep 17 00:00:00 2001
From: Howie Leung <howieleung@microsoft.com>
Date: Wed, 31 Dec 2025 00:09:08 -0800
Subject: [PATCH 11/11] Update sample test configurations and improve
 environment variable handling

---
 sdk/ai/azure-ai-projects/assets.json          |   2 +-
 .../azure-ai-projects/tests/samples/README.md |  52 +++++---
 .../tests/samples/sample_executor.py          | 122 +++++++++++++-----
 .../tests/samples/test_samples.py             |  18 ++-
 .../tests/samples/test_samples_async.py       |  13 +-
 5 files changed, 140 insertions(+), 67 deletions(-)

diff --git a/sdk/ai/azure-ai-projects/assets.json b/sdk/ai/azure-ai-projects/assets.json
index f9f75fbad26b..d83bf373729d 100644
--- a/sdk/ai/azure-ai-projects/assets.json
+++ b/sdk/ai/azure-ai-projects/assets.json
@@ -2,5 +2,5 @@
   "AssetsRepo": "Azure/azure-sdk-assets",
   "AssetsRepoPrefixPath": "python",
   "TagPrefix": "python/ai/azure-ai-projects",
-  "Tag": "python/ai/azure-ai-projects_7928349686"
+  "Tag": "python/ai/azure-ai-projects_99f92cad55"
 }
diff --git a/sdk/ai/azure-ai-projects/tests/samples/README.md b/sdk/ai/azure-ai-projects/tests/samples/README.md
index d8b3129d1398..2f9537e9169d 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/README.md
+++ b/sdk/ai/azure-ai-projects/tests/samples/README.md
@@ -6,13 +6,15 @@ Use recorded tests to validate samples with `SyncSampleExecutor` and `AsyncSampl
 - In `.env`, set the variables required by your samples plus `AZURE_TEST_RUN_LIVE=true` and `AZURE_SKIP_LIVE_RECORDING=false` when capturing recordings. CI playback typically uses `AZURE_TEST_RUN_LIVE=false` and `AZURE_SKIP_LIVE_RECORDING=true`.
 - Provide sanitized defaults via `servicePreparer` so recordings do not leak secrets. All mandatory environment variables used by the tests/samples must be specified in `servicePreparer` (as sanitized values) so playback can run without access to real secrets.
 
+**VS Code tip (record a single sample):** Open the **Testing** tab, expand the pytest tree to find the specific sample test case (for example, one parameterized case for a particular `sample_path`), then right-click it and choose **Run Test** (or **Debug Test**). Make sure your `.env` (or your test run environment) includes `AZURE_TEST_RUN_LIVE=true` and `AZURE_SKIP_LIVE_RECORDING=false` so that run captures a new recording for just that sample.
+
 ### Sync example
 ```python
 import pytest
 import os
 from devtools_testutils import recorded_by_proxy, AzureRecordedTestCase, RecordedTransport
 from test_base import servicePreparer
-from sample_executor import SyncSampleExecutor, get_sample_paths, SamplePathPasser
+from sample_executor import SyncSampleExecutor, get_sample_paths, samplePathPasser
 from test_samples_helpers import agent_tools_instructions, get_sample_environment_variables_map
 
 class TestSamples(AzureRecordedTestCase):
@@ -32,7 +34,7 @@ class TestSamples(AzureRecordedTestCase):
             ],
         ),
     )
-    @SamplePathPasser()
+    @samplePathPasser()
     @recorded_by_proxy(RecordedTransport.AZURE_CORE, RecordedTransport.HTTPX)
     def test_agent_tools_samples(self, sample_path: str, **kwargs) -> None:
         env_var_mapping = get_sample_environment_variables_map()
@@ -51,7 +53,7 @@ from devtools_testutils.aio import recorded_by_proxy_async
 import os
 from devtools_testutils import AzureRecordedTestCase, RecordedTransport
 from test_base import servicePreparer
-from sample_executor import AsyncSampleExecutor, get_async_sample_paths, SamplePathPasser
+from sample_executor import AsyncSampleExecutor, get_async_sample_paths, samplePathPasser
 from test_samples_helpers import agent_tools_instructions, get_sample_environment_variables_map
 
 class TestSamplesAsync(AzureRecordedTestCase):
@@ -66,7 +68,7 @@ class TestSamplesAsync(AzureRecordedTestCase):
             ],
         ),
     )
-    @SamplePathPasser()
+    @samplePathPasser()
     @recorded_by_proxy_async(RecordedTransport.AZURE_CORE, RecordedTransport.HTTPX)
     async def test_agent_tools_samples_async(self, sample_path: str, **kwargs) -> None:
         env_var_mapping = get_sample_environment_variables_map()
@@ -94,7 +96,7 @@ servicePreparer = functools.partial(
 )
 ```
 - `@pytest.mark.parametrize`: Drives one test per sample file. Use `samples_to_test` or `samples_to_skip` with `get_sample_paths` / `get_async_sample_paths`.
-- `@SamplePathPasser`: Forwards the sample path to the recorder decorators.
+- `@samplePathPasser`: Forwards the sample path to the recorder decorators.
 - `recorded_by_proxy` / `recorded_by_proxy_async`: Wrap tests for recording/playback. Include `RecordedTransport.HTTPX` when samples use httpx in addition to the default `RecordedTransport.AZURE_CORE`.
 - `get_sample_environment_variables_map`: Map test env vars to the names expected by samples. Pass `{}` if you already export the sample variables directly. Example:
 ```python
@@ -111,20 +113,27 @@ def get_sample_environment_variables_map(operation_group: str | None = None) ->
 
 ### Optional environment variables
 To run the “hero path” of a sample, your `@servicePreparer` should provide all mandatory environment variables.
-If a sample supports optional environment variables (for optional features/paths), use `@AdditionalTestsWithEnvironmentVariables` to generate additional recorded test cases with those optional variables set.
+If a sample supports optional environment variables (for optional features/paths), use `@additionalSampleTests` to generate additional recorded test cases with those optional variables set.
 
 ```python
+from sample_executor import AdditionalSampleTestDetail, additionalSampleTests
+
 @servicePreparer()
-@AdditionalTestsWithEnvironmentVariables(
+@additionalSampleTests(
     [
-        (
-            "sample_agent_computer_use.py",
-            {"COMPUTER_USE_MODEL_DEPLOYMENT_NAME": "sanitized_model"},
+        AdditionalSampleTestDetail(
+            sample_filename="sample_agent_computer_use.py",
+            env_vars={"COMPUTER_USE_MODEL_DEPLOYMENT_NAME": "sanitized_model"},
+            test_id="computer_use",
+        ),
+        AdditionalSampleTestDetail(
+            sample_filename="sample_agent_computer_use.py",
+            env_vars={
+                "COMPUTER_USE_MODEL_DEPLOYMENT_NAME": "sanitized_model",
+                "SOME_FLAG": "true",
+            },
+            test_id="sample_agent_computer_use_with_flag",
         ),
-        (
-            "sample_agent_computer_use.py",
-            {"COMPUTER_USE_MODEL_DEPLOYMENT_NAME": "sanitized_model", "SOME_FLAG": "true"},
-        )
     ]
 )
 @pytest.mark.parametrize(
@@ -134,14 +143,19 @@ If a sample supports optional environment variables (for optional features/paths
         samples_to_skip=[],
     ),
 )
-@SamplePathPasser()
+@samplePathPasser()
 @recorded_by_proxy(RecordedTransport.AZURE_CORE, RecordedTransport.HTTPX)
 def test_agent_tools_samples(self, sample_path: str, **kwargs) -> None:
     ...
 ```
 
-In the example above, `sample_agent_computer_use.py` is executed multiple times with different optional environment variable sets.
-- Each tuple entry is one scenario. If you want multiple scenarios for the same sample file, add multiple entries with the same filename.
-- Live/recording: the value is read from your environment (for example, from `.env`).
-- Playback: the value is set to the provided sanitized value (`sanitized_model`).
+Notes:
+- `AdditionalSampleTestDetail.env_vars` is a mapping of **sample env-var name** -> **sanitized playback value**.
+    - Live/recording (`AZURE_TEST_RUN_LIVE=true`): reads the real value from your environment (for example, from `.env`) and sanitizes it to the provided playback value.
+    - Playback (`AZURE_TEST_RUN_LIVE=false`): sets each key to the provided playback value.
+- `AdditionalSampleTestDetail.test_id` customizes the parameter id used for that variant.
+    - If omitted, the id is auto-generated from the sample filename and env-var keys (for example, `sample_agent_computer_use-[COMPUTER_USE_MODEL_DEPLOYMENT_NAME]`).
+    - If provided, it becomes the full parameter id for that variant (no filename prefix).
+    - If the auto-generated id makes the recording file path too long (most commonly on Windows), the recording file may fail to generate; set a short `test_id` (and keep it unique across all parametrized cases).
+- In VS Code’s **Testing** tab, these show up as additional parameterized cases for the same test, using the parameter id.
 
diff --git a/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
index dea43216f12e..62fb614ff600 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/sample_executor.py
@@ -11,6 +11,7 @@
 import inspect
 import importlib.util
 import functools
+from dataclasses import dataclass, field
 from typing import overload, Union
 from pydantic import BaseModel
 
@@ -249,22 +250,28 @@ def _assert_validation_result(self, test_report: dict) -> None:
         print(f"Reason: {test_report['reason']}")
 
 
-class SamplePathPasser:
-    """Decorator for passing sample path to test functions."""
+def samplePathPasser():
+    """Decorator factory for passing sample path to test functions.
 
-    def __call__(self, fn):
+    Usage: `@samplePathPasser()`.
+    """
+
+    def _decorator(fn):
         if inspect.iscoroutinefunction(fn):
 
+            @functools.wraps(fn)
             async def _wrapper_async(test_class, sample_path, **kwargs):
                 return await fn(test_class, sample_path, **kwargs)
 
             return _wrapper_async
-        else:
 
-            def _wrapper_sync(test_class, sample_path, **kwargs):
-                return fn(test_class, sample_path, **kwargs)
+        @functools.wraps(fn)
+        def _wrapper_sync(test_class, sample_path, **kwargs):
+            return fn(test_class, sample_path, **kwargs)
 
-            return _wrapper_sync
+        return _wrapper_sync
+
+    return _decorator
 
 
 class SyncSampleExecutor(BaseSampleExecutor):
@@ -459,11 +466,49 @@ def _register_env_var_sanitizers(
         add_general_string_sanitizer(function_scoped=True, target=live_value, value=playback_value)
 
 
-class AdditionalTestsWithEnvironmentVariables:
-    """Decorator that injects per-sample additional env vars for record/playback.
+@dataclass(slots=True, init=False)
+class AdditionalSampleTestDetail:
+    """Configuration for adding an additional parametrized test case for a specific sample.
+
+    In live mode (AZURE_TEST_RUN_LIVE=true), the values for keys in `env_vars` are read from the
+    environment and then sanitized to the provided playback values.
+
+    In playback mode, keys in `env_vars` are set to the provided playback values.
+    """
+
+    sample_filename: str
+    env_vars: dict[str, str]
+    _test_id: str | None = field(default=None, repr=False)
+
+    def __init__(
+        self,
+        *,
+        sample_filename: str,
+        env_vars: dict[str, str],
+        test_id: str | None = None,
+    ) -> None:
+        self.sample_filename = sample_filename
+        self.env_vars = env_vars
+        self._test_id = test_id
+
+    @property
+    def test_id(self) -> str:
+        if self._test_id is None:
+            sample_stem = os.path.splitext(os.path.basename(self.sample_filename))[0]
+            keys_suffix = ",".join(sorted(self.env_vars.keys()))
+            self._test_id = f"{sample_stem}-[{keys_suffix}]"
+        return self._test_id
+
+    @test_id.setter
+    def test_id(self, value: str) -> None:
+        self._test_id = value
+
+
+def additionalSampleTests(additional_tests: list[AdditionalSampleTestDetail]):
+    """Decorator factory that adds additional test cases per sample for record/playback.
 
     Args:
-        samples_with_env_vars: List of tuples: (sample_filename, {ENV_KEY: playback_sanitized_value}).
+        additional_tests: List of `AdditionalSampleTestDetail` items.
             - In live mode (AZURE_TEST_RUN_LIVE=true): reads actual values from the environment for ENV_KEY,
               and registers function-scoped sanitizers to replace them with the provided playback values.
             - In playback mode: sets ENV_KEY to the provided playback value.
@@ -471,18 +516,17 @@ class AdditionalTestsWithEnvironmentVariables:
     The decorator also appends env-var keys to the pytest id for the matching sample.
     """
 
-    def __init__(self, samples_with_env_vars: list[tuple[str, dict[str, str]]]):
-        # Allow multiple env-var sets per sample (e.g. same sample file listed multiple times)
-        self._env_var_playback_values_by_sample: dict[str, list[dict[str, str]]] = {}
-        for sample_file, playback_values in samples_with_env_vars:
-            key = _normalize_sample_filename(sample_file)
-            self._env_var_playback_values_by_sample.setdefault(key, []).append(playback_values)
+    # Allow multiple env-var sets per sample (e.g. same sample file listed multiple times)
+    env_var_sets_by_sample: dict[str, list[AdditionalSampleTestDetail]] = {}
+    for item in additional_tests:
+        key = _normalize_sample_filename(item.sample_filename)
+        env_var_sets_by_sample.setdefault(key, []).append(item)
 
-        # Mapping from param-id (request.node.callspec.id) -> playback values dict.
-        # Populated when we expand parametrize ids.
-        self._playback_values_by_param_id: dict[str, dict[str, str]] = {}
+    # Mapping from param-id (request.node.callspec.id) -> playback values dict.
+    # Populated when we expand parametrize ids.
+    playback_values_by_param_id: dict[str, dict[str, str]] = {}
 
-    def __call__(self, fn):
+    def _decorator(fn):
         # Expand the existing sample_path parametrization:
         # - keep the original case (no extra env vars)
         # - add one extra case per env-var set, with a stable id suffix
@@ -545,35 +589,43 @@ def _split_argnames(argnames) -> list[str]:
                 if inferred_sample_dir is None:
                     inferred_sample_dir = os.path.dirname(str(sample_path))
 
-                playback_sets = self._env_var_playback_values_by_sample.get(sample_filename)
-                if not playback_sets:
+                additional_details = env_var_sets_by_sample.get(sample_filename)
+                if not additional_details:
                     continue
 
-                base_id = getattr(parameter_set, "id", None) or os.path.splitext(sample_filename)[0]
                 marks_for_param = getattr(parameter_set, "marks", ())
-                for playback_values in playback_sets:
-                    keys_suffix = "+".join(sorted(playback_values.keys()))
-                    new_id = f"{base_id}[{keys_suffix}]"
+                for detail in additional_details:
+                    new_id = detail.test_id
+
+                    if new_id in playback_values_by_param_id:
+                        raise ValueError(
+                            f"Duplicate additional sample test id '{new_id}'. "
+                            "When using test_id, ensure it is unique across all parametrized cases."
+                        )
                     expanded.append(pytest.param(*values, marks=marks_for_param, id=new_id))
-                    self._playback_values_by_param_id[new_id] = playback_values
+                    playback_values_by_param_id[new_id] = detail.env_vars
 
             # If a sample was excluded from discovery (e.g., via samples_to_skip), it won't appear in argvalues.
             # In that case, still synthesize *variant-only* cases for any configured env-var sets.
             if inferred_sample_dir and template_values is not None:
-                for sample_filename, playback_sets in self._env_var_playback_values_by_sample.items():
+                for sample_filename, playback_sets in env_var_sets_by_sample.items():
                     if sample_filename in seen_sample_filenames:
                         continue
 
                     synthetic_sample_path = os.path.join(inferred_sample_dir, sample_filename)
                     synthetic_values = list(template_values)
                     synthetic_values[sample_path_index] = synthetic_sample_path
-                    base_id = os.path.splitext(sample_filename)[0]
 
-                    for playback_values in playback_sets:
-                        keys_suffix = "+".join(sorted(playback_values.keys()))
-                        new_id = f"{base_id}[{keys_suffix}]"
+                    for detail in playback_sets:
+                        new_id = detail.test_id
+
+                        if new_id in playback_values_by_param_id:
+                            raise ValueError(
+                                f"Duplicate additional sample test id '{new_id}'. "
+                                "When using test_id, ensure it is unique across all parametrized cases."
+                            )
                         expanded.append(pytest.param(*synthetic_values, marks=template_marks, id=new_id))
-                        self._playback_values_by_param_id[new_id] = playback_values
+                        playback_values_by_param_id[new_id] = detail.env_vars
 
             # Keep a stable, deterministic order for test ids.
             expanded.sort(key=lambda p: str(getattr(p, "id", "") or ""))
@@ -591,7 +643,7 @@ def _inject_env_vars(*, sample_path: str, kwargs: dict) -> None:
             # This works even if the callspec id itself contains nested brackets like base_id[ENV1|ENV2].
             match = re.search(r"\[(?P<id>.*)\]", nodeid)
             case_id = match.group("id") if match else None
-            playback_values = self._playback_values_by_param_id.get(case_id) if case_id else None
+            playback_values = playback_values_by_param_id.get(case_id) if case_id else None
 
             if not playback_values:
                 return
@@ -619,3 +671,5 @@ def _wrapper_sync(test_class, sample_path: str, *args, **kwargs):
             return fn(test_class, sample_path, *args, **kwargs)
 
         return _wrapper_sync
+
+    return _decorator
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
index a8e677c95d47..c517e43908de 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples.py
@@ -6,7 +6,13 @@
 import pytest
 from devtools_testutils import recorded_by_proxy, AzureRecordedTestCase, RecordedTransport
 from test_base import servicePreparer
-from sample_executor import SyncSampleExecutor, get_sample_paths, SamplePathPasser
+from sample_executor import (
+    AdditionalSampleTestDetail,
+    SyncSampleExecutor,
+    additionalSampleTests,
+    get_sample_paths,
+    samplePathPasser,
+)
 from test_samples_helpers import agent_tools_instructions, get_sample_environment_variables_map
 
 
@@ -15,6 +21,14 @@ class TestSamples(AzureRecordedTestCase):
     # To run this test with a specific sample, use:
     # pytest tests/samples/test_samples.py::TestSamples::test_agent_tools_samples[sample_agent_memory_search]
     @servicePreparer()
+    @additionalSampleTests(
+        [
+            AdditionalSampleTestDetail(
+                sample_filename="sample_agent_computer_use.py",
+                env_vars={"COMPUTER_USE_MODEL_DEPLOYMENT_NAME": "sanitized_model"},
+            ),
+        ]
+    )
     @pytest.mark.parametrize(
         "sample_path",
         get_sample_paths(
@@ -30,7 +44,7 @@ class TestSamples(AzureRecordedTestCase):
             ],
         ),
     )
-    @SamplePathPasser()
+    @samplePathPasser()
     @recorded_by_proxy(RecordedTransport.AZURE_CORE, RecordedTransport.HTTPX)
     def test_agent_tools_samples(self, sample_path: str, **kwargs) -> None:
         env_var_mapping = get_sample_environment_variables_map(operation_group="agents")
diff --git a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
index 70759f7e1b61..1f3b4c5775c4 100644
--- a/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
+++ b/sdk/ai/azure-ai-projects/tests/samples/test_samples_async.py
@@ -8,9 +8,8 @@
 from devtools_testutils import AzureRecordedTestCase, RecordedTransport
 from test_base import servicePreparer
 from sample_executor import (
-    AdditionalTestsWithEnvironmentVariables,
     AsyncSampleExecutor,
-    SamplePathPasser,
+    samplePathPasser,
     get_async_sample_paths,
 )
 from test_samples_helpers import agent_tools_instructions, get_sample_environment_variables_map
@@ -22,14 +21,6 @@ class TestSamplesAsync(AzureRecordedTestCase):
     # To run this test with a specific sample, use:
     # pytest tests/samples/test_samples_async.py::TestSamplesAsync::test_agent_tools_samples_async[sample_agent_memory_search_async]
     @servicePreparer()
-    @AdditionalTestsWithEnvironmentVariables(
-        [
-            (
-                "sample_agent_computer_use_async.py",
-                {"COMPUTER_USE_MODEL_DEPLOYMENT_NAME": "sanitized_model"},
-            ),
-        ]
-    )
     @pytest.mark.parametrize(
         "sample_path",
         get_async_sample_paths(
@@ -37,7 +28,7 @@ class TestSamplesAsync(AzureRecordedTestCase):
             samples_to_skip=["sample_agent_mcp_with_project_connection_async.py"],
         ),
     )
-    @SamplePathPasser()
+    @samplePathPasser()
     @recorded_by_proxy_async(RecordedTransport.AZURE_CORE, RecordedTransport.HTTPX)
     async def test_agent_tools_samples_async(self, sample_path: str, **kwargs) -> None:
         env_var_mapping = get_sample_environment_variables_map(operation_group="agents")