Make e2e tests deterministic for provider-proxy cache

Replace random values (UUIDs, random integers) in LLM provider request bodies with fixed strings. This makes provider-proxy cache keys deterministic across test runs, enabling read-only cache mode in CI. Changes: - providers/common.rs: Remove UUID from bad auth test prompt - providers/anthropic.rs: Remove UUID from thinking test prompt - aggregated_response/mod.rs: Remove UUID suffix from prompt - otel.rs: Use fixed string for tag value - raw_response/embeddings.rs: Use fixed string for embedding input - test_client.py: Remove UUID from extra headers test prompt - test_embeddings.py: Use fixed strings for cache test inputs Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
tensorzero · AntoineToussaint · Apr 8, 2026 · Apr 8, 2026 · Apr 9, 2026 · Apr 9, 2026
commit 9a6feab46ea35ee2a39de7ec4ae18be5ab24c70b
diff --git a/crates/tensorzero-core/tests/e2e/aggregated_response/mod.rs b/crates/tensorzero-core/tests/e2e/aggregated_response/mod.rs
@@ -15,7 +15,6 @@ use crate::common::get_gateway_endpoint;
 #[tokio::test]
 async fn test_aggregated_response_chat_streaming() {
     let episode_id = Uuid::now_v7();
-    let random_suffix = Uuid::now_v7();
 
     let payload = json!({
         "function_name": "basic_test",
@@ -26,7 +25,7 @@ async fn test_aggregated_response_chat_streaming() {
             "messages": [
                 {
                     "role": "user",
-                    "content": format!("Say hello in one sentence. {random_suffix}")
+                    "content": "Say hello in one sentence. deterministic-cache-test"
                 }
             ]
         },

diff --git a/crates/tensorzero-core/tests/e2e/otel.rs b/crates/tensorzero-core/tests/e2e/otel.rs
@@ -943,7 +943,7 @@ pub fn test_capture_model_error(mode: OtlpTracesFormat, config_mode: &str) {
                 tags: HashMap::from([
                     ("first_tag".to_string(), "first_value".into()),
                     ("second_tag".to_string(), "second_value".into()),
-                    ("user_id".to_string(), Uuid::now_v7().to_string()),
+                    ("user_id".to_string(), "deterministic-cache-test".into()),
                 ]),
                 ..Default::default()
             })

diff --git a/crates/tensorzero-core/tests/e2e/providers/anthropic.rs b/crates/tensorzero-core/tests/e2e/providers/anthropic.rs
@@ -202,14 +202,13 @@ async fn test_thinking_rejected_128k() {
     // does not cache. Therefore, this test will always hit live providers.
     // Consider moving to periodic live tests if this causes merge queue instability.
     // See: https://github.com/tensorzero/tensorzero/issues/5380
-    let random = Uuid::now_v7();
     let payload = json!({
         "model_name": "anthropic::claude-sonnet-4-5",
         "input":{
             "messages": [
                 {
                     "role": "user",
-                    "content": format!("Output a haiku that ends in the word 'my_custom_stop': {random}"),
+                    "content": "Output a haiku that ends in the word 'my_custom_stop': deterministic-cache-test",
                 }
             ]},
         "params": {

diff --git a/crates/tensorzero-core/tests/e2e/providers/common.rs b/crates/tensorzero-core/tests/e2e/providers/common.rs
@@ -2405,7 +2405,7 @@ pub async fn test_bad_auth_extra_headers_with_provider_and_stream(
                "messages": [
                 {
                     "role": "user",
-                    "content": format!("If you see this, something has gone wrong - the request should have failed: {}", Uuid::now_v7())
+                    "content": "If you see this, something has gone wrong - the request should have failed: deterministic-cache-test"
                 }
             ]},
         "stream": stream,

diff --git a/crates/tensorzero-core/tests/e2e/raw_response/embeddings.rs b/crates/tensorzero-core/tests/e2e/raw_response/embeddings.rs
@@ -234,10 +234,7 @@ async fn test_embeddings_raw_response_batch() {
 
 #[tokio::test]
 async fn test_embeddings_raw_response_with_cache() {
-    let input_text = format!(
-        "This is a cache test for embeddings raw_response - {}",
-        rand::random::<u32>()
-    );
+    let input_text = "This is a cache test for embeddings raw_response - deterministic-cache-test";
 
     // First request: populate cache with raw_response enabled
     let payload = json!({

diff --git a/crates/tensorzero-python/tests/test_client.py b/crates/tensorzero-python/tests/test_client.py
@@ -2413,13 +2413,12 @@ def test_prepare_inference_request(sync_client: TensorZeroGateway):
 
 def test_extra_headers_raw(sync_client: TensorZeroGateway):
     with pytest.raises(TensorZeroError) as exc_info:
-        id = uuid7()
         sync_client.inference(
             function_name="basic_test",
             variant_name="openai",
             input={
                 "system": {"assistant_name": "Alfred Pennyworth"},
-                "messages": [{"role": "user", "content": f"Write me a haiku {id}"}],
+                "messages": [{"role": "user", "content": "Write me a haiku about extra headers"}],
             },
             extra_headers=[
                 {

diff --git a/crates/tensorzero-python/tests/test_embeddings.py b/crates/tensorzero-python/tests/test_embeddings.py
@@ -15,7 +15,6 @@
 """
 
 import asyncio
-import random
 
 import pytest
 
@@ -217,8 +216,7 @@ async def test_embeddings_consistency(async_openai_client):
 @pytest.mark.asyncio
 async def test_embeddings_cache_with_float_encoding(async_openai_client):
     """Test that caching works correctly with float encoding format"""
-    # Use a unique input to ensure we're not hitting existing cache
-    input_text = f"Cache test with float encoding - {random.randint(0, 1000000)}"
+    input_text = "Cache test with float encoding - deterministic"
 
     # First request with float encoding and cache enabled
     result1 = await async_openai_client.embeddings.create(
@@ -254,8 +252,7 @@ async def test_embeddings_cache_with_float_encoding(async_openai_client):
 @pytest.mark.asyncio
 async def test_embeddings_cache_with_base64_encoding(async_openai_client):
     """Test that caching works correctly with base64 encoding format"""
-    # Use a unique input to ensure we're not hitting existing cache
-    input_text = f"Cache test with base64 encoding - {random.randint(0, 1000000)}"
+    input_text = "Cache test with base64 encoding - deterministic"
 
     # First request with base64 encoding and cache enabled
     result1 = await async_openai_client.embeddings.create(