From cbc1d3e980f24744b10b79ede5fc42b494433874 Mon Sep 17 00:00:00 2001
From: Adil Hafeez <adil.hafeez@gmail.com>
Date: Wed, 5 Feb 2025 19:13:58 -0800
Subject: [PATCH] rust tests

---
 crates/prompt_gateway/src/stream_context.rs |   4 +-
 crates/prompt_gateway/tests/integration.rs  | 724 ++++++++++----------
 2 files changed, 363 insertions(+), 365 deletions(-)

diff --git a/crates/prompt_gateway/src/stream_context.rs b/crates/prompt_gateway/src/stream_context.rs
index ce9b852f..77608cca 100644
--- a/crates/prompt_gateway/src/stream_context.rs
+++ b/crates/prompt_gateway/src/stream_context.rs
@@ -321,9 +321,7 @@ impl StreamContext {
             };
 
         let (path, body) = match http_method {
-            HttpMethod::Get => {
-                (format!("{}?{}", path_with_params, query_string), None)
-            }
+            HttpMethod::Get => (format!("{}?{}", path_with_params, query_string), None),
             HttpMethod::Post => {
                 let mut additional_params = additional_params;
                 if !query_string.is_empty() {
diff --git a/crates/prompt_gateway/tests/integration.rs b/crates/prompt_gateway/tests/integration.rs
index e9ff2064..4cc6f656 100644
--- a/crates/prompt_gateway/tests/integration.rs
+++ b/crates/prompt_gateway/tests/integration.rs
@@ -1,11 +1,11 @@
 use common::api::open_ai::{
-  ChatCompletionsResponse, Choice, FunctionCallDetail, Message, ToolCall, ToolType, Usage,
+    ChatCompletionsResponse, Choice, FunctionCallDetail, Message, ToolCall, ToolType, Usage,
 };
 use common::configuration::Configuration;
 use http::StatusCode;
 use proxy_wasm_test_framework::tester::{self, Tester};
 use proxy_wasm_test_framework::types::{
-  Action, BufferType, LogLevel, MapType, MetricType, ReturnType,
+    Action, BufferType, LogLevel, MapType, MetricType, ReturnType,
 };
 use serde_yaml::Value;
 use serial_test::serial;
@@ -13,440 +13,440 @@ use std::collections::HashMap;
 use std::path::Path;
 
 fn wasm_module() -> String {
-  let wasm_file = Path::new("../target/wasm32-wasip1/release/prompt_gateway.wasm");
-  assert!(
-      wasm_file.exists(),
-      "Run `cargo build --release --target=wasm32-wasip1` first"
-  );
-  wasm_file.to_str().unwrap().to_string()
+    let wasm_file = Path::new("../target/wasm32-wasip1/release/prompt_gateway.wasm");
+    assert!(
+        wasm_file.exists(),
+        "Run `cargo build --release --target=wasm32-wasip1` first"
+    );
+    wasm_file.to_str().unwrap().to_string()
 }
 
 fn request_headers_expectations(module: &mut Tester, http_context: i32) {
-  module
-      .call_proxy_on_request_headers(http_context, 0, false)
-      .expect_remove_header_map_value(Some(MapType::HttpRequestHeaders), Some("content-length"))
-      .expect_get_header_map_value(Some(MapType::HttpRequestHeaders), Some(":path"))
-      .returning(Some("/v1/chat/completions"))
-      .expect_get_header_map_pairs(Some(MapType::HttpRequestHeaders))
-      .returning(None)
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_get_header_map_value(Some(MapType::HttpRequestHeaders), Some("x-request-id"))
-      .returning(None)
-      .expect_get_header_map_value(Some(MapType::HttpRequestHeaders), Some("traceparent"))
-      .returning(None)
-      .execute_and_expect(ReturnType::Action(Action::Continue))
-      .unwrap();
+    module
+        .call_proxy_on_request_headers(http_context, 0, false)
+        .expect_remove_header_map_value(Some(MapType::HttpRequestHeaders), Some("content-length"))
+        .expect_get_header_map_value(Some(MapType::HttpRequestHeaders), Some(":path"))
+        .returning(Some("/v1/chat/completions"))
+        .expect_get_header_map_pairs(Some(MapType::HttpRequestHeaders))
+        .returning(None)
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_get_header_map_value(Some(MapType::HttpRequestHeaders), Some("x-request-id"))
+        .returning(None)
+        .expect_get_header_map_value(Some(MapType::HttpRequestHeaders), Some("traceparent"))
+        .returning(None)
+        .execute_and_expect(ReturnType::Action(Action::Continue))
+        .unwrap();
 }
 
 fn normal_flow(module: &mut Tester, filter_context: i32, http_context: i32) {
-  module
-      .call_proxy_on_context_create(http_context, filter_context)
-      .expect_log(Some(LogLevel::Trace), None)
-      .execute_and_expect(ReturnType::None)
-      .unwrap();
+    module
+        .call_proxy_on_context_create(http_context, filter_context)
+        .expect_log(Some(LogLevel::Trace), None)
+        .execute_and_expect(ReturnType::None)
+        .unwrap();
 
-  request_headers_expectations(module, http_context);
+    request_headers_expectations(module, http_context);
 
-  // Request Body
-  let chat_completions_request_body = "\
+    // Request Body
+    let chat_completions_request_body = "\
 {\
-  \"messages\": [\
-  {\
-      \"role\": \"system\",\
-      \"content\": \"You are a poetic assistant, skilled in explaining complex programming concepts with creative flair.\"\
-  },\
-  {\
-      \"role\": \"user\",\
-      \"content\": \"Compose a poem that explains the concept of recursion in programming.\"\
-  }\
-  ],\
-  \"model\": \"gpt-4\"\
+    \"messages\": [\
+    {\
+        \"role\": \"system\",\
+        \"content\": \"You are a poetic assistant, skilled in explaining complex programming concepts with creative flair.\"\
+    },\
+    {\
+        \"role\": \"user\",\
+        \"content\": \"Compose a poem that explains the concept of recursion in programming.\"\
+    }\
+    ],\
+    \"model\": \"gpt-4\"\
 }";
 
-  module
-      .call_proxy_on_request_body(
-          http_context,
-          chat_completions_request_body.len() as i32,
-          true,
-      )
-      .expect_get_buffer_bytes(Some(BufferType::HttpRequestBody))
-      .returning(Some(chat_completions_request_body))
-      // The actual call is not important in this test, we just need to grab the token_id
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_http_call(
-          Some("arch_internal"),
-          Some(vec![
-              ("x-arch-upstream", "model_server"),
-              (":method", "POST"),
-              (":path", "/function_calling"),
-              ("content-type", "application/json"),
-              (":authority", "model_server"),
-          ]),
-          None,
-          None,
-          None,
-      )
-      .returning(Some(1))
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_log(Some(LogLevel::Debug), None)
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_metric_increment("active_http_calls", 1)
-      .execute_and_expect(ReturnType::Action(Action::Pause))
-      .unwrap();
+    module
+        .call_proxy_on_request_body(
+            http_context,
+            chat_completions_request_body.len() as i32,
+            true,
+        )
+        .expect_get_buffer_bytes(Some(BufferType::HttpRequestBody))
+        .returning(Some(chat_completions_request_body))
+        // The actual call is not important in this test, we just need to grab the token_id
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_http_call(
+            Some("arch_internal"),
+            Some(vec![
+                ("x-arch-upstream", "model_server"),
+                (":method", "POST"),
+                (":path", "/function_calling"),
+                ("content-type", "application/json"),
+                (":authority", "model_server"),
+            ]),
+            None,
+            None,
+            None,
+        )
+        .returning(Some(1))
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_log(Some(LogLevel::Debug), None)
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_metric_increment("active_http_calls", 1)
+        .execute_and_expect(ReturnType::Action(Action::Pause))
+        .unwrap();
 }
 
 fn setup_filter(module: &mut Tester, config: &str) -> i32 {
-  let filter_context = 1;
+    let filter_context = 1;
 
-  module
-      .call_proxy_on_context_create(filter_context, 0)
-      .expect_metric_creation(MetricType::Gauge, "active_http_calls")
-      .execute_and_expect(ReturnType::None)
-      .unwrap();
+    module
+        .call_proxy_on_context_create(filter_context, 0)
+        .expect_metric_creation(MetricType::Gauge, "active_http_calls")
+        .execute_and_expect(ReturnType::None)
+        .unwrap();
 
-  module
-      .call_proxy_on_configure(filter_context, config.len() as i32)
-      .expect_get_buffer_bytes(Some(BufferType::PluginConfiguration))
-      .returning(Some(config))
-      .execute_and_expect(ReturnType::Bool(true))
-      .unwrap();
+    module
+        .call_proxy_on_configure(filter_context, config.len() as i32)
+        .expect_get_buffer_bytes(Some(BufferType::PluginConfiguration))
+        .returning(Some(config))
+        .execute_and_expect(ReturnType::Bool(true))
+        .unwrap();
 
-  filter_context
+    filter_context
 }
 
 fn default_config() -> &'static str {
-  r#"
+    r#"
 version: "0.1-beta"
 
 listener:
-address: 0.0.0.0
-port: 10000
-message_format: huggingface
-connect_timeout: 0.005s
-
-endpoints:
-api_server:
-  endpoint: api_server:80
+  address: 0.0.0.0
+  port: 10000
+  message_format: huggingface
   connect_timeout: 0.005s
 
+endpoints:
+  api_server:
+    endpoint: api_server:80
+    connect_timeout: 0.005s
+
 llm_providers:
-- name: open-ai-gpt-4
-  provider_interface: openai
-  access_key: secret_key
-  model: gpt-4
-  default: true
+  - name: open-ai-gpt-4
+    provider_interface: openai
+    access_key: secret_key
+    model: gpt-4
+    default: true
 
 overrides:
-# confidence threshold for prompt target intent matching
-prompt_target_intent_matching_threshold: 0.0
+  # confidence threshold for prompt target intent matching
+  prompt_target_intent_matching_threshold: 0.0
 
 system_prompt: |
-You are a helpful assistant.
+  You are a helpful assistant.
 
 prompt_guards:
-input_guards:
-  jailbreak:
-    on_exception:
-      message: "Looks like you're curious about my abilities, but I can only provide assistance within my programmed parameters."
+  input_guards:
+    jailbreak:
+      on_exception:
+        message: "Looks like you're curious about my abilities, but I can only provide assistance within my programmed parameters."
 
 prompt_targets:
-- name: weather_forecast
-  description: This function provides realtime weather forecast information for a given city.
-  parameters:
-    - name: city
-      required: true
-      description: The city for which the weather forecast is requested.
-    - name: days
-      description: The number of days for which the weather forecast is requested.
-    - name: units
-      description: The units in which the weather forecast is requested.
-  endpoint:
-    name: api_server
-    path: /weather
-    http_method: POST
-  system_prompt: |
-    You are a helpful weather forecaster. Use weater data that is provided to you. Please following following guidelines when responding to user queries:
-    - Use farenheight for temperature
-    - Use miles per hour for wind speed
+  - name: weather_forecast
+    description: This function provides realtime weather forecast information for a given city.
+    parameters:
+      - name: city
+        required: true
+        description: The city for which the weather forecast is requested.
+      - name: days
+        description: The number of days for which the weather forecast is requested.
+      - name: units
+        description: The units in which the weather forecast is requested.
+    endpoint:
+      name: api_server
+      path: /weather
+      http_method: POST
+    system_prompt: |
+      You are a helpful weather forecaster. Use weater data that is provided to you. Please following following guidelines when responding to user queries:
+      - Use farenheight for temperature
+      - Use miles per hour for wind speed
 
 ratelimits:
-- model: gpt-4
-  selector:
-    key: selector-key
-    value: selector-value
-  limit:
-    tokens: 1
-    unit: minute
+  - model: gpt-4
+    selector:
+      key: selector-key
+      value: selector-value
+    limit:
+      tokens: 1
+      unit: minute
 "#
 }
 
 #[test]
 #[serial]
 fn prompt_gateway_successful_request_to_open_ai_chat_completions() {
-  let args = tester::MockSettings {
-      wasm_path: wasm_module(),
-      quiet: false,
-      allow_unexpected: false,
-  };
-  let mut module = tester::mock(args).unwrap();
+    let args = tester::MockSettings {
+        wasm_path: wasm_module(),
+        quiet: false,
+        allow_unexpected: false,
+    };
+    let mut module = tester::mock(args).unwrap();
 
-  module
-      .call_start()
-      .execute_and_expect(ReturnType::None)
-      .unwrap();
+    module
+        .call_start()
+        .execute_and_expect(ReturnType::None)
+        .unwrap();
 
-  // Setup Filter
-  let filter_context = setup_filter(&mut module, default_config());
+    // Setup Filter
+    let filter_context = setup_filter(&mut module, default_config());
 
-  // Setup HTTP Stream
-  let http_context = 2;
+    // Setup HTTP Stream
+    let http_context = 2;
 
-  module
-      .call_proxy_on_context_create(http_context, filter_context)
-      .expect_log(Some(LogLevel::Trace), None)
-      .execute_and_expect(ReturnType::None)
-      .unwrap();
+    module
+        .call_proxy_on_context_create(http_context, filter_context)
+        .expect_log(Some(LogLevel::Trace), None)
+        .execute_and_expect(ReturnType::None)
+        .unwrap();
 
-  request_headers_expectations(&mut module, http_context);
+    request_headers_expectations(&mut module, http_context);
 
-  // Request Body
-  let chat_completions_request_body = "\
-  {\
-      \"messages\": [\
-      {\
-          \"role\": \"system\",\
-          \"content\": \"You are a poetic assistant, skilled in explaining complex programming concepts with creative flair.\"\
-      },\
-      {\
-          \"role\": \"user\",\
-          \"content\": \"Compose a poem that explains the concept of recursion in programming.\"\
-      }\
-      ],\
-      \"model\": \"gpt-4\"\
-  }";
+    // Request Body
+    let chat_completions_request_body = "\
+    {\
+        \"messages\": [\
+        {\
+            \"role\": \"system\",\
+            \"content\": \"You are a poetic assistant, skilled in explaining complex programming concepts with creative flair.\"\
+        },\
+        {\
+            \"role\": \"user\",\
+            \"content\": \"Compose a poem that explains the concept of recursion in programming.\"\
+        }\
+        ],\
+        \"model\": \"gpt-4\"\
+    }";
 
-  module
-      .call_proxy_on_request_body(
-          http_context,
-          chat_completions_request_body.len() as i32,
-          true,
-      )
-      .expect_get_buffer_bytes(Some(BufferType::HttpRequestBody))
-      .returning(Some(chat_completions_request_body))
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_log(Some(LogLevel::Debug), None)
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_http_call(Some("arch_internal"), None, None, None, None)
-      .returning(Some(4))
-      .expect_metric_increment("active_http_calls", 1)
-      .execute_and_expect(ReturnType::Action(Action::Pause))
-      .unwrap();
+    module
+        .call_proxy_on_request_body(
+            http_context,
+            chat_completions_request_body.len() as i32,
+            true,
+        )
+        .expect_get_buffer_bytes(Some(BufferType::HttpRequestBody))
+        .returning(Some(chat_completions_request_body))
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_log(Some(LogLevel::Debug), None)
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_http_call(Some("arch_internal"), None, None, None, None)
+        .returning(Some(4))
+        .expect_metric_increment("active_http_calls", 1)
+        .execute_and_expect(ReturnType::Action(Action::Pause))
+        .unwrap();
 }
 
 #[test]
 #[serial]
 fn prompt_gateway_bad_request_to_open_ai_chat_completions() {
-  let args = tester::MockSettings {
-      wasm_path: wasm_module(),
-      quiet: false,
-      allow_unexpected: false,
-  };
-  let mut module = tester::mock(args).unwrap();
+    let args = tester::MockSettings {
+        wasm_path: wasm_module(),
+        quiet: false,
+        allow_unexpected: false,
+    };
+    let mut module = tester::mock(args).unwrap();
 
-  module
-      .call_start()
-      .execute_and_expect(ReturnType::None)
-      .unwrap();
+    module
+        .call_start()
+        .execute_and_expect(ReturnType::None)
+        .unwrap();
 
-  // Setup Filter
-  let filter_context = setup_filter(&mut module, default_config());
+    // Setup Filter
+    let filter_context = setup_filter(&mut module, default_config());
 
-  // Setup HTTP Stream
-  let http_context = 2;
+    // Setup HTTP Stream
+    let http_context = 2;
 
-  module
-      .call_proxy_on_context_create(http_context, filter_context)
-      .expect_log(Some(LogLevel::Trace), None)
-      .execute_and_expect(ReturnType::None)
-      .unwrap();
+    module
+        .call_proxy_on_context_create(http_context, filter_context)
+        .expect_log(Some(LogLevel::Trace), None)
+        .execute_and_expect(ReturnType::None)
+        .unwrap();
 
-  request_headers_expectations(&mut module, http_context);
+    request_headers_expectations(&mut module, http_context);
 
-  // Request Body
-  let incomplete_chat_completions_request_body = "\
-  {\
-      \"messages\": [\
-      {\
-          \"role\": \"system\",\
-      },\
-      {\
-          \"role\": \"user\",\
-          \"content\": \"Compose a poem that explains the concept of recursion in programming.\"\
-      }\
-      ]\
-  }";
+    // Request Body
+    let incomplete_chat_completions_request_body = "\
+    {\
+        \"messages\": [\
+        {\
+            \"role\": \"system\",\
+        },\
+        {\
+            \"role\": \"user\",\
+            \"content\": \"Compose a poem that explains the concept of recursion in programming.\"\
+        }\
+        ]\
+    }";
 
-  module
-      .call_proxy_on_request_body(
-          http_context,
-          incomplete_chat_completions_request_body.len() as i32,
-          true,
-      )
-      .expect_get_buffer_bytes(Some(BufferType::HttpRequestBody))
-      .returning(Some(incomplete_chat_completions_request_body))
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_send_local_response(
-          Some(StatusCode::BAD_REQUEST.as_u16().into()),
-          None,
-          None,
-          None,
-      )
-      .expect_log(Some(LogLevel::Trace), None)
-      .execute_and_expect(ReturnType::Action(Action::Pause))
-      .unwrap();
+    module
+        .call_proxy_on_request_body(
+            http_context,
+            incomplete_chat_completions_request_body.len() as i32,
+            true,
+        )
+        .expect_get_buffer_bytes(Some(BufferType::HttpRequestBody))
+        .returning(Some(incomplete_chat_completions_request_body))
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_send_local_response(
+            Some(StatusCode::BAD_REQUEST.as_u16().into()),
+            None,
+            None,
+            None,
+        )
+        .expect_log(Some(LogLevel::Trace), None)
+        .execute_and_expect(ReturnType::Action(Action::Pause))
+        .unwrap();
 }
 
 #[test]
 #[serial]
 fn prompt_gateway_request_to_llm_gateway() {
-  let args = tester::MockSettings {
-      wasm_path: wasm_module(),
-      quiet: false,
-      allow_unexpected: false,
-  };
-  let mut module = tester::mock(args).unwrap();
+    let args = tester::MockSettings {
+        wasm_path: wasm_module(),
+        quiet: false,
+        allow_unexpected: false,
+    };
+    let mut module = tester::mock(args).unwrap();
 
-  module
-      .call_start()
-      .execute_and_expect(ReturnType::None)
-      .unwrap();
+    module
+        .call_start()
+        .execute_and_expect(ReturnType::None)
+        .unwrap();
 
-  // Setup Filter
-  let mut config: Configuration = serde_yaml::from_str(default_config()).unwrap();
-  config.ratelimits.as_mut().unwrap()[0].limit.tokens += 1000;
-  let config_str = serde_json::to_string(&config).unwrap();
+    // Setup Filter
+    let mut config: Configuration = serde_yaml::from_str(default_config()).unwrap();
+    config.ratelimits.as_mut().unwrap()[0].limit.tokens += 1000;
+    let config_str = serde_json::to_string(&config).unwrap();
 
-  let filter_context = setup_filter(&mut module, &config_str);
+    let filter_context = setup_filter(&mut module, &config_str);
 
-  // Setup HTTP Stream
-  let http_context = 2;
+    // Setup HTTP Stream
+    let http_context = 2;
 
-  normal_flow(&mut module, filter_context, http_context);
+    normal_flow(&mut module, filter_context, http_context);
 
-  let arch_fc_resp = ChatCompletionsResponse {
-      usage: Some(Usage {
-          completion_tokens: 0,
-      }),
-      choices: vec![Choice {
-          finish_reason: Some("test".to_string()),
-          index: Some(0),
-          message: Message {
-              role: "system".to_string(),
-              content: None,
-              tool_calls: Some(vec![ToolCall {
-                  id: String::from("test"),
-                  tool_type: ToolType::Function,
-                  function: FunctionCallDetail {
-                      name: String::from("weather_forecast"),
-                      arguments: HashMap::from([(
-                          String::from("city"),
-                          Value::String(String::from("seattle")),
-                      )]),
-                  },
-              }]),
-              model: None,
-              tool_call_id: None,
-          },
-      }],
-      model: String::from("test"),
-      metadata: None,
-  };
+    let arch_fc_resp = ChatCompletionsResponse {
+        usage: Some(Usage {
+            completion_tokens: 0,
+        }),
+        choices: vec![Choice {
+            finish_reason: Some("test".to_string()),
+            index: Some(0),
+            message: Message {
+                role: "system".to_string(),
+                content: None,
+                tool_calls: Some(vec![ToolCall {
+                    id: String::from("test"),
+                    tool_type: ToolType::Function,
+                    function: FunctionCallDetail {
+                        name: String::from("weather_forecast"),
+                        arguments: HashMap::from([(
+                            String::from("city"),
+                            Value::String(String::from("seattle")),
+                        )]),
+                    },
+                }]),
+                model: None,
+                tool_call_id: None,
+            },
+        }],
+        model: String::from("test"),
+        metadata: None,
+    };
 
-  let expected_body = "{\"city\":\"seattle\"}";
-  let arch_fc_resp_str = serde_json::to_string(&arch_fc_resp).unwrap();
-  module
-      .call_proxy_on_http_call_response(http_context, 1, 0, arch_fc_resp_str.len() as i32, 0)
-      .expect_metric_increment("active_http_calls", -1)
-      .expect_get_buffer_bytes(Some(BufferType::HttpCallResponseBody))
-      .returning(Some(&arch_fc_resp_str))
-      .expect_log(Some(LogLevel::Warn), None)
-      .expect_log(Some(LogLevel::Debug), None)
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_log(Some(LogLevel::Debug), None)
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_http_call(
-          Some("arch_internal"),
-          Some(vec![
-              (":method", "POST"),
-              ("content-type", "application/json"),
-              ("x-arch-upstream", "api_server"),
-              (":authority", "api_server"),
-              ("x-envoy-max-retries", "3"),
-              (":path", "/weather"),
-          ]),
-          Some(expected_body),
-          None,
-          None,
-      )
-      .returning(Some(2))
-      .expect_metric_increment("active_http_calls", 1)
-      .execute_and_expect(ReturnType::None)
-      .unwrap();
+    let expected_body = "{\"city\":\"seattle\"}";
+    let arch_fc_resp_str = serde_json::to_string(&arch_fc_resp).unwrap();
+    module
+        .call_proxy_on_http_call_response(http_context, 1, 0, arch_fc_resp_str.len() as i32, 0)
+        .expect_metric_increment("active_http_calls", -1)
+        .expect_get_buffer_bytes(Some(BufferType::HttpCallResponseBody))
+        .returning(Some(&arch_fc_resp_str))
+        .expect_log(Some(LogLevel::Warn), None)
+        .expect_log(Some(LogLevel::Debug), None)
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_log(Some(LogLevel::Debug), None)
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_http_call(
+            Some("arch_internal"),
+            Some(vec![
+                (":method", "POST"),
+                ("content-type", "application/json"),
+                ("x-arch-upstream", "api_server"),
+                (":authority", "api_server"),
+                ("x-envoy-max-retries", "3"),
+                (":path", "/weather")
+            ]),
+            Some(expected_body),
+            None,
+            None,
+        )
+        .returning(Some(2))
+        .expect_metric_increment("active_http_calls", 1)
+        .execute_and_expect(ReturnType::None)
+        .unwrap();
 
-  let body_text = String::from("test body");
-  module
-      .call_proxy_on_http_call_response(http_context, 2, 0, body_text.len() as i32, 0)
-      .expect_metric_increment("active_http_calls", -1)
-      .expect_get_buffer_bytes(Some(BufferType::HttpCallResponseBody))
-      .returning(Some(&body_text))
-      .expect_log(Some(LogLevel::Debug), None)
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_log(Some(LogLevel::Debug), None)
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_get_header_map_value(Some(MapType::HttpCallResponseHeaders), Some(":status"))
-      .returning(Some("200"))
-      .expect_set_buffer_bytes(Some(BufferType::HttpRequestBody), None)
-      .execute_and_expect(ReturnType::None)
-      .unwrap();
+    let body_text = String::from("test body");
+    module
+        .call_proxy_on_http_call_response(http_context, 2, 0, body_text.len() as i32, 0)
+        .expect_metric_increment("active_http_calls", -1)
+        .expect_get_buffer_bytes(Some(BufferType::HttpCallResponseBody))
+        .returning(Some(&body_text))
+        .expect_log(Some(LogLevel::Debug), None)
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_log(Some(LogLevel::Debug), None)
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_get_header_map_value(Some(MapType::HttpCallResponseHeaders), Some(":status"))
+        .returning(Some("200"))
+        .expect_set_buffer_bytes(Some(BufferType::HttpRequestBody), None)
+        .execute_and_expect(ReturnType::None)
+        .unwrap();
 
-  let chat_completion_response = ChatCompletionsResponse {
-      usage: Some(Usage {
-          completion_tokens: 0,
-      }),
-      choices: vec![Choice {
-          finish_reason: Some("test".to_string()),
-          index: Some(0),
-          message: Message {
-              role: "assistant".to_string(),
-              content: Some("hello from fake llm gateway".to_string()),
-              model: None,
-              tool_calls: None,
-              tool_call_id: None,
-          },
-      }],
-      model: String::from("test"),
-      metadata: None,
-  };
+    let chat_completion_response = ChatCompletionsResponse {
+        usage: Some(Usage {
+            completion_tokens: 0,
+        }),
+        choices: vec![Choice {
+            finish_reason: Some("test".to_string()),
+            index: Some(0),
+            message: Message {
+                role: "assistant".to_string(),
+                content: Some("hello from fake llm gateway".to_string()),
+                model: None,
+                tool_calls: None,
+                tool_call_id: None,
+            },
+        }],
+        model: String::from("test"),
+        metadata: None,
+    };
 
-  let chat_completion_response_str = serde_json::to_string(&chat_completion_response).unwrap();
-  module
-      .call_proxy_on_response_body(
-          http_context,
-          chat_completion_response_str.len() as i32,
-          true,
-      )
-      .expect_get_buffer_bytes(Some(BufferType::HttpResponseBody))
-      .returning(Some(chat_completion_response_str.as_str()))
-      .expect_log(Some(LogLevel::Trace), None)
-      .expect_log(Some(LogLevel::Debug), None)
-      .expect_set_buffer_bytes(Some(BufferType::HttpResponseBody), None)
-      .expect_log(Some(LogLevel::Debug), None)
-      .expect_log(Some(LogLevel::Trace), None)
-      .execute_and_expect(ReturnType::Action(Action::Continue))
-      .unwrap();
+    let chat_completion_response_str = serde_json::to_string(&chat_completion_response).unwrap();
+    module
+        .call_proxy_on_response_body(
+            http_context,
+            chat_completion_response_str.len() as i32,
+            true,
+        )
+        .expect_get_buffer_bytes(Some(BufferType::HttpResponseBody))
+        .returning(Some(chat_completion_response_str.as_str()))
+        .expect_log(Some(LogLevel::Trace), None)
+        .expect_log(Some(LogLevel::Debug), None)
+        .expect_set_buffer_bytes(Some(BufferType::HttpResponseBody), None)
+        .expect_log(Some(LogLevel::Debug), None)
+        .expect_log(Some(LogLevel::Trace), None)
+        .execute_and_expect(ReturnType::Action(Action::Continue))
+        .unwrap();
 }