rename public_types => common and move common code there

2026-05-30 14:25:15 +02:00 · 2024-10-16 10:42:54 -07:00 · 2024-10-16 10:42:54 -07:00 · 93ea6e1a3d
commit 93ea6e1a3d
parent db202578d3
35 changed files with 458 additions and 791 deletions
--- a/crates/prompt_gateway/src/filter_context.rs
+++ b/crates/prompt_gateway/src/filter_context.rs
@ -1,25 +1,23 @@
-use crate::llm_providers::LlmProviders;
-use crate::ratelimit;
 use crate::stream_context::StreamContext;
+use common::common_types::EmbeddingType;
+use common::configuration::{Configuration, GatewayMode, Overrides, PromptGuards, PromptTarget};
+use common::consts::ARCH_INTERNAL_CLUSTER_NAME;
+use common::consts::ARCH_UPSTREAM_HOST_HEADER;
+use common::consts::DEFAULT_EMBEDDING_MODEL;
+use common::consts::MODEL_SERVER_NAME;
+use common::embeddings::{
+    CreateEmbeddingRequest, CreateEmbeddingRequestInput, CreateEmbeddingResponse,
+};
+use common::http::CallArgs;
+use common::http::Client;
+use common::llm_providers::LlmProviders;
+use common::ratelimit;
+use common::stats::Counter;
+use common::stats::Gauge;
+use common::stats::IncrementingMetric;
 use log::debug;
 use proxy_wasm::traits::*;
 use proxy_wasm::types::*;
-use public_types::common_types::EmbeddingType;
-use public_types::configuration::{
-    Configuration, GatewayMode, Overrides, PromptGuards, PromptTarget,
-};
-use public_types::consts::ARCH_INTERNAL_CLUSTER_NAME;
-use public_types::consts::ARCH_UPSTREAM_HOST_HEADER;
-use public_types::consts::DEFAULT_EMBEDDING_MODEL;
-use public_types::consts::MODEL_SERVER_NAME;
-use public_types::embeddings::{
-    CreateEmbeddingRequest, CreateEmbeddingRequestInput, CreateEmbeddingResponse,
-};
-use public_types::http::CallArgs;
-use public_types::http::Client;
-use public_types::stats::Counter;
-use public_types::stats::Gauge;
-use public_types::stats::IncrementingMetric;
 use std::cell::RefCell;
 use std::collections::hash_map::Entry;
 use std::collections::HashMap;
--- a/crates/prompt_gateway/src/lib.rs
+++ b/crates/prompt_gateway/src/lib.rs
@ -3,11 +3,7 @@ use proxy_wasm::traits::*;
 use proxy_wasm::types::*;

 mod filter_context;
-mod llm_providers;
-mod ratelimit;
-mod routing;
 mod stream_context;
-mod tokenizer;

 proxy_wasm::main! {{
    proxy_wasm::set_log_level(LogLevel::Trace);
--- a/crates/prompt_gateway/src/llm_providers.rs
+++ b/crates/prompt_gateway/src/llm_providers.rs
@ -1,69 +0,0 @@
-use public_types::configuration::LlmProvider;
-use std::collections::HashMap;
-use std::rc::Rc;
-
-#[derive(Debug)]
-pub struct LlmProviders {
-    providers: HashMap<String, Rc<LlmProvider>>,
-    default: Option<Rc<LlmProvider>>,
-}
-
-impl LlmProviders {
-    pub fn iter(&self) -> std::collections::hash_map::Iter<'_, String, Rc<LlmProvider>> {
-        self.providers.iter()
-    }
-
-    pub fn default(&self) -> Option<Rc<LlmProvider>> {
-        self.default.as_ref().map(|rc| rc.clone())
-    }
-
-    pub fn get(&self, name: &str) -> Option<Rc<LlmProvider>> {
-        self.providers.get(name).cloned()
-    }
-}
-
-#[derive(thiserror::Error, Debug)]
-pub enum LlmProvidersNewError {
-    #[error("There must be at least one LLM Provider")]
-    EmptySource,
-    #[error("There must be at most one default LLM Provider")]
-    MoreThanOneDefault,
-    #[error("\'{0}\' is not a unique name")]
-    DuplicateName(String),
-}
-
-impl TryFrom<Vec<LlmProvider>> for LlmProviders {
-    type Error = LlmProvidersNewError;
-
-    fn try_from(llm_providers_config: Vec<LlmProvider>) -> Result<Self, Self::Error> {
-        if llm_providers_config.is_empty() {
-            return Err(LlmProvidersNewError::EmptySource);
-        }
-
-        let mut llm_providers = LlmProviders {
-            providers: HashMap::new(),
-            default: None,
-        };
-
-        for llm_provider in llm_providers_config {
-            let llm_provider: Rc<LlmProvider> = Rc::new(llm_provider);
-            if llm_provider.default.unwrap_or_default() {
-                match llm_providers.default {
-                    Some(_) => return Err(LlmProvidersNewError::MoreThanOneDefault),
-                    None => llm_providers.default = Some(Rc::clone(&llm_provider)),
-                }
-            }
-
-            // Insert and check that there is no other provider with the same name.
-            let name = llm_provider.name.clone();
-            if llm_providers
-                .providers
-                .insert(name.clone(), llm_provider)
-                .is_some()
-            {
-                return Err(LlmProvidersNewError::DuplicateName(name));
-            }
-        }
-        Ok(llm_providers)
-    }
-}
--- a/crates/prompt_gateway/src/ratelimit.rs
+++ b/crates/prompt_gateway/src/ratelimit.rs
@ -1,450 +0,0 @@
-use governor::{DefaultKeyedRateLimiter, InsufficientCapacity, Quota};
-use log::debug;
-use public_types::configuration;
-use public_types::configuration::{Limit, Ratelimit, TimeUnit};
-use std::fmt::Display;
-use std::num::{NonZero, NonZeroU32};
-use std::sync::RwLock;
-use std::{collections::HashMap, sync::OnceLock};
-
-pub type RatelimitData = RwLock<RatelimitMap>;
-
-pub fn ratelimits(ratelimits_config: Option<Vec<Ratelimit>>) -> &'static RatelimitData {
-    static RATELIMIT_DATA: OnceLock<RatelimitData> = OnceLock::new();
-    RATELIMIT_DATA.get_or_init(|| {
-        RwLock::new(RatelimitMap::new(
-            ratelimits_config.expect("The initialization call has to have passed a config"),
-        ))
-    })
-}
-
-// The Data Structure is laid out in the following way:
-// Provider -> Hash { Header -> Limit }.
-// If the Header used to configure the given Limit:
-//   a) Has None value, then there will be N Limit keyed by the Header value.
-//   b) Has Some() value, then there will be 1 Limit keyed by the empty string.
-// It would have been nicer to use a non-keyed limit for b). However, the type system made that option a nightmare.
-pub struct RatelimitMap {
-    datastore: HashMap<String, HashMap<configuration::Header, DefaultKeyedRateLimiter<String>>>,
-}
-
-// This version of Header demands that the user passes a header value to match on.
-#[derive(Debug, Clone)]
-pub struct Header {
-    pub key: String,
-    pub value: String,
-}
-
-impl Display for Header {
-    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
-        write!(f, "{self:?}")
-    }
-}
-
-impl From<Header> for configuration::Header {
-    fn from(header: Header) -> Self {
-        Self {
-            key: header.key,
-            value: Some(header.value),
-        }
-    }
-}
-
-#[derive(Debug, thiserror::Error)]
-pub enum Error {
-    #[error("exceeded limit provider={provider}, selector={selector}, tokens_used={tokens_used}")]
-    ExceededLimit {
-        provider: String,
-        selector: Header,
-        tokens_used: NonZeroU32,
-    },
-}
-
-impl RatelimitMap {
-    // n.b new is private so that the only access to the Ratelimits can be done via the static
-    // reference inside a RwLock via ratelimit::ratelimits().
-    fn new(ratelimits_config: Vec<Ratelimit>) -> Self {
-        let mut new_ratelimit_map = RatelimitMap {
-            datastore: HashMap::new(),
-        };
-        for ratelimit_config in ratelimits_config {
-            let limit = DefaultKeyedRateLimiter::keyed(get_quota(ratelimit_config.limit));
-
-            match new_ratelimit_map.datastore.get_mut(&ratelimit_config.model) {
-                Some(limits) => match limits.get_mut(&ratelimit_config.selector) {
-                    Some(_) => {
-                        panic!("repeated selector. Selectors per provider must be unique")
-                    }
-                    None => {
-                        limits.insert(ratelimit_config.selector, limit);
-                    }
-                },
-                None => {
-                    // The provider has not been seen before.
-                    // Insert the provider and a new HashMap with the specified limit
-                    let new_hash_map = HashMap::from([(ratelimit_config.selector, limit)]);
-                    new_ratelimit_map
-                        .datastore
-                        .insert(ratelimit_config.model, new_hash_map);
-                }
-            }
-        }
-        new_ratelimit_map
-    }
-
-    #[allow(unused)]
-    pub fn check_limit(
-        &self,
-        provider: String,
-        selector: Header,
-        tokens_used: NonZeroU32,
-    ) -> Result<(), Error> {
-        debug!(
-            "Checking limit for provider={}, with selector={:?}, consuming tokens={:?}",
-            provider, selector, tokens_used
-        );
-
-        let provider_limits = match self.datastore.get(&provider) {
-            None => {
-                // No limit configured for this provider, hence ok.
-                return Ok(());
-            }
-            Some(limit) => limit,
-        };
-
-        let mut config_selector = configuration::Header::from(selector.clone());
-
-        let (limit, limit_key) = match provider_limits.get(&config_selector) {
-            // This is a specific limit, i.e one that was configured with both key, and value.
-            // Therefore, the key for the internal limit does not matter, and hence the empty string is always returned.
-            Some(limit) => (limit, String::from("")),
-            None => {
-                // Unwrap is ok here because we _know_ the value exists.
-                let header_key = config_selector.value.take().unwrap();
-                // Search for less specific limit, i.e, one that was configured without a value, therefore every Header
-                // value has its own key in the internal limit.
-                match provider_limits.get(&config_selector) {
-                    Some(limit) => (limit, header_key),
-                    // No limit for that header key, value pair exists within that provider limits.
-                    None => {
-                        return Ok(());
-                    }
-                }
-            }
-        };
-
-        match limit.check_key_n(&limit_key, tokens_used) {
-            Ok(Ok(())) => Ok(()),
-            Ok(Err(_)) | Err(InsufficientCapacity(_)) => Err(Error::ExceededLimit {
-                provider,
-                selector,
-                tokens_used,
-            }),
-        }
-    }
-}
-
-fn get_quota(limit: Limit) -> Quota {
-    let tokens = NonZero::new(limit.tokens).expect("Limit's tokens must be positive");
-    match limit.unit {
-        TimeUnit::Second => Quota::per_second(tokens),
-        TimeUnit::Minute => Quota::per_minute(tokens),
-        TimeUnit::Hour => Quota::per_hour(tokens),
-    }
-}
-
-// The following tests are inside the ratelimit module in order to access RatelimitMap::new() in order to provide
-// different configuration values per test.
-#[test]
-fn non_existent_provider_is_ok() {
-    let ratelimits_config = vec![Ratelimit {
-        model: String::from("provider"),
-        selector: configuration::Header {
-            key: String::from("only-key"),
-            value: None,
-        },
-        limit: Limit {
-            tokens: 100,
-            unit: TimeUnit::Minute,
-        },
-    }];
-
-    let ratelimits = RatelimitMap::new(ratelimits_config);
-
-    assert!(ratelimits
-        .check_limit(
-            String::from("non-existent-provider"),
-            Header {
-                key: String::from("key"),
-                value: String::from("value"),
-            },
-            NonZero::new(5000).unwrap(),
-        )
-        .is_ok())
-}
-
-#[test]
-fn non_existent_key_is_ok() {
-    let ratelimits_config = vec![Ratelimit {
-        model: String::from("provider"),
-        selector: configuration::Header {
-            key: String::from("only-key"),
-            value: None,
-        },
-        limit: Limit {
-            tokens: 100,
-            unit: TimeUnit::Minute,
-        },
-    }];
-
-    let ratelimits = RatelimitMap::new(ratelimits_config);
-
-    assert!(ratelimits
-        .check_limit(
-            String::from("provider"),
-            Header {
-                key: String::from("key"),
-                value: String::from("value"),
-            },
-            NonZero::new(5000).unwrap(),
-        )
-        .is_ok())
-}
-
-#[test]
-fn specific_limit_does_not_catch_non_specific_value() {
-    let ratelimits_config = vec![Ratelimit {
-        model: String::from("provider"),
-        selector: configuration::Header {
-            key: String::from("key"),
-            value: Some(String::from("value")),
-        },
-        limit: Limit {
-            tokens: 200,
-            unit: TimeUnit::Second,
-        },
-    }];
-
-    let ratelimits = RatelimitMap::new(ratelimits_config);
-
-    assert!(ratelimits
-        .check_limit(
-            String::from("provider"),
-            Header {
-                key: String::from("key"),
-                value: String::from("not-the-correct-value"),
-            },
-            NonZero::new(5000).unwrap(),
-        )
-        .is_ok())
-}
-
-#[test]
-fn specific_limit_is_hit() {
-    let ratelimits_config = vec![Ratelimit {
-        model: String::from("provider"),
-        selector: configuration::Header {
-            key: String::from("key"),
-            value: Some(String::from("value")),
-        },
-        limit: Limit {
-            tokens: 200,
-            unit: TimeUnit::Hour,
-        },
-    }];
-
-    let ratelimits = RatelimitMap::new(ratelimits_config);
-
-    assert!(ratelimits
-        .check_limit(
-            String::from("provider"),
-            Header {
-                key: String::from("key"),
-                value: String::from("value"),
-            },
-            NonZero::new(5000).unwrap(),
-        )
-        .is_err())
-}
-
-#[test]
-fn non_specific_key_has_different_limits_for_different_values() {
-    let ratelimits_config = vec![Ratelimit {
-        model: String::from("provider"),
-        selector: configuration::Header {
-            key: String::from("only-key"),
-            value: None,
-        },
-        limit: Limit {
-            tokens: 100,
-            unit: TimeUnit::Hour,
-        },
-    }];
-
-    let ratelimits = RatelimitMap::new(ratelimits_config);
-
-    // Value1 takes 50.
-    assert!(ratelimits
-        .check_limit(
-            String::from("provider"),
-            Header {
-                key: String::from("only-key"),
-                value: String::from("value1"),
-            },
-            NonZero::new(50).unwrap(),
-        )
-        .is_ok());
-
-    // value2 takes 60 because it has its own 100 limit
-    assert!(ratelimits
-        .check_limit(
-            String::from("provider"),
-            Header {
-                key: String::from("only-key"),
-                value: String::from("value2"),
-            },
-            NonZero::new(60).unwrap(),
-        )
-        .is_ok());
-
-    // However value1 cannot take more than 100 per hour which 50+70 = 120
-    assert!(ratelimits
-        .check_limit(
-            String::from("provider"),
-            Header {
-                key: String::from("only-key"),
-                value: String::from("value1"),
-            },
-            NonZero::new(70).unwrap(),
-        )
-        .is_err())
-}
-
-#[test]
-fn different_provider_can_have_different_limits_with_the_same_keys() {
-    let ratelimits_config = vec![
-        Ratelimit {
-            model: String::from("first_provider"),
-            selector: configuration::Header {
-                key: String::from("key"),
-                value: Some(String::from("value")),
-            },
-            limit: Limit {
-                tokens: 100,
-                unit: TimeUnit::Hour,
-            },
-        },
-        Ratelimit {
-            model: String::from("second_provider"),
-            selector: configuration::Header {
-                key: String::from("key"),
-                value: Some(String::from("value")),
-            },
-            limit: Limit {
-                tokens: 200,
-                unit: TimeUnit::Hour,
-            },
-        },
-    ];
-
-    let ratelimits = RatelimitMap::new(ratelimits_config);
-
-    assert!(ratelimits
-        .check_limit(
-            String::from("first_provider"),
-            Header {
-                key: String::from("key"),
-                value: String::from("value"),
-            },
-            NonZero::new(100).unwrap(),
-        )
-        .is_ok());
-
-    assert!(ratelimits
-        .check_limit(
-            String::from("second_provider"),
-            Header {
-                key: String::from("key"),
-                value: String::from("value"),
-            },
-            NonZero::new(200).unwrap(),
-        )
-        .is_ok());
-
-    assert!(ratelimits
-        .check_limit(
-            String::from("first_provider"),
-            Header {
-                key: String::from("key"),
-                value: String::from("value"),
-            },
-            NonZero::new(1).unwrap(),
-        )
-        .is_err());
-
-    assert!(ratelimits
-        .check_limit(
-            String::from("second_provider"),
-            Header {
-                key: String::from("key"),
-                value: String::from("value"),
-            },
-            NonZero::new(1).unwrap(),
-        )
-        .is_err());
-}
-
-// These tests use the publicly exposed static singleton, thus the same configuration is used in every test.
-// If more tests are written here, move the initial call out of the test.
-#[cfg(test)]
-mod test {
-    use super::ratelimits;
-    use configuration::{Limit, Ratelimit, TimeUnit};
-    use public_types::configuration;
-    use std::num::NonZero;
-    use std::thread;
-
-    #[test]
-    fn make_ratelimits_optional() {
-        let ratelimits_config = Vec::new();
-
-        // Initialize in the main thread.
-        ratelimits(Some(ratelimits_config));
-    }
-
-    #[test]
-    fn different_threads_have_same_ratelimit_data_structure() {
-        let ratelimits_config = Some(vec![Ratelimit {
-            model: String::from("provider"),
-            selector: configuration::Header {
-                key: String::from("key"),
-                value: Some(String::from("value")),
-            },
-            limit: Limit {
-                tokens: 200,
-                unit: TimeUnit::Hour,
-            },
-        }]);
-
-        // Initialize in the main thread.
-        ratelimits(ratelimits_config);
-
-        // Use the singleton in a different thread.
-        thread::spawn(|| {
-            let ratelimits = ratelimits(None);
-
-            assert!(ratelimits
-                .read()
-                .unwrap()
-                .check_limit(
-                    String::from("provider"),
-                    super::Header {
-                        key: String::from("key"),
-                        value: String::from("value"),
-                    },
-                    NonZero::new(5000).unwrap(),
-                )
-                .is_err())
-        });
-    }
-}
--- a/crates/prompt_gateway/src/routing.rs
+++ b/crates/prompt_gateway/src/routing.rs
@ -1,50 +0,0 @@
-use std::rc::Rc;
-
-use crate::llm_providers::LlmProviders;
-use log::debug;
-use public_types::configuration::LlmProvider;
-use rand::{seq::IteratorRandom, thread_rng};
-
-#[derive(Debug)]
-pub enum ProviderHint {
-    Default,
-    Name(String),
-}
-
-impl From<String> for ProviderHint {
-    fn from(value: String) -> Self {
-        match value.as_str() {
-            "default" => ProviderHint::Default,
-            _ => ProviderHint::Name(value),
-        }
-    }
-}
-
-pub fn get_llm_provider(
-    llm_providers: &LlmProviders,
-    provider_hint: Option<ProviderHint>,
-) -> Rc<LlmProvider> {
-    let maybe_provider = provider_hint.and_then(|hint| match hint {
-        ProviderHint::Default => llm_providers.default(),
-        // FIXME: should a non-existent name in the hint be more explicit? i.e, return a BAD_REQUEST?
-        ProviderHint::Name(name) => llm_providers.get(&name),
-    });
-
-    if let Some(provider) = maybe_provider {
-        return provider;
-    }
-
-    if llm_providers.default().is_some() {
-        debug!("no llm provider found for hint, using default llm provider");
-        return llm_providers.default().unwrap();
-    }
-
-    debug!("no default llm found, using random llm provider");
-    let mut rng = thread_rng();
-    llm_providers
-        .iter()
-        .choose(&mut rng)
-        .expect("There should always be at least one llm provider")
-        .1
-        .clone()
-}
--- a/crates/prompt_gateway/src/stream_context.rs
+++ b/crates/prompt_gateway/src/stream_context.rs
@ -1,25 +1,18 @@
 use crate::filter_context::{EmbeddingsStore, WasmMetrics};
-use crate::llm_providers::LlmProviders;
-use crate::ratelimit::Header;
-use crate::{ratelimit, routing, tokenizer};
 use acap::cos;
-use http::StatusCode;
-use log::{debug, info, warn};
-use proxy_wasm::traits::*;
-use proxy_wasm::types::*;
-use public_types::common_types::open_ai::{
+use common::common_types::open_ai::{
    ArchState, ChatCompletionChunkResponse, ChatCompletionTool, ChatCompletionsRequest,
    ChatCompletionsResponse, Choice, FunctionDefinition, FunctionParameter, FunctionParameters,
    Message, ParameterType, StreamOptions, ToolCall, ToolCallState, ToolType,
 };
-use public_types::common_types::{
+use common::common_types::{
    EmbeddingType, HallucinationClassificationRequest, HallucinationClassificationResponse,
    PromptGuardRequest, PromptGuardResponse, PromptGuardTask, ZeroShotClassificationRequest,
    ZeroShotClassificationResponse,
 };
-use public_types::configuration::{GatewayMode, LlmProvider};
-use public_types::configuration::{Overrides, PromptGuards, PromptTarget};
-use public_types::consts::{
+use common::configuration::{GatewayMode, LlmProvider};
+use common::configuration::{Overrides, PromptGuards, PromptTarget};
+use common::consts::{
    ARCH_FC_MODEL_NAME, ARCH_FC_REQUEST_TIMEOUT_MS, ARCH_INTERNAL_CLUSTER_NAME,
    ARCH_LLM_UPSTREAM_LISTENER, ARCH_MESSAGES_KEY, ARCH_MODEL_PREFIX, ARCH_PROVIDER_HINT_HEADER,
    ARCH_ROUTING_HEADER, ARCH_STATE_HEADER, ARCH_UPSTREAM_HOST_HEADER, ARC_FC_CLUSTER,
@ -27,11 +20,18 @@ use public_types::consts::{
    DEFAULT_INTENT_MODEL, DEFAULT_PROMPT_TARGET_THRESHOLD, GPT_35_TURBO, MODEL_SERVER_NAME,
    RATELIMIT_SELECTOR_HEADER_KEY, REQUEST_ID_HEADER, SYSTEM_ROLE, USER_ROLE,
 };
-use public_types::embeddings::{
+use common::embeddings::{
    CreateEmbeddingRequest, CreateEmbeddingRequestInput, CreateEmbeddingResponse,
 };
-use public_types::http::{CallArgs, Client, ClientError};
-use public_types::stats::Gauge;
+use common::http::{CallArgs, Client, ClientError};
+use common::llm_providers::LlmProviders;
+use common::ratelimit::Header;
+use common::stats::Gauge;
+use common::{ratelimit, routing, tokenizer};
+use http::StatusCode;
+use log::{debug, info, warn};
+use proxy_wasm::traits::*;
+use proxy_wasm::types::*;
 use serde_json::Value;
 use sha2::{Digest, Sha256};
 use std::cell::RefCell;
@ -40,7 +40,7 @@ use std::num::NonZero;
 use std::rc::Rc;
 use std::time::Duration;

-use public_types::stats::IncrementingMetric;
+use common::stats::IncrementingMetric;

 #[derive(Debug, Clone)]
 enum ResponseHandlerType {
@ -1280,7 +1280,7 @@ impl HttpContext for StreamContext {
        let prompt_guard_jailbreak_task = self
            .prompt_guards
            .input_guards
-            .contains_key(&public_types::configuration::GuardType::Jailbreak);
+            .contains_key(&common::configuration::GuardType::Jailbreak);

        self.chat_completions_request = Some(deserialized_body);

--- a/crates/prompt_gateway/src/tokenizer.rs
+++ b/crates/prompt_gateway/src/tokenizer.rs
@ -1,39 +0,0 @@
-use log::debug;
-
-#[derive(Debug, PartialEq, Eq)]
-#[allow(dead_code)]
-pub enum Error {
-    UnknownModel,
-    FailedToTokenize,
-}
-
-#[allow(dead_code)]
-pub fn token_count(model_name: &str, text: &str) -> Result<usize, Error> {
-    debug!("getting token count model={}", model_name);
-    // Consideration: is it more expensive to instantiate the BPE object every time, or to contend the singleton?
-    let bpe = tiktoken_rs::get_bpe_from_model(model_name).map_err(|_| Error::UnknownModel)?;
-    Ok(bpe.encode_ordinary(text).len())
-}
-
-#[cfg(test)]
-mod test {
-    use super::*;
-
-    #[test]
-    fn encode_ordinary() {
-        let model_name = "gpt-3.5-turbo";
-        let text = "How many tokens does this sentence have?";
-        assert_eq!(
-            8,
-            token_count(model_name, text).expect("correct tokenization")
-        );
-    }
-
-    #[test]
-    fn unrecognized_model() {
-        assert_eq!(
-            Error::UnknownModel,
-            token_count("unknown", "").expect_err("unknown model")
-        )
-    }
-}