mztlive 2025-04-19 01:53:28 +00:00 committed by GitHub
commit 31ba7a5968
6 changed files with 441 additions and 0 deletions

View File

@@ -127,3 +127,8 @@ required-features = ["audio"]
[[example]]
name = "hyperbolic_audio_generation"
required-features = ["audio"]
[[example]]
name = "aliyun_embeddings"
required-features = ["derive"]

View File

@@ -0,0 +1,30 @@
use rig::providers::aliyun;
use rig::Embed;
#[derive(Embed, Debug)]
struct Greetings {
#[embed]
message: String,
}
#[tokio::main]
async fn main() -> Result<(), anyhow::Error> {
// Initialize the Aliyun client
let client = aliyun::Client::from_env();
let embeddings = client
.embeddings(aliyun::embedding::EMBEDDING_V1)
.document(Greetings {
message: "Hello, world!".to_string(),
})?
.document(Greetings {
message: "Goodbye, world!".to_string(),
})?
.build()
.await
.expect("Failed to embed documents");
println!("{:?}", embeddings);
Ok(())
}
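// To try this example locally (a hedged guess at the usual rig layout; adjust the
// package/feature flags to your checkout), something like the following should work
// once a valid DashScope key is exported:
//
//     DASHSCOPE_API_KEY=sk-your-key cargo run --example aliyun_embeddings --features derive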

View File

@@ -0,0 +1,162 @@
use crate::{
embeddings::{self},
Embed,
};
use serde::Deserialize;
use super::embedding::EmbeddingModel;
// ================================================================
// Aliyun Client
// ================================================================
const ALIYUN_API_BASE_URL: &str = "https://dashscope.aliyuncs.com";
#[derive(Clone)]
pub struct Client {
base_url: String,
api_key: String,
http_client: reqwest::Client,
}
impl Client {
/// Create a new Aliyun client with the given API key.
///
/// # Example
/// ```
/// use rig::providers::aliyun::Client;
///
/// // Initialize the Aliyun client
/// let aliyun = Client::new("your-dashscope-api-key");
/// ```
pub fn new(api_key: &str) -> Self {
Self::from_url(api_key, ALIYUN_API_BASE_URL)
}
/// Create a new Aliyun client with the given API key and base URL.
///
/// # Example
/// ```
/// use rig::providers::aliyun::Client;
///
/// // Initialize the Aliyun client with a custom base URL
/// let aliyun = Client::from_url("your-dashscope-api-key", "https://custom-dashscope-url.com");
/// ```
pub fn from_url(api_key: &str, base_url: &str) -> Self {
Self {
base_url: base_url.to_string(),
api_key: api_key.to_string(),
http_client: reqwest::Client::builder()
.default_headers({
let mut headers = reqwest::header::HeaderMap::new();
headers.insert(
reqwest::header::CONTENT_TYPE,
"application/json".parse().unwrap(),
);
headers
})
.build()
.expect("Aliyun reqwest client should build"),
}
}
/// Create a new Aliyun client from the `DASHSCOPE_API_KEY` environment variable.
/// Panics if the environment variable is not set.
///
/// # Example
/// ```
/// use rig::providers::aliyun::Client;
///
/// // Initialize the Aliyun client from environment variable
/// let aliyun = Client::from_env();
/// ```
/// # Panics
/// This function will panic if the `DASHSCOPE_API_KEY` environment variable is not set.
pub fn from_env() -> Self {
let api_key = std::env::var("DASHSCOPE_API_KEY").expect("DASHSCOPE_API_KEY not set");
Self::new(&api_key)
}
/// Create a POST request to the specified API endpoint path.
/// The Authorization header with the API key will be automatically added.
///
/// # Arguments
/// * `path` - The API endpoint path to append to the base URL
///
/// # Returns
/// A reqwest::RequestBuilder instance that can be further customized before sending
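///
/// # Example (illustrative sketch, not part of the original commit)
/// ```
/// use rig::providers::aliyun::Client;
///
/// let aliyun = Client::new("your-dashscope-api-key");
/// // Illustrative endpoint path; building the request does not send it.
/// let request = aliyun.post("compatible-mode/v1/embeddings");
/// ```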
pub fn post(&self, path: &str) -> reqwest::RequestBuilder {
// Join the base URL and endpoint path without mangling the "//" in the scheme.
let url = format!("{}/{}", self.base_url.trim_end_matches('/'), path.trim_start_matches('/'));
tracing::debug!("POST {}", url);
self.http_client
.post(url)
.header("Authorization", format!("Bearer {}", self.api_key))
}
/// Create an embedding model with the given name.
/// Note: if the model is not known to rig, a default embedding dimension of 0 is used.
/// In that case, prefer `embedding_model_with_ndims` and pass the dimensions explicitly.
///
/// # Example
/// ```
/// use rig::providers::aliyun::{Client, self};
///
/// // Initialize the Aliyun client
/// let aliyun = Client::new("your-dashscope-api-key");
///
/// let embedding_model = aliyun.embedding_model("your-model-name");
/// ```
pub fn embedding_model(&self, model: &str) -> EmbeddingModel {
EmbeddingModel::new(self.clone(), model, None)
}
/// Create an embedding model with the given name and the number of dimensions in the embedding generated by the model.
///
/// # Example
/// ```
/// use rig::providers::aliyun::{Client, self};
///
/// // Initialize the Aliyun client
/// let aliyun = Client::new("your-dashscope-api-key");
///
/// let embedding_model = aliyun.embedding_model_with_ndims("model-unknown-to-rig", 1024);
/// ```
pub fn embedding_model_with_ndims(&self, model: &str, ndims: usize) -> EmbeddingModel {
EmbeddingModel::new(self.clone(), model, Some(ndims))
}
/// Create an embedding builder with the given embedding model.
///
/// # Example
/// ```
/// use rig::providers::aliyun::{Client, self};
///
/// // Initialize the Aliyun client
/// let aliyun = Client::new("your-dashscope-api-key");
///
/// let embeddings = aliyun.embeddings("your-model-name")
///     .document("Hello, world!".to_string())?
///     .document("Goodbye, world!".to_string())?
///     .build()
///     .await
///     .expect("Failed to embed documents");
/// ```
pub fn embeddings<D: Embed>(
&self,
model: &str,
) -> embeddings::EmbeddingsBuilder<EmbeddingModel, D> {
embeddings::EmbeddingsBuilder::new(self.embedding_model(model))
}
}
#[derive(Debug, Deserialize)]
pub struct ApiErrorResponse {
pub message: String,
}
#[derive(Debug, Deserialize)]
#[serde(untagged)]
pub enum ApiResponse<T> {
Ok(T),
Err(ApiErrorResponse),
}
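// Hedged sketch added for illustration (not part of the original commit): because
// ApiResponse is #[serde(untagged)], serde tries the Ok variant first and falls back
// to Err, so a DashScope error body such as {"message": "..."} still deserializes.
#[cfg(test)]
mod tests {
    use super::ApiResponse;
    use serde::Deserialize;

    // Minimal stand-in for a success payload; only used by this test.
    #[derive(Debug, Deserialize)]
    struct Dummy {
        data: Vec<f64>,
    }

    #[test]
    fn untagged_response_decodes_success_and_error_bodies() {
        let ok: ApiResponse<Dummy> = serde_json::from_str(r#"{"data": [0.1, 0.2]}"#).unwrap();
        assert!(matches!(ok, ApiResponse::Ok(_)));

        let err: ApiResponse<Dummy> = serde_json::from_str(r#"{"message": "Invalid API key"}"#).unwrap();
        match err {
            ApiResponse::Err(e) => assert_eq!(e.message, "Invalid API key"),
            ApiResponse::Ok(_) => panic!("expected the error variant"),
        }
    }
}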

View File

@@ -0,0 +1,239 @@
// ================================================================
//! Aliyun Embedding API Integration
//! Implementation of Aliyun embedding models for text vectorization
//! API reference: https://help.aliyun.com/zh/model-studio/developer-reference/text-embedding-synchronous-api
// ================================================================
use serde_json::json;
use crate::embeddings::{self, EmbeddingError};
use super::client::{ApiResponse, Client};
// Available embedding models provided by Aliyun
pub const EMBEDDING_V1: &str = "text-embedding-v1";
pub const EMBEDDING_V2: &str = "text-embedding-v2";
pub const EMBEDDING_V3: &str = "text-embedding-v3";
/// Aliyun embedding model implementation
#[derive(Clone)]
pub struct EmbeddingModel {
client: Client,
model: String,
ndims: Option<usize>,
}
impl EmbeddingModel {
/// Creates a new instance of the Aliyun embedding model
///
/// # Arguments
/// * `client` - The Aliyun API client
/// * `model` - The model identifier (e.g., "text-embedding-v1")
/// * `ndims` - Optional custom dimension size for the embedding output
pub fn new(client: Client, model: &str, ndims: Option<usize>) -> Self {
Self {
client,
model: model.to_string(),
ndims,
}
}
}
impl EmbeddingModel {
/// Returns the maximum number of documents supported by the model
///
/// # Returns
/// * For EMBEDDING_V3 model: 10 documents maximum
/// * For other models: 25 documents maximum
fn max_documents(&self) -> usize {
match self.model.as_str() {
EMBEDDING_V3 => 10,
_ => 25,
}
}
/// Returns the maximum number of tokens per document supported by the model
///
/// # Returns
/// * For EMBEDDING_V3 model: 8192 tokens per document
/// * For other models: 2048 tokens per document
fn max_tokens(&self) -> usize {
match self.model.as_str() {
EMBEDDING_V3 => 8192,
_ => 2048,
}
}
/// Validates if the document list meets the model's constraints
///
/// # Validation Checks
/// 1. Number of documents doesn't exceed model's maximum capacity
/// 2. Each document's token count is within the model's token limit
///
/// # Returns
/// * `Ok(())` if validation passes
/// * `Err(EmbeddingError)` with appropriate error message if validation fails
fn validate_documents(&self, documents: &[String]) -> Result<(), EmbeddingError> {
const AVG_CHARS_PER_TOKEN: usize = 4;
if documents.len() > self.max_documents() {
return Err(EmbeddingError::ProviderError(format!(
"Model {} supports maximum {} documents",
self.model,
self.max_documents()
)));
}
for (i, doc) in documents.iter().enumerate() {
let estimated_tokens = doc.len() / AVG_CHARS_PER_TOKEN;
if estimated_tokens > self.max_tokens() {
return Err(EmbeddingError::ProviderError(format!(
"Document #{} exceeds maximum token limit of {}",
i + 1,
self.max_tokens()
)));
}
}
Ok(())
}
}
impl embeddings::EmbeddingModel for EmbeddingModel {
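// Generic upper bound for the embeddings trait; validate_documents above enforces
// the stricter per-model limits (10 documents for text-embedding-v3).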
const MAX_DOCUMENTS: usize = 25;
/// Returns the default embedding dimension for the current model
///
/// # Returns
/// * EMBEDDING_V1: 1536 dimensions
/// * EMBEDDING_V2: 1536 dimensions
/// * EMBEDDING_V3: 1024 dimensions (can be customized)
/// * Unknown models: 0 dimensions
fn ndims(&self) -> usize {
match self.model.as_str() {
EMBEDDING_V1 => 1536,
EMBEDDING_V2 => 1536,
// V3 model defaults to 1024 dimensions
// Can be customized to [128, 256, 384, 512, 768, 1024]
EMBEDDING_V3 => 1024,
_ => 0, // Default to 0 for unknown models
}
}
/// Generates embeddings for the provided text documents
///
/// # Arguments
/// * `documents` - Collection of text documents to embed
///
/// # Returns
/// * `Result<Vec<Embedding>, EmbeddingError>` - Vector of embeddings or error
#[cfg_attr(feature = "worker", worker::send)]
async fn embed_texts(
&self,
documents: impl IntoIterator<Item = String> + Send,
) -> Result<Vec<embeddings::Embedding>, EmbeddingError> {
let documents: Vec<String> = documents.into_iter().collect();
self.validate_documents(&documents)?;
let request = json!({
"model": self.model,
"input": documents,
"dimension": self.ndims.unwrap_or(self.ndims()),
"encoding_format": "float",
});
tracing::info!("{}", serde_json::to_string_pretty(&request).unwrap());
let response = self
.client
.post("compatible-mode/v1/embeddings")
.json(&request)
.send()
.await?
.error_for_status()?
.json::<ApiResponse<aliyun_api_types::EmbeddingResponse>>()
.await?;
match response {
ApiResponse::Ok(response) => {
let docs = documents
.into_iter()
.zip(response.data)
.map(|(document, embedding)| embeddings::Embedding {
document,
vec: embedding.embedding,
})
.collect();
Ok(docs)
}
ApiResponse::Err(err) => Err(EmbeddingError::ProviderError(err.message)),
}
}
}
// =================================================================
// Aliyun API Types
// =================================================================
/// Type definitions for Aliyun Embedding API responses
/// Follows OpenAI-compatible API structure
#[allow(dead_code)]
mod aliyun_api_types {
use serde::Deserialize;
/// Response structure for embedding requests
#[derive(Debug, Deserialize)]
pub struct EmbeddingResponse {
pub data: Vec<EmbeddingData>,
pub model: String,
pub object: String,
pub usage: Usage,
pub id: String,
}
/// Individual embedding data for a single input document
#[derive(Debug, Deserialize)]
pub struct EmbeddingData {
pub embedding: Vec<f64>,
pub index: usize,
pub object: String,
}
/// Token usage statistics for the embedding request
#[derive(Debug, Deserialize)]
pub struct Usage {
pub prompt_tokens: usize,
pub total_tokens: usize,
}
}
#[cfg(test)]
mod tests {
use super::*;
use crate::embeddings::embedding::EmbeddingModel as EmbeddingModelTrait;
#[tokio::test]
async fn test_embed_texts() {
let client = Client::from_env();
let model = EmbeddingModel::new(client, EMBEDDING_V1, None);
// Test embedding for a single document
let documents = vec!["Hello, world!".to_string()];
let embeddings = model.embed_texts(documents).await.unwrap();
assert_eq!(embeddings.len(), 1);
assert_eq!(embeddings[0].vec.len(), 1536);
// Test embedding for multiple documents
let documents = vec!["Hello, world!".to_string(), "This is a test".to_string()];
let embeddings = model.embed_texts(documents).await.unwrap();
assert_eq!(embeddings.len(), 2);
assert_eq!(embeddings[0].vec.len(), 1536);
assert_eq!(embeddings[0].document, "Hello, world!");
assert_eq!(embeddings[1].vec.len(), 1536);
assert_eq!(embeddings[1].document, "This is a test");
}
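// Hedged sketch added for illustration (not part of the original commit): exercises
// the per-model document-count guard directly, with no network I/O, so it does not
// need a valid DASHSCOPE_API_KEY.
#[test]
fn test_validate_documents_limit() {
    let client = Client::new("dummy-api-key");
    let model = EmbeddingModel::new(client, EMBEDDING_V3, None);
    // EMBEDDING_V3 accepts at most 10 documents per request.
    let ok_docs: Vec<String> = (0..10).map(|i| format!("doc {}", i)).collect();
    assert!(model.validate_documents(&ok_docs).is_ok());
    let too_many: Vec<String> = (0..11).map(|i| format!("doc {}", i)).collect();
    assert!(model.validate_documents(&too_many).is_err());
}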
}

View File

@@ -0,0 +1,4 @@
pub mod client;
pub mod embedding;
pub use client::Client;

View File

@@ -62,3 +62,4 @@ pub mod openrouter;
pub mod perplexity;
pub mod together;
pub mod xai;
pub mod aliyun;