Skip to content

Commit

Permalink
Feature/claude (#101)
Browse files Browse the repository at this point in the history
* feat: Add Claude LLM

* chore(logs): logs

* chore(refactor): visibility of modules

* chore: update Claude client and models to include default implementation and new functions

* chore: adding models, and change model on api call

* feat: add error handling and payload customization for anthropic

This commit includes enhancements to the Claude API client. Error handling for different server responses has been added using the `AnthropicError` enum added to `error.rs`. The `client.rs` file has been extensively refactored to support this enhanced error handling and also offers better payload customization options. Default values for `temperature`, `top_p`, and `top_k` are now being set from the options. Tests have also been updated to reflect changes.

Additionally, a first-class error handling module `error.rs` has been created for handling different types of errors. This module contains the `AnthropicError` enum for representing various types of errors that could occur when communicating with the Anthropic API. The `mod.rs` has been updated to include this new error module.

The models have been updated in `models.rs` to support additional optional parameters in the payload like `stop_sequences`, `temperature`, `top_p`, and `top_k`.

* chore: ignoring examples

* fix: fixing typo Cloude to Claude

* feat: improve content-type header and simplify check for streaming function in client.rs

This commit updates the content-type header to specify utf-8 charset. It also simplifies the way we check if a streaming function is present in the client's options.
  • Loading branch information
Abraxas-365 authored Apr 2, 2024
1 parent a105b6e commit a619431
Show file tree
Hide file tree
Showing 8 changed files with 398 additions and 2 deletions.
2 changes: 1 addition & 1 deletion Cargo.toml
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,7 @@ scraper = "0.19"
serde = { version = "1.0", features = ["derive"] }
async-trait = "0.1.79"
tokio = { version = "1", features = ["full"] }
reqwest = { version = "0.12", features = ["json"] }
reqwest = { version = "0.12", features = ["json","stream"] }
serde_json = "1.0"
futures ="0.3"
regex = "1.10.4"
Expand Down
5 changes: 5 additions & 0 deletions src/language_models/error.rs
Original file line number Diff line number Diff line change
Expand Up @@ -4,11 +4,16 @@ use serde_json::Error as SerdeJsonError;
use thiserror::Error;
use tokio::time::error::Elapsed;

use crate::llm::AnthropicError;

#[derive(Error, Debug)]
pub enum LLMError {
#[error("OpenAI error: {0}")]
OpenAIError(#[from] OpenAIError),

#[error("Anthropic error: {0}")]
AnthropicError(#[from] AnthropicError),

#[error("Network request failed: {0}")]
RequestError(#[from] ReqwestError),

Expand Down
6 changes: 5 additions & 1 deletion src/language_models/llm.rs
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,11 @@ use super::{options::CallOptions, GenerateResult, LLMError};
#[async_trait]
pub trait LLM: Sync + Send {
async fn generate(&self, messages: &[Message]) -> Result<GenerateResult, LLMError>;
async fn invoke(&self, prompt: &str) -> Result<String, LLMError>;
async fn invoke(&self, prompt: &str) -> Result<String, LLMError> {
self.generate(&[Message::new_human_message(prompt)])
.await
.map(|res| res.generation)
}
async fn stream(
&self,
_messages: &[Message],
Expand Down
282 changes: 282 additions & 0 deletions src/llm/claude/client.rs
Original file line number Diff line number Diff line change
@@ -0,0 +1,282 @@
use std::{collections::HashMap, fmt, pin::Pin};

use async_trait::async_trait;
use futures::{Stream, StreamExt};
use reqwest::Client;
use serde_json::Value;

use crate::{
    language_models::{llm::LLM, options::CallOptions, GenerateResult, LLMError, TokenUsage},
    llm::AnthropicError,
    schemas::{Message, StreamData},
};

use super::models::{ApiResponse, ClaudeMessage, Payload};

/// The Claude 3 model family available through the Anthropic Messages API.
pub enum ClaudeModel {
    // NOTE(review): "pus" looks like a typo for "Opus"; the variant name is
    // kept as-is for backward compatibility with existing callers.
    Claude3pus20240229,
    Claude3sonnet20240229,
    Claude3haiku20240307,
}

impl fmt::Display for ClaudeModel {
    /// Render the model as the identifier string the Anthropic API expects.
    ///
    /// Implementing `Display` (instead of `ToString` directly) is the
    /// idiomatic choice: the standard blanket impl still provides
    /// `to_string()` for all existing callers.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        let name = match self {
            ClaudeModel::Claude3pus20240229 => "claude-3-opus-20240229",
            ClaudeModel::Claude3sonnet20240229 => "claude-3-sonnet-20240229",
            ClaudeModel::Claude3haiku20240307 => "claude-3-haiku-20240307",
        };
        f.write_str(name)
    }
}

/// Client for the Anthropic (Claude) Messages API.
pub struct Claude {
    // Model identifier sent in the request payload,
    // e.g. "claude-3-opus-20240229".
    model: String,
    // Generation parameters (max_tokens, temperature, stop words,
    // optional streaming callback, ...).
    options: CallOptions,
    // API key sent via the `x-api-key` header.
    api_key: String,
    // Value sent via the `anthropic-version` header.
    anthropic_version: String,
}

impl Default for Claude {
    /// Equivalent to [`Claude::new`].
    fn default() -> Self {
        Self::new()
    }
}

impl Claude {
    /// Create a client with defaults: the Opus model, default call options,
    /// the API key read from the environment, and API version "2023-06-01".
    pub fn new() -> Self {
        Self {
            model: ClaudeModel::Claude3pus20240229.to_string(),
            options: CallOptions::default(),
            // Prefer the conventional `ANTHROPIC_API_KEY`, but fall back to
            // the legacy (typo'd) `CLOUDE_API_KEY` so existing setups keep
            // working.
            api_key: std::env::var("ANTHROPIC_API_KEY")
                .or_else(|_| std::env::var("CLOUDE_API_KEY"))
                .unwrap_or_default(),
            anthropic_version: "2023-06-01".to_string(),
        }
    }

    /// Builder-style setter for the model identifier.
    pub fn with_model<S: Into<String>>(mut self, model: S) -> Self {
        self.model = model.into();
        self
    }

    /// Builder-style setter replacing the call options wholesale.
    pub fn with_options(mut self, options: CallOptions) -> Self {
        self.options = options;
        self
    }

    /// Builder-style setter for the API key (overrides the environment).
    pub fn with_api_key<S: Into<String>>(mut self, api_key: S) -> Self {
        self.api_key = api_key.into();
        self
    }

    /// Builder-style setter for the `anthropic-version` header value.
    pub fn with_anthropic_version<S: Into<String>>(mut self, version: S) -> Self {
        self.anthropic_version = version.into();
        self
    }

    /// Perform a single (non-streaming) completion request against the
    /// Anthropic Messages API and convert the response into a
    /// `GenerateResult`.
    ///
    /// # Errors
    /// Returns a typed `AnthropicError` for the documented HTTP error
    /// statuses, or a `RequestError`/serde error for transport and decoding
    /// failures.
    async fn generate(&self, messages: &[Message]) -> Result<GenerateResult, LLMError> {
        let client = Client::new();
        let is_stream = self.options.streaming_func.is_some();

        let payload = self.build_payload(messages, is_stream);
        let res = client
            .post("https://api.anthropic.com/v1/messages")
            .header("x-api-key", &self.api_key)
            .header("anthropic-version", &self.anthropic_version)
            .header("content-type", "application/json; charset=utf-8")
            .json(&payload)
            .send()
            .await?;
        // Map the documented Anthropic error statuses onto typed errors;
        // any other status is assumed to carry a JSON `ApiResponse` body.
        let res = match res.status().as_u16() {
            400 => Err(LLMError::AnthropicError(
                AnthropicError::InvalidRequestError("Invalid Request".to_string()),
            )),
            401 => Err(LLMError::AnthropicError(
                AnthropicError::AuthenticationError("Invalid API Key".to_string()),
            )),
            403 => Err(LLMError::AnthropicError(AnthropicError::PermissionError(
                "Permission Denied".to_string(),
            ))),
            404 => Err(LLMError::AnthropicError(AnthropicError::NotFoundError(
                "Not Found".to_string(),
            ))),
            429 => Err(LLMError::AnthropicError(AnthropicError::RateLimitError(
                "Rate Limit Exceeded".to_string(),
            ))),
            500 => Err(LLMError::AnthropicError(AnthropicError::ApiError(
                "Internal Server Error".to_string(),
            ))),
            503 => Err(LLMError::AnthropicError(AnthropicError::OverloadedError(
                "Service Unavailable".to_string(),
            ))),
            _ => Ok(res.json::<ApiResponse>().await?),
        }?;

        // The answer text lives in the first content block (if any).
        let generation = res
            .content
            .first()
            .map(|c| c.text.clone())
            .unwrap_or_default();

        let tokens = Some(TokenUsage {
            prompt_tokens: res.usage.input_tokens,
            completion_tokens: res.usage.output_tokens,
            total_tokens: res.usage.input_tokens + res.usage.output_tokens,
        });

        Ok(GenerateResult { tokens, generation })
    }

    /// Assemble the request body from the configured model, messages, and
    /// call options. `max_tokens` defaults to 1024 when unset.
    fn build_payload(&self, messages: &[Message], stream: bool) -> Payload {
        Payload {
            model: self.model.clone(),
            messages: messages.iter().map(ClaudeMessage::from_message).collect(),
            max_tokens: self.options.max_tokens.unwrap_or(1024),
            // Anthropic expects the field absent (not `false`) when not
            // streaming.
            stream: stream.then_some(true),
            stop_sequences: self.options.stop_words.clone(),
            temperature: self.options.temperature,
            top_p: self.options.top_p,
            top_k: self.options.top_k,
        }
    }
}

#[async_trait]
impl LLM for Claude {
    /// Generate a completion. When a `streaming_func` is configured, the
    /// request is streamed and each delta's text is forwarded to the
    /// callback while being accumulated into the final generation;
    /// otherwise this delegates to the inherent (non-streaming) `generate`.
    async fn generate(&self, messages: &[Message]) -> Result<GenerateResult, LLMError> {
        match &self.options.streaming_func {
            Some(func) => {
                let mut complete_response = String::new();
                let mut stream = self.stream(messages).await?;
                while let Some(data) = stream.next().await {
                    match data {
                        Ok(value) => {
                            let mut func = func.lock().await;
                            complete_response.push_str(&value.content);
                            // Callback errors are deliberately ignored;
                            // streaming continues regardless.
                            let _ = func(value.content).await;
                        }
                        Err(e) => return Err(e),
                    }
                }
                let mut generate_result = GenerateResult::default();
                generate_result.generation = complete_response;
                // NOTE(review): token usage is not populated on the
                // streaming path; only `generation` is filled in.
                Ok(generate_result)
            }
            // No callback configured: the inherent method takes precedence
            // over this trait method, so this is not a recursive call.
            None => self.generate(messages).await,
        }
    }
    /// Open a server-sent-events stream against the Messages API and map
    /// each chunk to a `StreamData`.
    ///
    /// Only `content_block_delta` events carry text; all other event types
    /// pass through with empty content.
    async fn stream(
        &self,
        messages: &[Message],
    ) -> Result<Pin<Box<dyn Stream<Item = Result<StreamData, LLMError>> + Send>>, LLMError> {
        let client = Client::new();
        let payload = self.build_payload(messages, true);
        let request = client
            .post("https://api.anthropic.com/v1/messages")
            .header("x-api-key", &self.api_key)
            .header("anthropic-version", &self.anthropic_version)
            .header("content-type", "application/json; charset=utf-8")
            .json(&payload)
            .build()?;

        // Instead of sending the request directly, return a stream wrapper
        let stream = client.execute(request).await?.bytes_stream();

        // Process each chunk as it arrives.
        // NOTE(review): this assumes each network chunk contains a complete
        // SSE event; an event split across chunk boundaries would fail to
        // parse — TODO confirm, or buffer across chunks.
        let processed_stream = stream.then(move |result| {
            async move {
                match result {
                    Ok(bytes) => {
                        let value: Value = parse_sse_to_json(&String::from_utf8_lossy(&bytes))?;
                        if value["type"].as_str().unwrap_or("") == "content_block_delta" {
                            let content = value["delta"]["text"].clone();
                            // Return StreamData based on the parsed content
                            Ok(StreamData::new(value, content.as_str().unwrap_or("")))
                        } else {
                            Ok(StreamData::new(value, ""))
                        }
                    }
                    Err(e) => Err(LLMError::RequestError(e)),
                }
            }
        });

        Ok(Box::pin(processed_stream))
    }

    /// Merge additional call options into the client's existing options.
    fn add_options(&mut self, options: CallOptions) {
        self.options.merge_options(options)
    }
}

/// Extract the JSON payload from one server-sent-events chunk.
///
/// A chunk that is itself valid JSON (no SSE framing) is treated as an
/// error payload from the API. Otherwise the `data:` field of the event is
/// parsed; a `"type": "error"` payload is converted into a typed error.
fn parse_sse_to_json(sse_data: &str) -> Result<Value, LLMError> {
    if let Ok(json) = serde_json::from_str::<Value>(sse_data) {
        return parse_error(&json);
    }

    // Scan the event for its `data:` field; if it appears more than once,
    // the last occurrence wins.
    let mut data_field: Option<String> = None;
    for line in sse_data.trim().split('\n') {
        if let Some((key, value)) = line.split_once(": ") {
            if key == "data" {
                data_field = Some(value.to_string());
            }
        }
    }

    match data_field {
        Some(raw) => {
            let data: Value = serde_json::from_str(&raw)?;
            if data["type"].as_str() == Some("error") {
                parse_error(&data)
            } else {
                Ok(data)
            }
        }
        None => {
            log::error!("No data field in the SSE event");
            Err(LLMError::ContentNotFound("data".to_string()))
        }
    }
}

/// Translate an Anthropic error payload
/// (`{"error": {"type": ..., "message": ...}}`) into a typed `LLMError`.
///
/// Always returns `Err`; the `Result<Value, _>` signature only exists so
/// callers can use it in tail position of value-returning functions.
fn parse_error(json: &Value) -> Result<Value, LLMError> {
    let error_type = json["error"]["type"].as_str().unwrap_or("");
    let message = json["error"]["message"].as_str().unwrap_or("").to_string();
    match error_type {
        "invalid_request_error" => Err(AnthropicError::InvalidRequestError(message))?,
        "authentication_error" => Err(AnthropicError::AuthenticationError(message))?,
        "permission_error" => Err(AnthropicError::PermissionError(message))?,
        "not_found_error" => Err(AnthropicError::NotFoundError(message))?,
        "rate_limit_error" => Err(AnthropicError::RateLimitError(message))?,
        "api_error" => Err(AnthropicError::ApiError(message))?,
        "overloaded_error" => Err(AnthropicError::OverloadedError(message))?,
        // Preserve the unknown type and message instead of discarding them,
        // so unexpected API errors remain diagnosable.
        _ => Err(LLMError::OtherError(format!(
            "Unknown error ({error_type}): {message}"
        ))),
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use tokio::test;

    // These tests hit the live Anthropic API and need a real key, so they
    // are ignored by default; run with `cargo test -- --ignored`.

    #[test]
    #[ignore]
    async fn test_claude_generate() {
        let client = Claude::new();

        let res = client
            .generate(&[Message::new_human_message("Hi, how are you doing")])
            .await
            .unwrap();

        println!("{:?}", res)
    }

    #[test]
    #[ignore]
    async fn test_claude_stream() {
        let client = Claude::new();
        let mut stream = client
            .stream(&[Message::new_human_message("Hi, how are you doing")])
            .await
            .unwrap();
        // Drain the stream, printing each chunk as it arrives.
        while let Some(data) = stream.next().await {
            match data {
                Ok(value) => value.to_stdout().unwrap(),
                Err(e) => panic!("Error invoking LLMChain: {:?}", e),
            }
        }
    }
}
25 changes: 25 additions & 0 deletions src/llm/claude/error.rs
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
use thiserror::Error;

/// Errors returned by the Anthropic API, one variant per documented error
/// type / HTTP status.
#[derive(Error, Debug)]
pub enum AnthropicError {
    /// The request body or parameters were malformed.
    #[error("Anthropic API error: Invalid request - {0}")]
    InvalidRequestError(String),

    /// The API key was missing or invalid.
    #[error("Anthropic API error: Authentication failed - {0}")]
    AuthenticationError(String),

    /// The key is valid but lacks permission for this resource.
    #[error("Anthropic API error: Permission denied - {0}")]
    PermissionError(String),

    /// The requested resource (e.g. model) does not exist.
    #[error("Anthropic API error: Not found - {0}")]
    NotFoundError(String),

    /// Too many requests; back off and retry.
    #[error("Anthropic API error: Rate limit exceeded - {0}")]
    RateLimitError(String),

    /// An unexpected error on Anthropic's side.
    #[error("Anthropic API error: Internal error - {0}")]
    ApiError(String),

    /// The API is temporarily overloaded.
    #[error("Anthropic API error: Overloaded - {0}")]
    OverloadedError(String),
}
7 changes: 7 additions & 0 deletions src/llm/claude/mod.rs
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
// Request/response data types; kept private to the claude module.
mod models;

// HTTP client and LLM trait implementation.
mod client;
pub use client::*;

// Anthropic API error types.
mod error;
pub use error::*;
Loading

0 comments on commit a619431

Please sign in to comment.