220 lines
6.9 KiB
Rust
220 lines
6.9 KiB
Rust
use crate::error::{Error as GeminiError, Result as GeminiResult};
|
|
use crate::network::event_source::{EventSource, ServerSentEvent};
|
|
use crate::prelude::*;
|
|
|
|
use tokio_stream::{Stream, StreamExt};
|
|
use tokio_util::codec::LinesCodecError;
|
|
use tracing::error;
|
|
|
|
pub static AUTH_SCOPE: &[&str] = &["https://www.googleapis.com/auth/cloud-platform"];
|
|
|
|
#[derive(Clone, Debug)]
|
|
pub struct GeminiClient {
|
|
client: reqwest::Client,
|
|
api_key: String,
|
|
}
|
|
|
|
unsafe impl Send for GeminiClient {}
|
|
unsafe impl Sync for GeminiClient {}
|
|
|
|
impl GeminiClient {
|
|
pub fn new(api_key: String) -> Self {
|
|
GeminiClient {
|
|
client: reqwest::Client::new(),
|
|
api_key,
|
|
}
|
|
}
|
|
|
|
pub async fn stream_generate_content(
|
|
&self,
|
|
request: &GenerateContentRequest,
|
|
model: &str,
|
|
) -> GeminiResult<impl Stream<Item = GeminiResult<GenerateContentResponseResult>>> {
|
|
let endpoint_url = format!(
|
|
"https://generativelanguage.googleapis.com/v1beta/models/{model}:streamGenerateContent?alt=sse"
|
|
);
|
|
let client = self.client.clone();
|
|
let request = request.clone();
|
|
Ok(client
|
|
.post(&endpoint_url)
|
|
.header("x-goog-api-key", &self.api_key)
|
|
.json(&request)
|
|
.send()
|
|
.await?
|
|
.event_stream()
|
|
.filter_map(Self::parse_event))
|
|
}
|
|
|
|
fn parse_event(
|
|
event_result: std::result::Result<ServerSentEvent, LinesCodecError>,
|
|
) -> Option<GeminiResult<GenerateContentResponseResult>> {
|
|
let data = event_result.map_err(Into::<GeminiError>::into).ok()?.data?;
|
|
|
|
Some(
|
|
serde_json::from_str::<GenerateContentResponse>(&data)
|
|
.map_err(Into::into)
|
|
.and_then(|resp| resp.into_result()),
|
|
)
|
|
}
|
|
|
|
pub async fn generate_content(
|
|
&self,
|
|
request: &GenerateContentRequest,
|
|
model: &str,
|
|
) -> GeminiResult<GenerateContentResponseResult> {
|
|
let endpoint_url: String = format!(
|
|
"https://generativelanguage.googleapis.com/v1beta/models/{model}:generateContent",
|
|
);
|
|
let resp = self
|
|
.client
|
|
.post(&endpoint_url)
|
|
.header("x-goog-api-key", &self.api_key)
|
|
.json(&request)
|
|
.send()
|
|
.await?;
|
|
|
|
let status = resp.status();
|
|
let txt_json = resp.text().await?;
|
|
tracing::debug!("generate_content response: {:?}", txt_json);
|
|
|
|
if !status.is_success() {
|
|
if let Ok(gemini_error) =
|
|
serde_json::from_str::<crate::types::GeminiApiError>(&txt_json)
|
|
{
|
|
return Err(GeminiError::GeminiError(gemini_error));
|
|
}
|
|
// Fallback if parsing fails, though it should ideally match GeminiApiError
|
|
return Err(GeminiError::GenericApiError {
|
|
status: status.as_u16(),
|
|
body: txt_json,
|
|
});
|
|
}
|
|
|
|
match serde_json::from_str::<GenerateContentResponse>(&txt_json) {
|
|
Ok(response) => Ok(response.into_result()?),
|
|
Err(e) => {
|
|
tracing::error!("Failed to parse response: {} with error {}", txt_json, e);
|
|
Err(e.into())
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Prompts a conversation to the model.
|
|
pub async fn prompt_conversation(
|
|
&self,
|
|
messages: &[Message],
|
|
model: &str,
|
|
) -> GeminiResult<Message> {
|
|
let request = GenerateContentRequest {
|
|
contents: messages
|
|
.iter()
|
|
.map(|m| Content {
|
|
role: Some(m.role),
|
|
parts: Some(vec![Part::from_text(m.text.clone())]),
|
|
})
|
|
.collect(),
|
|
generation_config: None,
|
|
tools: None,
|
|
system_instruction: None,
|
|
safety_settings: None,
|
|
};
|
|
|
|
let response = self.generate_content(&request, model).await?;
|
|
|
|
// Check for errors in the response.
|
|
let mut candidates = GeminiClient::collect_text_from_response(&response);
|
|
|
|
match candidates.pop() {
|
|
Some(text) => Ok(Message::new(Role::Model, &text)),
|
|
None => Err(GeminiError::NoCandidatesError),
|
|
}
|
|
}
|
|
|
|
fn collect_text_from_response(response: &GenerateContentResponseResult) -> Vec<String> {
|
|
response
|
|
.candidates
|
|
.iter()
|
|
.filter_map(Candidate::get_text)
|
|
.collect::<Vec<String>>()
|
|
}
|
|
|
|
pub async fn text_embeddings(
|
|
&self,
|
|
request: &TextEmbeddingRequest,
|
|
model: &str,
|
|
) -> GeminiResult<TextEmbeddingResponse> {
|
|
let endpoint_url =
|
|
format!("https://generativelanguage.googleapis.com/v1beta/models/{model}:predict");
|
|
let resp = self
|
|
.client
|
|
.post(&endpoint_url)
|
|
.header("x-goog-api-key", &self.api_key)
|
|
.json(&request)
|
|
.send()
|
|
.await?;
|
|
let txt_json = resp.text().await?;
|
|
tracing::debug!("text_embeddings response: {:?}", txt_json);
|
|
Ok(serde_json::from_str::<TextEmbeddingResponse>(&txt_json)?)
|
|
}
|
|
|
|
pub async fn count_tokens(
|
|
&self,
|
|
request: &CountTokensRequest,
|
|
model: &str,
|
|
) -> GeminiResult<CountTokensResponse> {
|
|
let endpoint_url =
|
|
format!("https://generativelanguage.googleapis.com/v1beta/models/{model}:countTokens");
|
|
let resp = self
|
|
.client
|
|
.post(&endpoint_url)
|
|
.header("x-goog-api-key", &self.api_key)
|
|
.json(&request)
|
|
.send()
|
|
.await?;
|
|
|
|
let txt_json = resp.text().await?;
|
|
tracing::debug!("count_tokens response: {:?}", txt_json);
|
|
Ok(serde_json::from_str(&txt_json)?)
|
|
}
|
|
|
|
pub async fn predict_image(
|
|
&self,
|
|
request: &PredictImageRequest,
|
|
model: &str,
|
|
) -> GeminiResult<PredictImageResponse> {
|
|
let endpoint_url =
|
|
format!("https://generativelanguage.googleapis.com/v1beta/models/{model}:predict");
|
|
|
|
let resp = self
|
|
.client
|
|
.post(&endpoint_url)
|
|
.header("x-goog-api-key", &self.api_key)
|
|
.json(&request)
|
|
.send()
|
|
.await?;
|
|
|
|
let status = resp.status();
|
|
let txt_json = resp.text().await?;
|
|
|
|
if !status.is_success() {
|
|
if let Ok(gemini_error) =
|
|
serde_json::from_str::<crate::types::GeminiApiError>(&txt_json)
|
|
{
|
|
return Err(GeminiError::GeminiError(gemini_error));
|
|
}
|
|
return Err(GeminiError::GenericApiError {
|
|
status: status.as_u16(),
|
|
body: txt_json,
|
|
});
|
|
}
|
|
|
|
match serde_json::from_str::<PredictImageResponse>(&txt_json) {
|
|
Ok(response) => Ok(response),
|
|
Err(e) => {
|
|
error!(response = txt_json, error = ?e, "Failed to parse response");
|
|
Err(e.into())
|
|
}
|
|
}
|
|
}
|
|
}
|