2026-02-04 01:02:18 +00:00
|
|
|
//! LLM integration using stratum-llm
|
2026-01-08 21:32:59 +00:00
|
|
|
|
2026-02-04 01:02:18 +00:00
|
|
|
use stratum_llm::{
|
|
|
|
|
AnthropicProvider, ConfiguredProvider, CredentialSource, GenerationOptions, Message,
|
|
|
|
|
ProviderChain, Role, UnifiedClient,
|
|
|
|
|
};
|
2026-01-08 21:32:59 +00:00
|
|
|
use tracing::info;
|
|
|
|
|
|
|
|
|
|
use crate::error::Result;
|
|
|
|
|
|
|
|
|
|
pub struct LlmClient {
|
2026-02-04 01:02:18 +00:00
|
|
|
client: UnifiedClient,
|
2026-01-08 21:32:59 +00:00
|
|
|
pub model: String,
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
impl LlmClient {
|
|
|
|
|
pub fn new(model: String) -> Result<Self> {
|
2026-02-04 01:02:18 +00:00
|
|
|
let api_key = std::env::var("ANTHROPIC_API_KEY").ok();
|
2026-01-08 21:32:59 +00:00
|
|
|
|
2026-02-04 01:02:18 +00:00
|
|
|
if api_key.is_none() {
|
|
|
|
|
tracing::warn!("ANTHROPIC_API_KEY not set - LLM calls will fail");
|
2026-01-08 21:32:59 +00:00
|
|
|
}
|
|
|
|
|
|
2026-02-04 01:02:18 +00:00
|
|
|
let provider =
|
|
|
|
|
AnthropicProvider::new(api_key.unwrap_or_default(), model.clone());
|
|
|
|
|
|
|
|
|
|
let configured = ConfiguredProvider {
|
|
|
|
|
provider: Box::new(provider),
|
|
|
|
|
credential_source: CredentialSource::EnvVar {
|
|
|
|
|
name: "ANTHROPIC_API_KEY".to_string(),
|
|
|
|
|
},
|
|
|
|
|
priority: 0,
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
let chain = ProviderChain::with_providers(vec![configured]);
|
|
|
|
|
|
|
|
|
|
let client = UnifiedClient::builder()
|
|
|
|
|
.with_chain(chain)
|
|
|
|
|
.build()
|
|
|
|
|
.map_err(|e| {
|
|
|
|
|
crate::error::RagError::LlmError(format!("Failed to build LLM client: {}", e))
|
|
|
|
|
})?;
|
|
|
|
|
|
|
|
|
|
info!("Initialized stratum-llm client: {}", model);
|
|
|
|
|
|
|
|
|
|
Ok(Self { client, model })
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
pub async fn generate_answer(&self, query: &str, context: &str) -> Result<String> {
|
2026-01-08 21:32:59 +00:00
|
|
|
let system_prompt = format!(
|
|
|
|
|
r#"You are a helpful assistant answering questions about a provisioning platform.
|
|
|
|
|
You have been provided with relevant documentation context below.
|
|
|
|
|
Answer the user's question based on this context.
|
|
|
|
|
Be concise and accurate.
|
|
|
|
|
|
|
|
|
|
# Retrieved Context
|
|
|
|
|
{}
|
|
|
|
|
"#,
|
|
|
|
|
context
|
|
|
|
|
);
|
|
|
|
|
|
2026-02-04 01:02:18 +00:00
|
|
|
let messages = vec![
|
|
|
|
|
Message {
|
|
|
|
|
role: Role::System,
|
|
|
|
|
content: system_prompt,
|
|
|
|
|
},
|
|
|
|
|
Message {
|
|
|
|
|
role: Role::User,
|
|
|
|
|
content: query.to_string(),
|
|
|
|
|
},
|
|
|
|
|
];
|
|
|
|
|
|
|
|
|
|
let options = GenerationOptions {
|
|
|
|
|
max_tokens: Some(1024),
|
|
|
|
|
..Default::default()
|
|
|
|
|
};
|
2026-01-08 21:32:59 +00:00
|
|
|
|
2026-02-04 01:02:18 +00:00
|
|
|
let response = self
|
|
|
|
|
.client
|
|
|
|
|
.generate(&messages, Some(&options))
|
2026-01-08 21:32:59 +00:00
|
|
|
.await
|
|
|
|
|
.map_err(|e| {
|
2026-02-04 01:02:18 +00:00
|
|
|
crate::error::RagError::LlmError(format!("LLM generation failed: {}", e))
|
2026-01-08 21:32:59 +00:00
|
|
|
})?;
|
|
|
|
|
|
2026-02-04 01:02:18 +00:00
|
|
|
info!("Generated answer: {} characters", response.content.len());
|
|
|
|
|
Ok(response.content)
|
2026-01-08 21:32:59 +00:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[cfg(test)]
mod tests {
    use super::*;

    // Construction must succeed even without ANTHROPIC_API_KEY set; a
    // missing key only affects generation calls, not client creation.
    #[test]
    fn test_llm_client_creation() {
        let client = LlmClient::new("claude-opus-4".to_string());
        assert!(client.is_ok());
    }

    // The model string handed to `new` is stored verbatim on the client.
    #[test]
    fn test_llm_client_model() {
        let client = LlmClient::new("claude-sonnet-4".to_string());
        assert!(client.is_ok());
        assert_eq!(client.unwrap().model, "claude-sonnet-4");
    }
}