server/src/llm/providers/ollama.rs

use crate::llm::types::{
    CompletionResponse, FunctionCall, Message, ModelProvider, Role, ToolCall, ToolDefinition,
};
use async_trait::async_trait;
use futures::StreamExt;
use serde::{Deserialize, Serialize};
use serde_json::Value;

/// Client for the HTTP API of an Ollama server.
#[derive(Debug, Clone)]
pub struct OllamaProvider {
    /// Root URL of the server. A trailing `/` is tolerated: it is stripped when
    /// request URLs are built.
    base_url: String,
}

impl OllamaProvider {
    pub fn new(base_url: String) -> Self {
        Self { base_url }
    }

    pub async fn get_models(base_url: &str) -> Result<Vec<String>, String> {
        let client = reqwest::Client::new();
        let url = format!("{}/api/tags", base_url.trim_end_matches('/'));

        let res = client
            .get(&url)
            .send()
            .await
            .map_err(|e| format!("Request failed: {}", e))?;

        if !res.status().is_success() {
            let status = res.status();
            let text = res.text().await.unwrap_or_default();
            return Err(format!("Ollama API error {}: {}", status, text));
        }

        let body: OllamaTagsResponse = res
            .json()
            .await
            .map_err(|e| format!("Failed to parse response: {}", e))?;

        Ok(body.models.into_iter().map(|m| m.name).collect())
    }

    /// Streaming chat that calls `on_token` for each token chunk.
    pub async fn chat_stream<F>(
        &self,
        model: &str,
        messages: &[Message],
        tools: &[ToolDefinition],
        cancel_rx: &mut tokio::sync::watch::Receiver<bool>,
        mut on_token: F,
    ) -> Result<CompletionResponse, String>
    where
        F: FnMut(&str) + Send,
    {
        let client = reqwest::Client::new();
        let url = format!("{}/api/chat", self.base_url.trim_end_matches('/'));

        let ollama_messages: Vec<OllamaRequestMessage> = messages
            .iter()
            .map(|m| {
                let tool_calls = m.tool_calls.as_ref().map(|calls| {
                    calls
                        .iter()
                        .map(|tc| {
                            let args_val: Value = serde_json::from_str(&tc.function.arguments)
                                .unwrap_or(Value::String(tc.function.arguments.clone()));

                            OllamaRequestToolCall {
                                kind: tc.kind.clone(),
                                function: OllamaRequestFunctionCall {
                                    name: tc.function.name.clone(),
                                    arguments: args_val,
                                },
                            }
                        })
                        .collect()
                });

                OllamaRequestMessage {
                    role: m.role.clone(),
                    content: m.content.clone(),
                    tool_calls,
                    tool_call_id: m.tool_call_id.clone(),
                }
            })
            .collect();

        let request_body = OllamaRequest {
            model,
            messages: ollama_messages,
            stream: true,
            tools,
        };

        let res = client
            .post(&url)
            .json(&request_body)
            .send()
            .await
            .map_err(|e| format!("Request failed: {}", e))?;

        if !res.status().is_success() {
            let status = res.status();
            let text = res.text().await.unwrap_or_default();
            return Err(format!("Ollama API error {}: {}", status, text));
        }

        let mut stream = res.bytes_stream();
        let mut buffer = String::new();
        let mut accumulated_content = String::new();
        let mut final_tool_calls: Option<Vec<ToolCall>> = None;

        loop {
            if *cancel_rx.borrow() {
                return Err("Chat cancelled by user".to_string());
            }

            let chunk_result = tokio::select! {
                chunk = stream.next() => {
                    match chunk {
                        Some(c) => c,
                        None => break,
                    }
                }
                _ = cancel_rx.changed() => {
                    if *cancel_rx.borrow() {
                        return Err("Chat cancelled by user".to_string());
                    } else {
                        continue;
                    }
                }
            };

            let chunk = chunk_result.map_err(|e| format!("Stream error: {}", e))?;
            buffer.push_str(&String::from_utf8_lossy(&chunk));

            while let Some(newline_pos) = buffer.find('\n') {
                let line = buffer[..newline_pos].trim().to_string();
                buffer = buffer[newline_pos + 1..].to_string();

                if line.is_empty() {
                    continue;
                }

                let stream_msg: OllamaStreamResponse =
                    serde_json::from_str(&line).map_err(|e| format!("JSON parse error: {}", e))?;

                if !stream_msg.message.content.is_empty() {
                    accumulated_content.push_str(&stream_msg.message.content);
                    on_token(&stream_msg.message.content);
                }

                if let Some(tool_calls) = stream_msg.message.tool_calls {
                    final_tool_calls = Some(
                        tool_calls
                            .into_iter()
                            .map(|tc| ToolCall {
                                id: None,
                                kind: "function".to_string(),
                                function: FunctionCall {
                                    name: tc.function.name,
                                    arguments: tc.function.arguments.to_string(),
                                },
                            })
                            .collect(),
                    );
                }

                if stream_msg.done {
                    break;
                }
            }
        }

        Ok(CompletionResponse {
            content: if accumulated_content.is_empty() {
                None
            } else {
                Some(accumulated_content)
            },
            tool_calls: final_tool_calls,
            session_id: None,
        })
    }
}

/// Response body of `GET /api/tags`, as deserialized by `OllamaProvider::get_models`.
#[derive(Deserialize)]
struct OllamaTagsResponse {
    /// Entries reported by the server; `get_models` returns the `name` of each one.
    models: Vec<OllamaModelTag>,
}

/// One entry of `OllamaTagsResponse::models`.
#[derive(Deserialize)]
struct OllamaModelTag {
    /// Model name handed back to callers of `OllamaProvider::get_models`.
    name: String,
}

/// JSON body that `OllamaProvider::chat_stream` posts to `/api/chat`.
#[derive(Serialize)]
struct OllamaRequest<'a> {
    /// Name of the model to run.
    model: &'a str,
    /// Conversation messages, already converted to the request shape.
    messages: Vec<OllamaRequestMessage>,
    /// Streaming flag; `chat_stream` always sets it to `true`.
    stream: bool,
    /// Tool definitions; the field is left out of the JSON when the slice is empty.
    #[serde(skip_serializing_if = "is_empty_tools")]
    tools: &'a [ToolDefinition],
}

/// `skip_serializing_if` predicate for `OllamaRequest::tools`.
///
/// Serde hands the predicate a reference to the field, hence the double
/// reference. Returns `true` when the slice holds no tool definitions.
fn is_empty_tools(tools: &&[ToolDefinition]) -> bool {
    tools.first().is_none()
}

/// One conversation message inside `OllamaRequest::messages`.
#[derive(Serialize)]
struct OllamaRequestMessage {
    /// Role of the message author, copied from the source `Message`.
    role: Role,
    /// Text content of the message.
    content: String,
    /// Tool calls attached to the message; omitted from the JSON when `None`.
    #[serde(skip_serializing_if = "Option::is_none")]
    tool_calls: Option<Vec<OllamaRequestToolCall>>,
    /// Tool-call id copied from the source `Message`; omitted from the JSON when `None`.
    #[serde(skip_serializing_if = "Option::is_none")]
    tool_call_id: Option<String>,
}

/// A tool call echoed back to the server as part of a request message.
#[derive(Serialize)]
struct OllamaRequestToolCall {
    /// Function name and arguments of the call.
    function: OllamaRequestFunctionCall,
    /// Call kind; serialized under the JSON key `type`.
    #[serde(rename = "type")]
    kind: String,
}

/// Function part of an `OllamaRequestToolCall`.
#[derive(Serialize)]
struct OllamaRequestFunctionCall {
    /// Name of the function that was called.
    name: String,
    /// Call arguments as a JSON value. `chat_stream` parses the stored argument
    /// string and falls back to a JSON string when it is not valid JSON.
    arguments: Value,
}

/// One newline-delimited JSON object of the streamed `/api/chat` response.
///
/// Both fields are required: a line missing either one fails to deserialize.
#[derive(Deserialize)]
struct OllamaStreamResponse {
    /// Content and tool calls carried by this line.
    message: OllamaStreamMessage,
    /// Completion flag; `chat_stream` breaks out of its line-processing loop when
    /// this is `true`.
    done: bool,
}

/// The `message` object of an `OllamaStreamResponse`.
#[derive(Deserialize)]
struct OllamaStreamMessage {
    /// Text carried by this line; an absent field deserializes to an empty string.
    #[serde(default)]
    content: String,
    /// Tool calls carried by this line; an absent field deserializes to `None`.
    #[serde(default)]
    tool_calls: Option<Vec<OllamaResponseToolCall>>,
}

/// A tool call received in a streamed message. Only `function` is read here.
#[derive(Deserialize)]
struct OllamaResponseToolCall {
    /// Function name and arguments of the call.
    function: OllamaResponseFunctionCall,
}

/// Function part of an `OllamaResponseToolCall`.
#[derive(Deserialize)]
struct OllamaResponseFunctionCall {
    /// Name of the function the model wants to call.
    name: String,
    /// Arguments kept as raw JSON; `chat_stream` stores them as a string via
    /// `to_string()`.
    arguments: Value,
}

#[async_trait]
impl ModelProvider for OllamaProvider {
    /// Non-streaming chat entry point required by `ModelProvider`.
    ///
    /// This provider only offers the streaming `chat_stream` path, so the method
    /// ignores all of its arguments and always fails.
    ///
    /// # Errors
    ///
    /// Always returns `"Non-streaming Ollama chat not implemented for server"`.
    async fn chat(
        &self,
        _model: &str,
        _messages: &[Message],
        _tools: &[ToolDefinition],
    ) -> Result<CompletionResponse, String> {
        let reason = "Non-streaming Ollama chat not implemented for server";
        Err(String::from(reason))
    }
}
feat: agent brain (ollama) and chat ui 2025-12-24 17:17:35 +00:00			`use crate::llm::types::{`
			`CompletionResponse, FunctionCall, Message, ModelProvider, Role, ToolCall, ToolDefinition,`
			`};`
fix: make llm provider async and add tool toggle 2025-12-24 17:32:46 +00:00			`use async_trait::async_trait;`
Story 18: Token-by-token streaming responses - Backend: Added OllamaProvider::chat_stream() with newline-delimited JSON parsing - Backend: Emit chat:token events for each token received from Ollama - Backend: Added futures dependency and stream feature for reqwest - Frontend: Added streamingContent state and chat:token event listener - Frontend: Real-time token display with auto-scroll - Frontend: Markdown and syntax highlighting support for streaming content - Fixed all TypeScript errors (tsc --noEmit) - Fixed all Biome warnings and errors - Fixed all Clippy warnings - Added comprehensive code quality documentation - Added tsc --noEmit to verification checklist Tested and verified: - Tokens stream in real-time - Auto-scroll works during streaming - Tool calls interrupt streaming correctly - Multi-turn conversations work - Smooth performance with no lag 2025-12-27 16:50:18 +00:00			`use futures::StreamExt;`
feat: agent brain (ollama) and chat ui 2025-12-24 17:17:35 +00:00			`use serde::{Deserialize, Serialize};`
			`use serde_json::Value;`

			`pub struct OllamaProvider {`
			`base_url: String,`
			`}`

			`impl OllamaProvider {`
			`pub fn new(base_url: String) -> Self {`
			`Self { base_url }`
			`}`
feat: auto-detect ollama models 2025-12-25 12:21:58 +00:00
			`pub async fn get_models(base_url: &str) -> Result<Vec<String>, String> {`
			`let client = reqwest::Client::new();`
			`let url = format!("{}/api/tags", base_url.trim_end_matches('/'));`

			`let res = client`
			`.get(&url)`
			`.send()`
			`.await`
			`.map_err(\|e\| format!("Request failed: {}", e))?;`

			`if !res.status().is_success() {`
			`let status = res.status();`
			`let text = res.text().await.unwrap_or_default();`
			`return Err(format!("Ollama API error {}: {}", status, text));`
			`}`

			`let body: OllamaTagsResponse = res`
			`.json()`
			`.await`
			`.map_err(\|e\| format!("Failed to parse response: {}", e))?;`

			`Ok(body.models.into_iter().map(\|m\| m.name).collect())`
			`}`
Story 18: Token-by-token streaming responses - Backend: Added OllamaProvider::chat_stream() with newline-delimited JSON parsing - Backend: Emit chat:token events for each token received from Ollama - Backend: Added futures dependency and stream feature for reqwest - Frontend: Added streamingContent state and chat:token event listener - Frontend: Real-time token display with auto-scroll - Frontend: Markdown and syntax highlighting support for streaming content - Fixed all TypeScript errors (tsc --noEmit) - Fixed all Biome warnings and errors - Fixed all Clippy warnings - Added comprehensive code quality documentation - Added tsc --noEmit to verification checklist Tested and verified: - Tokens stream in real-time - Auto-scroll works during streaming - Tool calls interrupt streaming correctly - Multi-turn conversations work - Smooth performance with no lag 2025-12-27 16:50:18 +00:00
moved from tauri to a server with embedded UI 2026-02-13 12:31:36 +00:00			/// Streaming chat that calls `on_token` for each token chunk.
			`pub async fn chat_stream<F>(`
Story 18: Token-by-token streaming responses - Backend: Added OllamaProvider::chat_stream() with newline-delimited JSON parsing - Backend: Emit chat:token events for each token received from Ollama - Backend: Added futures dependency and stream feature for reqwest - Frontend: Added streamingContent state and chat:token event listener - Frontend: Real-time token display with auto-scroll - Frontend: Markdown and syntax highlighting support for streaming content - Fixed all TypeScript errors (tsc --noEmit) - Fixed all Biome warnings and errors - Fixed all Clippy warnings - Added comprehensive code quality documentation - Added tsc --noEmit to verification checklist Tested and verified: - Tokens stream in real-time - Auto-scroll works during streaming - Tool calls interrupt streaming correctly - Multi-turn conversations work - Smooth performance with no lag 2025-12-27 16:50:18 +00:00			`&self,`
			`model: &str,`
			`messages: &[Message],`
			`tools: &[ToolDefinition],`
Story 13: Implement Stop button with backend cancellation - Add tokio watch channel for cancellation signaling - Implement cancel_chat command - Add cancellation checks in streaming loop and before tool execution - Stop button (■) replaces Send button (↑) during generation - Preserve partial streaming content when cancelled - Clean UX: no error messages on cancellation - Backend properly stops streaming and prevents tool execution Closes Story 13 2025-12-27 18:32:15 +00:00			`cancel_rx: &mut tokio::sync::watch::Receiver<bool>,`
moved from tauri to a server with embedded UI 2026-02-13 12:31:36 +00:00			`mut on_token: F,`
			`) -> Result<CompletionResponse, String>`
			`where`
			`F: FnMut(&str) + Send,`
			`{`
Story 18: Token-by-token streaming responses - Backend: Added OllamaProvider::chat_stream() with newline-delimited JSON parsing - Backend: Emit chat:token events for each token received from Ollama - Backend: Added futures dependency and stream feature for reqwest - Frontend: Added streamingContent state and chat:token event listener - Frontend: Real-time token display with auto-scroll - Frontend: Markdown and syntax highlighting support for streaming content - Fixed all TypeScript errors (tsc --noEmit) - Fixed all Biome warnings and errors - Fixed all Clippy warnings - Added comprehensive code quality documentation - Added tsc --noEmit to verification checklist Tested and verified: - Tokens stream in real-time - Auto-scroll works during streaming - Tool calls interrupt streaming correctly - Multi-turn conversations work - Smooth performance with no lag 2025-12-27 16:50:18 +00:00			`let client = reqwest::Client::new();`
			`let url = format!("{}/api/chat", self.base_url.trim_end_matches('/'));`

			`let ollama_messages: Vec<OllamaRequestMessage> = messages`
			`.iter()`
			`.map(\|m\| {`
			`let tool_calls = m.tool_calls.as_ref().map(\|calls\| {`
			`calls`
			`.iter()`
			`.map(\|tc\| {`
			`let args_val: Value = serde_json::from_str(&tc.function.arguments)`
			`.unwrap_or(Value::String(tc.function.arguments.clone()));`

			`OllamaRequestToolCall {`
			`kind: tc.kind.clone(),`
			`function: OllamaRequestFunctionCall {`
			`name: tc.function.name.clone(),`
			`arguments: args_val,`
			`},`
			`}`
			`})`
			`.collect()`
			`});`

			`OllamaRequestMessage {`
			`role: m.role.clone(),`
			`content: m.content.clone(),`
			`tool_calls,`
			`tool_call_id: m.tool_call_id.clone(),`
			`}`
			`})`
			`.collect();`

			`let request_body = OllamaRequest {`
			`model,`
			`messages: ollama_messages,`
moved from tauri to a server with embedded UI 2026-02-13 12:31:36 +00:00			`stream: true,`
Story 18: Token-by-token streaming responses - Backend: Added OllamaProvider::chat_stream() with newline-delimited JSON parsing - Backend: Emit chat:token events for each token received from Ollama - Backend: Added futures dependency and stream feature for reqwest - Frontend: Added streamingContent state and chat:token event listener - Frontend: Real-time token display with auto-scroll - Frontend: Markdown and syntax highlighting support for streaming content - Fixed all TypeScript errors (tsc --noEmit) - Fixed all Biome warnings and errors - Fixed all Clippy warnings - Added comprehensive code quality documentation - Added tsc --noEmit to verification checklist Tested and verified: - Tokens stream in real-time - Auto-scroll works during streaming - Tool calls interrupt streaming correctly - Multi-turn conversations work - Smooth performance with no lag 2025-12-27 16:50:18 +00:00			`tools,`
			`};`

			`let res = client`
			`.post(&url)`
			`.json(&request_body)`
			`.send()`
			`.await`
			`.map_err(\|e\| format!("Request failed: {}", e))?;`

			`if !res.status().is_success() {`
			`let status = res.status();`
			`let text = res.text().await.unwrap_or_default();`
			`return Err(format!("Ollama API error {}: {}", status, text));`
			`}`

			`let mut stream = res.bytes_stream();`
			`let mut buffer = String::new();`
			`let mut accumulated_content = String::new();`
			`let mut final_tool_calls: Option<Vec<ToolCall>> = None;`

Story 13: Implement Stop button with backend cancellation - Add tokio watch channel for cancellation signaling - Implement cancel_chat command - Add cancellation checks in streaming loop and before tool execution - Stop button (■) replaces Send button (↑) during generation - Preserve partial streaming content when cancelled - Clean UX: no error messages on cancellation - Backend properly stops streaming and prevents tool execution Closes Story 13 2025-12-27 18:32:15 +00:00			`loop {`
			`if *cancel_rx.borrow() {`
			`return Err("Chat cancelled by user".to_string());`
			`}`

			`let chunk_result = tokio::select! {`
			`chunk = stream.next() => {`
			`match chunk {`
			`Some(c) => c,`
			`None => break,`
			`}`
			`}`
			`_ = cancel_rx.changed() => {`
			`if *cancel_rx.borrow() {`
			`return Err("Chat cancelled by user".to_string());`
			`} else {`
			`continue;`
			`}`
			`}`
			`};`

Story 18: Token-by-token streaming responses - Backend: Added OllamaProvider::chat_stream() with newline-delimited JSON parsing - Backend: Emit chat:token events for each token received from Ollama - Backend: Added futures dependency and stream feature for reqwest - Frontend: Added streamingContent state and chat:token event listener - Frontend: Real-time token display with auto-scroll - Frontend: Markdown and syntax highlighting support for streaming content - Fixed all TypeScript errors (tsc --noEmit) - Fixed all Biome warnings and errors - Fixed all Clippy warnings - Added comprehensive code quality documentation - Added tsc --noEmit to verification checklist Tested and verified: - Tokens stream in real-time - Auto-scroll works during streaming - Tool calls interrupt streaming correctly - Multi-turn conversations work - Smooth performance with no lag 2025-12-27 16:50:18 +00:00			`let chunk = chunk_result.map_err(\|e\| format!("Stream error: {}", e))?;`
			`buffer.push_str(&String::from_utf8_lossy(&chunk));`

			`while let Some(newline_pos) = buffer.find('\n') {`
			`let line = buffer[..newline_pos].trim().to_string();`
			`buffer = buffer[newline_pos + 1..].to_string();`

			`if line.is_empty() {`
			`continue;`
			`}`

			`let stream_msg: OllamaStreamResponse =`
			`serde_json::from_str(&line).map_err(\|e\| format!("JSON parse error: {}", e))?;`

			`if !stream_msg.message.content.is_empty() {`
			`accumulated_content.push_str(&stream_msg.message.content);`
moved from tauri to a server with embedded UI 2026-02-13 12:31:36 +00:00			`on_token(&stream_msg.message.content);`
Story 18: Token-by-token streaming responses - Backend: Added OllamaProvider::chat_stream() with newline-delimited JSON parsing - Backend: Emit chat:token events for each token received from Ollama - Backend: Added futures dependency and stream feature for reqwest - Frontend: Added streamingContent state and chat:token event listener - Frontend: Real-time token display with auto-scroll - Frontend: Markdown and syntax highlighting support for streaming content - Fixed all TypeScript errors (tsc --noEmit) - Fixed all Biome warnings and errors - Fixed all Clippy warnings - Added comprehensive code quality documentation - Added tsc --noEmit to verification checklist Tested and verified: - Tokens stream in real-time - Auto-scroll works during streaming - Tool calls interrupt streaming correctly - Multi-turn conversations work - Smooth performance with no lag 2025-12-27 16:50:18 +00:00			`}`

			`if let Some(tool_calls) = stream_msg.message.tool_calls {`
			`final_tool_calls = Some(`
			`tool_calls`
			`.into_iter()`
			`.map(\|tc\| ToolCall {`
			`id: None,`
			`kind: "function".to_string(),`
			`function: FunctionCall {`
			`name: tc.function.name,`
			`arguments: tc.function.arguments.to_string(),`
			`},`
			`})`
			`.collect(),`
			`);`
			`}`

			`if stream_msg.done {`
			`break;`
			`}`
			`}`
			`}`

			`Ok(CompletionResponse {`
			`content: if accumulated_content.is_empty() {`
			`None`
			`} else {`
			`Some(accumulated_content)`
			`},`
			`tool_calls: final_tool_calls,`
Accept story 39: Persistent Claude Code Sessions in Web UI Use --resume <session_id> with claude -p so the web UI claude-code-pty provider maintains full conversation context across messages, identical to a long-running terminal Claude Code session. Changes: - Capture session_id from claude -p stream-json system event - Pass --resume on subsequent messages in same chat session - Thread session_id through ProviderConfig, ChatResult, WsResponse - Frontend stores sessionId per chat, clears on New Session - Unset CLAUDECODE env to allow nested spawning from server - Wait for clean process exit to ensure transcript flush to disk Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com> 2026-02-20 11:51:19 +00:00			`session_id: None,`
Story 18: Token-by-token streaming responses - Backend: Added OllamaProvider::chat_stream() with newline-delimited JSON parsing - Backend: Emit chat:token events for each token received from Ollama - Backend: Added futures dependency and stream feature for reqwest - Frontend: Added streamingContent state and chat:token event listener - Frontend: Real-time token display with auto-scroll - Frontend: Markdown and syntax highlighting support for streaming content - Fixed all TypeScript errors (tsc --noEmit) - Fixed all Biome warnings and errors - Fixed all Clippy warnings - Added comprehensive code quality documentation - Added tsc --noEmit to verification checklist Tested and verified: - Tokens stream in real-time - Auto-scroll works during streaming - Tool calls interrupt streaming correctly - Multi-turn conversations work - Smooth performance with no lag 2025-12-27 16:50:18 +00:00			`})`
			`}`
feat: auto-detect ollama models 2025-12-25 12:21:58 +00:00			`}`

			`#[derive(Deserialize)]`
			`struct OllamaTagsResponse {`
			`models: Vec<OllamaModelTag>,`
			`}`

			`#[derive(Deserialize)]`
			`struct OllamaModelTag {`
			`name: String,`
feat: agent brain (ollama) and chat ui 2025-12-24 17:17:35 +00:00			`}`

			`#[derive(Serialize)]`
			`struct OllamaRequest<'a> {`
			`model: &'a str,`
			`messages: Vec<OllamaRequestMessage>,`
			`stream: bool,`
			`#[serde(skip_serializing_if = "is_empty_tools")]`
			`tools: &'a [ToolDefinition],`
			`}`

			`fn is_empty_tools(tools: &&[ToolDefinition]) -> bool {`
			`tools.is_empty()`
			`}`

			`#[derive(Serialize)]`
			`struct OllamaRequestMessage {`
			`role: Role,`
			`content: String,`
			`#[serde(skip_serializing_if = "Option::is_none")]`
			`tool_calls: Option<Vec<OllamaRequestToolCall>>,`
			`#[serde(skip_serializing_if = "Option::is_none")]`
			`tool_call_id: Option<String>,`
			`}`

			`#[derive(Serialize)]`
			`struct OllamaRequestToolCall {`
			`function: OllamaRequestFunctionCall,`
			`#[serde(rename = "type")]`
			`kind: String,`
			`}`

			`#[derive(Serialize)]`
			`struct OllamaRequestFunctionCall {`
			`name: String,`
			`arguments: Value,`
			`}`

			`#[derive(Deserialize)]`
moved from tauri to a server with embedded UI 2026-02-13 12:31:36 +00:00			`struct OllamaStreamResponse {`
			`message: OllamaStreamMessage,`
			`done: bool,`
feat: agent brain (ollama) and chat ui 2025-12-24 17:17:35 +00:00			`}`

			`#[derive(Deserialize)]`
moved from tauri to a server with embedded UI 2026-02-13 12:31:36 +00:00			`struct OllamaStreamMessage {`
			`#[serde(default)]`
feat: agent brain (ollama) and chat ui 2025-12-24 17:17:35 +00:00			`content: String,`
moved from tauri to a server with embedded UI 2026-02-13 12:31:36 +00:00			`#[serde(default)]`
feat: agent brain (ollama) and chat ui 2025-12-24 17:17:35 +00:00			`tool_calls: Option<Vec<OllamaResponseToolCall>>,`
			`}`

			`#[derive(Deserialize)]`
			`struct OllamaResponseToolCall {`
			`function: OllamaResponseFunctionCall,`
			`}`

			`#[derive(Deserialize)]`
			`struct OllamaResponseFunctionCall {`
			`name: String,`
moved from tauri to a server with embedded UI 2026-02-13 12:31:36 +00:00			`arguments: Value,`
Story 18: Token-by-token streaming responses - Backend: Added OllamaProvider::chat_stream() with newline-delimited JSON parsing - Backend: Emit chat:token events for each token received from Ollama - Backend: Added futures dependency and stream feature for reqwest - Frontend: Added streamingContent state and chat:token event listener - Frontend: Real-time token display with auto-scroll - Frontend: Markdown and syntax highlighting support for streaming content - Fixed all TypeScript errors (tsc --noEmit) - Fixed all Biome warnings and errors - Fixed all Clippy warnings - Added comprehensive code quality documentation - Added tsc --noEmit to verification checklist Tested and verified: - Tokens stream in real-time - Auto-scroll works during streaming - Tool calls interrupt streaming correctly - Multi-turn conversations work - Smooth performance with no lag 2025-12-27 16:50:18 +00:00			`}`

fix: make llm provider async and add tool toggle 2025-12-24 17:32:46 +00:00			`#[async_trait]`
feat: agent brain (ollama) and chat ui 2025-12-24 17:17:35 +00:00			`impl ModelProvider for OllamaProvider {`
fix: make llm provider async and add tool toggle 2025-12-24 17:32:46 +00:00			`async fn chat(`
feat: agent brain (ollama) and chat ui 2025-12-24 17:17:35 +00:00			`&self,`
moved from tauri to a server with embedded UI 2026-02-13 12:31:36 +00:00			`_model: &str,`
			`_messages: &[Message],`
			`_tools: &[ToolDefinition],`
feat: agent brain (ollama) and chat ui 2025-12-24 17:17:35 +00:00			`) -> Result<CompletionResponse, String> {`
moved from tauri to a server with embedded UI 2026-02-13 12:31:36 +00:00			`Err("Non-streaming Ollama chat not implemented for server".to_string())`
feat: agent brain (ollama) and chat ui 2025-12-24 17:17:35 +00:00			`}`
			`}`