Commit 1cc1df8 (parent 1d2fbee)

feat: add model info with context len and usage cost
fix: OpenRouter messages handling, add App title

15 files changed: +521 −93 lines

.gitignore

Lines changed: 2 additions & 1 deletion

@@ -7,4 +7,5 @@ logs/
 history.json
 huly-coder-local.yaml
 /memory.yaml
-/.fastembed_cache/
+/.fastembed_cache/
+openrouter_models.json

Cargo.lock

Lines changed: 2 additions & 2 deletions
Generated file; diff not rendered by default.

src/agent/event.rs

Lines changed: 1 addition & 8 deletions

@@ -43,13 +43,6 @@ impl Display for AgentState {
     }
 }

-#[derive(Clone, Debug, Default)]
-pub struct AgentStatus {
-    pub current_tokens: u32,
-    pub max_tokens: u32,
-    pub state: AgentState,
-}
-
 /// Status of a command tool call
 #[derive(Clone, Debug, Default)]
 pub struct AgentCommandStatus {
@@ -66,7 +59,7 @@ pub enum AgentOutputEvent {
     UpdateMessage(Message),
     NewTask,
     CommandStatus(Vec<AgentCommandStatus>),
-    AgentStatus(AgentStatus),
+    AgentStatus(u32, u32, AgentState),
     HighlightFile(String, bool),
 }
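With the dedicated AgentStatus struct removed, the event now carries input tokens, completion tokens, and state positionally. A minimal receiver-side sketch of the new shape (the stand-in types and handler below are illustrative, not code from this commit):

// Stand-in types mirroring src/agent/event.rs; handle() itself is
// hypothetical, not part of this commit.
#[derive(Debug)]
enum AgentState {
    Idle,
}

enum AgentOutputEvent {
    // (input tokens, completion tokens, state) — the new tuple shape
    AgentStatus(u32, u32, AgentState),
}

fn handle(event: &AgentOutputEvent) {
    match event {
        AgentOutputEvent::AgentStatus(input_tokens, completion_tokens, state) => {
            // Both directions of token usage now reach the UI, replacing
            // the old single `current_tokens` / `max_tokens: 1` payload.
            println!("in={input_tokens} out={completion_tokens} state={state:?}");
        }
    }
}

fn main() {
    handle(&AgentOutputEvent::AgentStatus(1_200, 350, AgentState::Idle));
}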

src/agent/mod.rs

Lines changed: 59 additions & 11 deletions

@@ -51,7 +51,6 @@ pub use event::AgentOutputEvent;
 use tokio::sync::RwLock;

 use self::event::AgentState;
-use self::event::AgentStatus;
 use self::utils::*;

 pub struct Agent {
@@ -66,7 +65,8 @@ pub struct Agent {
     memory: Arc<RwLock<MemoryManager>>,
     memory_index: Option<InMemoryVectorIndex<rig_fastembed::EmbeddingModel, Entity>>,
     process_registry: Arc<RwLock<ProcessRegistry>>,
-    current_tokens: u32,
+    current_input_tokens: u32,
+    current_completion_tokens: u32,
     state: AgentState,
 }

@@ -93,6 +93,10 @@ impl Display for AgentError {
     }
 }

+fn count_tokens(system_prompt: &str) -> u32 {
+    system_prompt.len() as u32 / 4
+}
+
 impl Agent {
     pub fn new(
         config: Config,
@@ -108,7 +112,8 @@ impl Agent {
             messages,
             stream: None,
             assistant_content: None,
-            current_tokens: 0,
+            current_input_tokens: 0,
+            current_completion_tokens: 0,
             memory: Arc::new(RwLock::new(MemoryManager::new(false))),
             process_registry: Arc::new(RwLock::new(ProcessRegistry::default())),
             memory_index: None,
@@ -338,7 +343,7 @@ impl Agent {
         self.messages[last_idx] = message;
     }

-    async fn process_messages(&mut self) -> Result<(), AgentError> {
+    async fn process_messages(&mut self, system_prompt_token_count: u32) -> Result<(), AgentError> {
         if self.state.is_paused() {
             return Ok(());
         }
@@ -494,7 +499,49 @@ impl Agent {
         if let Some(raw_response) = response.raw_response {
             let usage = raw_response.usage;
             tracing::info!("Usage: {:?}", usage);
-            self.current_tokens = usage.total_tokens as u32;
+            if usage.total_tokens > 0 {
+                self.current_input_tokens = usage.prompt_tokens as u32;
+                self.current_completion_tokens =
+                    (usage.total_tokens - usage.prompt_tokens) as u32;
+            } else {
+                // try to calculate approximate tokens
+                self.current_input_tokens = system_prompt_token_count
+                    + self
+                        .messages
+                        .iter()
+                        .map(|m| match m {
+                            Message::User { content } => content
+                                .iter()
+                                .map(|c| match c {
+                                    UserContent::Text(text) => count_tokens(&text.text),
+                                    UserContent::ToolResult(tool_result) => tool_result
+                                        .content
+                                        .iter()
+                                        .map(|t| match t {
+                                            ToolResultContent::Text(text) => {
+                                                count_tokens(&text.text)
+                                            }
+                                            _ => 0,
+                                        })
+                                        .sum::<u32>(),
+                                    _ => 0,
+                                })
+                                .sum::<u32>(),
+                            Message::Assistant { content } => content
+                                .iter()
+                                .map(|c| match c {
+                                    AssistantContent::Text(text) => {
+                                        count_tokens(&text.text)
+                                    }
+                                    AssistantContent::ToolCall(tool_call) => count_tokens(
+                                        &serde_json::to_string(tool_call).unwrap(),
+                                    ),
+                                })
+                                .sum::<u32>(),
+                        })
+                        .sum::<u32>();
+                self.current_completion_tokens = 0;
+            }
         }
         self.assistant_content = None;
         if matches!(self.state, AgentState::Completed(false)) {
@@ -517,6 +564,7 @@ impl Agent {
         );
         let system_prompt =
             prepare_system_prompt(&self.config.workspace, &self.config.user_instructions).await;
+        let system_prompt_token_count = count_tokens(&system_prompt);
         self.agent = Some(
             Self::build_agent(BuildAgentContext {
                 config: &self.config,
@@ -577,7 +625,7 @@ impl Agent {
                }
            }
        }
-        if let Err(e) = self.process_messages().await {
+        if let Err(e) = self.process_messages(system_prompt_token_count).await {
            tracing::debug!("persist_history");
            persist_history(&self.messages);
            tracing::error!("Error processing messages: {}", e);
@@ -615,11 +663,11 @@ impl Agent {
        self.state = state;
        if !self.sender.is_closed() {
            self.sender
-                .send(AgentOutputEvent::AgentStatus(AgentStatus {
-                    current_tokens: self.current_tokens,
-                    max_tokens: 1,
-                    state: self.state.clone(),
-                }))
+                .send(AgentOutputEvent::AgentStatus(
+                    self.current_input_tokens,
+                    self.current_completion_tokens,
+                    self.state.clone(),
+                ))
                .unwrap();
        }
    }
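The fallback branch above kicks in when the provider reports total_tokens == 0 and approximates usage with the common chars/4 heuristic. A self-contained sketch of the same estimate, assuming a simplified stand-in for rig's Message type:

// The chars/4 heuristic added in this commit, applied to a simplified
// message type (rig's Message enum is richer; SimpleMessage is a stand-in).
fn count_tokens(text: &str) -> u32 {
    text.len() as u32 / 4
}

enum SimpleMessage {
    User(String),
    Assistant(String),
}

fn approximate_input_tokens(system_prompt: &str, messages: &[SimpleMessage]) -> u32 {
    count_tokens(system_prompt)
        + messages
            .iter()
            .map(|m| match m {
                SimpleMessage::User(t) | SimpleMessage::Assistant(t) => count_tokens(t),
            })
            .sum::<u32>()
}

fn main() {
    let history = vec![
        SimpleMessage::User("Add a model info module".to_string()),
        SimpleMessage::Assistant("Done; see src/providers/model_info.rs".to_string()),
    ];
    // ~4 characters per token is a rough average for English text;
    // real BPE tokenizers can deviate substantially.
    println!("{} tokens (approx.)", approximate_input_tokens("You are a coding agent.", &history));
}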

src/main.rs

Lines changed: 5 additions & 1 deletion

@@ -9,6 +9,7 @@ use crossterm::terminal::disable_raw_mode;
 use crossterm::terminal::enable_raw_mode;
 use crossterm::terminal::EnterAlternateScreen;
 use crossterm::terminal::LeaveAlternateScreen;
+use providers::model_info::model_info;
 use ratatui::prelude::CrosstermBackend;
 use ratatui::DefaultTerminal;
 use ratatui::Terminal;
@@ -107,6 +108,9 @@ async fn main() -> color_eyre::Result<()> {
         Vec::new()
     };

+    let model_info = model_info(&config).await?;
+    tracing::info!("Model info: {:?}", model_info);
+
     let mut agent = agent::Agent::new(
         config.clone(),
         control_receiver,
@@ -120,7 +124,7 @@ async fn main() -> color_eyre::Result<()> {
     });

     let terminal = init_tui().unwrap();
-    let result = tui::App::new(config, control_sender, output_receiver, history)
+    let result = tui::App::new(config, model_info, control_sender, output_receiver, history)
         .run(terminal)
         .await;
     let _ = agent_handler.await;
src/providers/anthropic_models.json

Lines changed: 44 additions & 0 deletions

@@ -0,0 +1,44 @@
+[
+  {
+    "model_id": "claude-opus-4",
+    "input_price": 0.000015,
+    "output_price": 0.000075,
+    "max_context_tokens": 200000
+  },
+  {
+    "model_id": "claude-sonnet-4",
+    "input_price": 0.000003,
+    "output_price": 0.000015,
+    "max_context_tokens": 200000
+  },
+  {
+    "model_id": "claude-sonnet-3.7",
+    "input_price": 0.000003,
+    "output_price": 0.000015,
+    "max_context_tokens": 200000
+  },
+  {
+    "model_id": "claude-sonnet-3.5",
+    "input_price": 0.000003,
+    "output_price": 0.000015,
+    "max_context_tokens": 200000
+  },
+  {
+    "model_id": "claude-haiku-3.5",
+    "input_price": 0.0000008,
+    "output_price": 0.000004,
+    "max_context_tokens": 200000
+  },
+  {
+    "model_id": "claude-opus-3",
+    "input_price": 0.000015,
+    "output_price": 0.000075,
+    "max_context_tokens": 200000
+  },
+  {
+    "model_id": "claude-haiku-3",
+    "input_price": 0.00000025,
+    "output_price": 0.00000125,
+    "max_context_tokens": 200000
+  }
+]
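Prices in this table are USD per token, so claude-opus-4 input at 0.000015 is $15 per million tokens. With the input/completion counts the agent now tracks, per-request cost is a two-term product; an illustrative sketch (usage_cost is a hypothetical helper, not code from this commit):

// Illustrative cost arithmetic enabled by the pricing table above;
// usage_cost() is a hypothetical helper, not code from this commit.
fn usage_cost(
    input_tokens: u32,
    completion_tokens: u32,
    input_price: f64,
    output_price: f64,
) -> f64 {
    input_tokens as f64 * input_price + completion_tokens as f64 * output_price
}

fn main() {
    // claude-sonnet-4 from the table: $3 / $15 per million tokens.
    let cost = usage_cost(12_000, 1_500, 0.000003, 0.000015);
    // 12_000 * 3e-6 + 1_500 * 15e-6 = 0.036 + 0.0225 = 0.0585
    assert!((cost - 0.0585).abs() < 1e-6);
    println!("${cost:.4}");
}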

src/providers/mod.rs

Lines changed: 2 additions & 0 deletions

@@ -1,11 +1,13 @@
 // Copyright © 2025 Huly Labs. Use of this source code is governed by the MIT license.
+
 use async_trait::async_trait;
 use rig::agent::Agent;
 use rig::completion::CompletionError;
 use rig::message::Message;
 use rig::streaming::{StreamingCompletion, StreamingCompletionResponse};
 use rig::tool::ToolSet;

+pub mod model_info;
 pub mod openrouter;

 #[async_trait]

src/providers/model_info.rs

Lines changed: 127 additions & 0 deletions

@@ -0,0 +1,127 @@
+// Copyright © 2025 Huly Labs. Use of this source code is governed by the MIT license.
+
+use std::{fs, path::Path};
+
+use serde::Deserialize;
+
+use crate::config::Config;
+
+const OPENROUTER_MODELS_FILE: &str = "openrouter_models.json";
+const ANTHROPIC_MODELS: &str = include_str!("anthropic_models.json");
+const OPENAI_MODELS: &str = include_str!("openai_models.json");
+
+#[derive(Debug, Clone)]
+pub struct ModelInfo {
+    pub input_price: f64,
+    pub completion_price: f64,
+    pub max_tokens: u32,
+}
+
+#[derive(Deserialize)]
+struct LMStudioModelInfo {
+    pub id: String,
+    pub loaded_context_length: Option<u32>,
+    pub max_context_length: u32,
+}
+
+#[derive(Deserialize)]
+struct OpenRouterPriceInfo {
+    pub prompt: String,
+    pub completion: String,
+}
+
+#[derive(Deserialize)]
+struct OpenRouterModelInfo {
+    pub id: String,
+    pub pricing: OpenRouterPriceInfo,
+    pub context_length: u32,
+}
+
+#[derive(Deserialize)]
+struct AnthropicModelInfo {
+    pub model_id: String,
+    pub input_price: f64,
+    pub output_price: f64,
+    pub max_context_tokens: u32,
+}
+
+#[derive(Deserialize)]
+struct OpenAIModelInfo {
+    pub model_id: String,
+    pub input_price: f64,
+    pub output_price: f64,
+    pub max_context_tokens: u32,
+}
+
+pub async fn model_info(config: &Config) -> color_eyre::Result<ModelInfo> {
+    match config.provider {
+        crate::config::ProviderKind::OpenAI => {
+            let models: Vec<OpenAIModelInfo> = serde_json::from_str(OPENAI_MODELS)?;
+            models
+                .iter()
+                .find(|model| config.model.contains(&model.model_id))
+                .map(|model| ModelInfo {
+                    input_price: model.input_price,
+                    completion_price: model.output_price,
+                    max_tokens: model.max_context_tokens,
+                })
+                .ok_or_else(|| color_eyre::eyre::eyre!("Model not found"))
+        }
+        crate::config::ProviderKind::OpenRouter => {
+            let models: Vec<OpenRouterModelInfo> =
+                serde_json::from_value(if Path::new(OPENROUTER_MODELS_FILE).exists() {
+                    let data = fs::read_to_string(OPENROUTER_MODELS_FILE)?;
+                    serde_json::from_str(&data)?
+                } else {
+                    let mut data = reqwest::get("https://openrouter.ai/api/v1/models")
+                        .await?
+                        .json::<serde_json::Value>()
+                        .await?;
+                    let data = data["data"].take();
+                    fs::write(OPENROUTER_MODELS_FILE, data.to_string())?;
+                    data
+                })?;
+            models
+                .iter()
+                .find(|model| model.id == config.model)
+                .map(|model| ModelInfo {
+                    input_price: model.pricing.prompt.parse::<f64>().unwrap_or(0.0),
+                    completion_price: model.pricing.completion.parse::<f64>().unwrap_or(0.0),
+                    max_tokens: model.context_length,
+                })
+                .ok_or_else(|| color_eyre::eyre::eyre!("Model not found"))
+        }
+        crate::config::ProviderKind::LMStudio => {
+            let url = config
+                .provider_base_url
+                .clone()
+                .unwrap_or("http://127.0.0.1:1234/v1".to_string())
+                .replace("/v1", "/api/v0/models");
+            let mut data = reqwest::get(url).await?.json::<serde_json::Value>().await?;
+            let models: Vec<LMStudioModelInfo> = serde_json::from_value(data["data"].take())?;
+            models
+                .iter()
+                .find(|model| model.id == config.model)
+                .map(|model| ModelInfo {
+                    input_price: 0.0,
+                    completion_price: 0.0,
+                    max_tokens: model
+                        .loaded_context_length
+                        .unwrap_or(model.max_context_length),
+                })
+                .ok_or_else(|| color_eyre::eyre::eyre!("Model not found"))
+        }
+        crate::config::ProviderKind::Anthropic => {
+            let models: Vec<AnthropicModelInfo> = serde_json::from_str(ANTHROPIC_MODELS)?;
+            models
+                .iter()
+                .find(|model| config.model.contains(&model.model_id))
+                .map(|model| ModelInfo {
+                    input_price: model.input_price,
+                    completion_price: model.output_price,
+                    max_tokens: model.max_context_tokens,
+                })
+                .ok_or_else(|| color_eyre::eyre::eyre!("Model not found"))
+        }
+    }
+}
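Note the OpenRouter arm fetches https://openrouter.ai/api/v1/models once and caches the payload to openrouter_models.json, which explains the new .gitignore entry; subsequent runs read from disk. One natural consumer of max_tokens is a context-fill gauge; a hypothetical sketch, not part of this commit:

// Hypothetical context-fill gauge; not part of this commit. The struct
// keeps only the field this sketch needs (the real ModelInfo also
// carries input_price and completion_price).
struct ModelInfo {
    max_tokens: u32,
}

fn context_fill_percent(info: &ModelInfo, input_tokens: u32, completion_tokens: u32) -> f64 {
    100.0 * (input_tokens + completion_tokens) as f64 / info.max_tokens as f64
}

fn main() {
    let info = ModelInfo { max_tokens: 200_000 };
    println!("{:.1}% of context used", context_fill_percent(&info, 150_000, 4_000));
}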
