diff --git a/src/cost_tracker.py b/src/cost_tracker.py index 3b59720b..5016f7be 100644 --- a/src/cost_tracker.py +++ b/src/cost_tracker.py @@ -50,6 +50,17 @@ MODEL_PRICING = [ (r"qwen-vl-plus", {"input_per_mtok": 0.21, "output_per_mtok": 0.63}), (r"qwen-vl-max", {"input_per_mtok": 0.50, "output_per_mtok": 1.50}), (r"qwen-audio", {"input_per_mtok": 0.10, "output_per_mtok": 0.30}), + (r"grok-2", {"input_per_mtok": 2.00, "output_per_mtok": 10.00}), + (r"grok-2-vision", {"input_per_mtok": 2.00, "output_per_mtok": 10.00}), + (r"grok-beta", {"input_per_mtok": 5.00, "output_per_mtok": 15.00}), + (r"llama-3\.1-8b-instant", {"input_per_mtok": 0.05, "output_per_mtok": 0.08}), + (r"llama-3\.1-70b-versatile", {"input_per_mtok": 0.59, "output_per_mtok": 0.79}), + (r"llama-3\.1-405b-reasoning", {"input_per_mtok": 3.00, "output_per_mtok": 3.00}), + (r"llama-3\.2-1b-preview", {"input_per_mtok": 0.04, "output_per_mtok": 0.04}), + (r"llama-3\.2-3b-preview", {"input_per_mtok": 0.06, "output_per_mtok": 0.06}), + (r"llama-3\.2-11b-vision-preview", {"input_per_mtok": 0.18, "output_per_mtok": 0.18}), + (r"llama-3\.2-90b-vision-preview", {"input_per_mtok": 0.90, "output_per_mtok": 0.90}), + (r"llama-3\.3-70b-specdec", {"input_per_mtok": 0.59, "output_per_mtok": 0.79}), ] def estimate_cost(model: str, input_tokens: int, output_tokens: int) -> float: diff --git a/src/models.py b/src/models.py index 0db0795f..53735156 100644 --- a/src/models.py +++ b/src/models.py @@ -53,7 +53,7 @@ from src.paths import get_config_path #region: Constants -PROVIDERS: List[str] = ["gemini", "anthropic", "gemini_cli", "deepseek", "minimax", "qwen"] +PROVIDERS: List[str] = ["gemini", "anthropic", "gemini_cli", "deepseek", "minimax", "qwen", "grok", "llama"] AGENT_TOOL_NAMES: List[str] = [ "run_powershell",