feat sambanova models (#1858)

Co-authored-by: jorgep_snova <jorge.piedrahita@sambanovasystems.com> Co-authored-by: João Moura <joaomdmoura@gmail.com>
2026-01-09 16:18:30 +00:00 · 2025-01-07 10:03:26 -05:00
parent 673a38c5d9
commit 0e94236735
5 changed files with 47 additions and 0 deletions
--- a/docs/concepts/cli.mdx
+++ b/docs/concepts/cli.mdx
@@ -161,6 +161,7 @@ The CLI will initially prompt for API keys for the following services:
 * Groq
 * Anthropic
 * Google Gemini
 * SambaNova
 When you select a provider, the CLI will prompt you to enter your API key.
--- a/docs/concepts/llms.mdx
+++ b/docs/concepts/llms.mdx
@@ -146,6 +146,19 @@ Here's a detailed breakdown of supported models and their capabilities, you can
      Groq is known for its fast inference speeds, making it suitable for real-time applications.
    </Tip>
  </Tab>
  <Tab title="SambaNova">
    | Model | Context Window | Best For |
    |-------|---------------|-----------|
    | Llama 3.1 70B/8B | Up to 131,072 tokens | High-performance, large context tasks |
    | Llama 3.1 405B | 8,192 tokens | High-performance and output quality |
    | Llama 3.2 Series | 8,192 tokens | General-purpose tasks, multimodal |
    | Llama 3.3 70B | Up to 131,072 tokens | High-performance and output quality |
    | Qwen2 family | 8,192 tokens | High-performance and output quality |
    <Tip>
      [SambaNova](https://cloud.sambanova.ai/) has several models with fast inference speed at full precision.
    </Tip>
  </Tab>
  <Tab title="Others">
    | Provider | Context Window | Key Features |
    |----------|---------------|--------------|
--- a/docs/how-to/llm-connections.mdx
+++ b/docs/how-to/llm-connections.mdx
@@ -32,6 +32,7 @@ LiteLLM supports a wide range of providers, including but not limited to:
 - Cloudflare Workers AI
 - DeepInfra
 - Groq
 - SambaNova
 - [NVIDIA NIMs](https://docs.api.nvidia.com/nim/reference/models-1)
 - And many more!
--- a/src/crewai/cli/constants.py
+++ b/src/crewai/cli/constants.py
@@ -85,6 +85,12 @@ ENV_VARS = {
            "key_name": "CEREBRAS_API_KEY",
        },
    ],
    "sambanova": [
        {
            "prompt": "Enter your SambaNovaCloud API key (press Enter to skip)",
            "key_name": "SAMBANOVA_API_KEY",
        }
    ],
 }
@@ -98,6 +104,7 @@ PROVIDERS = [
    "bedrock",
    "azure",
    "cerebras",
    "sambanova",
 ]
 MODELS = {
@@ -156,6 +163,19 @@ MODELS = {
        "bedrock/mistral.mistral-7b-instruct-v0:2",
        "bedrock/mistral.mixtral-8x7b-instruct-v0:1",
    ],
    "sambanova": [
        "sambanova/Meta-Llama-3.3-70B-Instruct",
        "sambanova/QwQ-32B-Preview",
        "sambanova/Qwen2.5-72B-Instruct",
        "sambanova/Qwen2.5-Coder-32B-Instruct",
        "sambanova/Meta-Llama-3.1-405B-Instruct",
        "sambanova/Meta-Llama-3.1-70B-Instruct",
        "sambanova/Meta-Llama-3.1-8B-Instruct",
        "sambanova/Llama-3.2-90B-Vision-Instruct",
        "sambanova/Llama-3.2-11B-Vision-Instruct",
        "sambanova/Meta-Llama-3.2-3B-Instruct",
        "sambanova/Meta-Llama-3.2-1B-Instruct",
    ],
 }
 DEFAULT_LLM_MODEL = "gpt-4o-mini"
--- a/src/crewai/llm.py
+++ b/src/crewai/llm.py
@@ -76,6 +76,18 @@ LLM_CONTEXT_WINDOW_SIZES = {
    "mixtral-8x7b-32768": 32768,
    "llama-3.3-70b-versatile": 128000,
    "llama-3.3-70b-instruct": 128000,
    # SambaNova
    "Meta-Llama-3.3-70B-Instruct": 131072,
    "QwQ-32B-Preview": 8192,
    "Qwen2.5-72B-Instruct": 8192,
    "Qwen2.5-Coder-32B-Instruct": 8192,
    "Meta-Llama-3.1-405B-Instruct": 8192,
    "Meta-Llama-3.1-70B-Instruct": 131072,
    "Meta-Llama-3.1-8B-Instruct": 131072,
    "Llama-3.2-90B-Vision-Instruct": 16384,
    "Llama-3.2-11B-Vision-Instruct": 16384,
    "Meta-Llama-3.2-3B-Instruct": 4096,
    "Meta-Llama-3.2-1B-Instruct": 16384,
 }
 DEFAULT_CONTEXT_WINDOW_SIZE = 8192