From 2ef0930477b3ec1b036c3a1763ee79676b631642 Mon Sep 17 00:00:00 2001 From: Tim Pietrusky Date: Wed, 10 Dec 2025 21:27:32 +0100 Subject: [PATCH] fix(agent): switch model from gpt-oss-120b to qwen3-32b-awq gpt-oss-120b returns malformed JSON for tool calls, breaking agent functionality. qwen3-32b-awq properly supports tool calling. --- docs/context.md | 4 ++-- src/mastra/agents/weather-agent.ts | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/docs/context.md b/docs/context.md index b5f6422..543ec75 100644 --- a/docs/context.md +++ b/docs/context.md @@ -10,7 +10,7 @@ This document outlines the key technical conventions and architectural decisions - External functionalities are integrated as Mastra Tools or via MCP (Model Context Protocol). - Multiple agents can coexist in a single Mastra instance. - **AI Provider:** RunPod AI SDK Provider (`@runpod/ai-sdk-provider` v0.9.0) - - Uses OpenAI GPT-OSS-120B model (`openai/gpt-oss-120b`) for agent reasoning. + - Uses Qwen3-32B model (`qwen/qwen3-32b-awq`) for agent reasoning. - Supports streaming and non-streaming text generation. - **Server Framework:** Hono (via Mastra's built-in server) - **Storage:** Optional PostgreSQL with PgVector extension (defaults to in-memory) @@ -125,4 +125,4 @@ When all DB credentials are provided, PostgreSQL with PgVector is used. Otherwis - `README.md`: Hub-specific documentation displayed on the Hub page - **Endpoint Type:** Load Balancer (`LB`) for high availability - **Runtime:** CPU serverless (no GPU required) -- **Category:** `language` (AI/LLM category) \ No newline at end of file +- **Category:** `language` (AI/LLM category) diff --git a/src/mastra/agents/weather-agent.ts b/src/mastra/agents/weather-agent.ts index 1f87682..9df4c67 100644 --- a/src/mastra/agents/weather-agent.ts +++ b/src/mastra/agents/weather-agent.ts @@ -23,7 +23,7 @@ export const weatherAgent = new Agent({ Use the weatherTool to fetch current weather data. 
`, - model: runpod("openai/gpt-oss-120b"), + model: runpod("qwen/qwen3-32b-awq"), tools: { weatherTool }, memory, });