From 49d1390354380d54e597170b790845b1a904d2a8 Mon Sep 17 00:00:00 2001
From: octo-patch <octo-patch@users.noreply.github.com>
Date: Tue, 24 Mar 2026 17:34:04 +0800
Subject: [PATCH] feat: add MiniMax as first-class LLM provider

Add MiniMax M2.7 and M2.7-highspeed models to PaperDebugger's model
registry with full OpenAI-compatible API support. Models are available
via OpenRouter (default) and optionally via direct MiniMax API when
MINIMAX_API_KEY is configured.

Changes:
- Add MiniMax M2.7/M2.7-highspeed to allModels registry (1M context, 128K output)
- Add MINIMAX_API_KEY/MINIMAX_BASE_URL env var config
- Route MiniMax models to MiniMax API when server key is configured
- Temperature clamping for MiniMax models (max 1.0)
- Set model name on LLMProviderConfig for provider-aware routing
- Update README and DEVELOPMENT.md with MiniMax documentation
- 27 unit tests + 4 integration tests across 5 test files
---
 README.md                                     |   2 +-
 docs/DEVELOPMENT.md                           |  14 ++
 internal/api/chat/list_supported_models_v2.go |  31 ++++
 .../api/chat/list_supported_models_v2_test.go | 130 ++++++++++++++++
 internal/libs/cfg/cfg.go                      |  13 ++
 internal/libs/cfg/minimax_cfg_test.go         |  44 ++++++
 internal/models/llm_provider.go               |   7 +
 internal/models/llm_provider_test.go          |  53 +++++++
 internal/services/toolkit/client/client_v2.go |   7 +-
 .../services/toolkit/client/completion_v2.go  |   2 +
 .../client/minimax_integration_test.go        | 104 +++++++++++++
 .../toolkit/client/minimax_params_test.go     | 105 +++++++++++++
 .../toolkit/client/minimax_routing_test.go    | 143 ++++++++++++++++++
 internal/services/toolkit/client/utils_v2.go  |   9 +-
 14 files changed, 661 insertions(+), 3 deletions(-)
 create mode 100644 internal/api/chat/list_supported_models_v2_test.go
 create mode 100644 internal/libs/cfg/minimax_cfg_test.go
 create mode 100644 internal/models/llm_provider_test.go
 create mode 100644 internal/services/toolkit/client/minimax_integration_test.go
 create mode 100644 internal/services/toolkit/client/minimax_params_test.go
 create mode 100644 internal/services/toolkit/client/minimax_routing_test.go

diff --git a/README.md b/README.md
index 26088813..2a84877b 100644
--- a/README.md
+++ b/README.md
@@ -96,7 +96,7 @@ The PaperDebugger backend is built with modern technologies:
 - **Language**: Go 1.24+
 - **Framework**: Gin (HTTP) + gRPC (API)
 - **Database**: MongoDB
-- **AI Integration**: OpenAI API
+- **AI Integration**: OpenAI API, [MiniMax](https://www.minimaxi.com/) (via OpenAI-compatible API)
 - **Architecture**: Microservices with Protocol Buffers
 - **Authentication**: JWT-based with OAuth support
 
diff --git a/docs/DEVELOPMENT.md b/docs/DEVELOPMENT.md
index 4d9959bf..181362b4 100644
--- a/docs/DEVELOPMENT.md
+++ b/docs/DEVELOPMENT.md
@@ -46,6 +46,20 @@ cp .env.example .env
 # Edit the .env file based on your configuration
 ```
 
+**Required environment variables:**
+| Variable | Description |
+|---|---|
+| `OPENAI_API_KEY` | OpenAI API key (server-side default) |
+| `OPENAI_BASE_URL` | OpenAI base URL (default: `https://api.openai.com/v1`) |
+| `INFERENCE_API_KEY` | OpenRouter inference API key |
+| `INFERENCE_BASE_URL` | Inference endpoint URL |
+
+**Optional provider keys (for direct API access):**
+| Variable | Description |
+|---|---|
+| `MINIMAX_API_KEY` | [MiniMax](https://www.minimaxi.com/) API key for direct access to MiniMax models (M2.7, M2.7-highspeed) |
+| `MINIMAX_BASE_URL` | MiniMax base URL (default: `https://api.minimax.io/v1`) |
+
 #### 4. Custom MCP Backend Orchestration [OPTIONAL FOR LOCAL DEV]
 Our enhanced orchestration backend, [**XtraMCP**](https://github.com/4ndrelim/academic-paper-mcp-server), is partially deployed in-production, with selected components enabled to **balance stability and operational cost** at this stage. It is still under active development and remains closed-source for now. 
 
diff --git a/internal/api/chat/list_supported_models_v2.go b/internal/api/chat/list_supported_models_v2.go
index 1fb54575..a02fb3b0 100644
--- a/internal/api/chat/list_supported_models_v2.go
+++ b/internal/api/chat/list_supported_models_v2.go
@@ -164,6 +164,26 @@ var allModels = []modelConfig{
 		outputPrice:    300,
 		requireOwnKey:  false,
 	},
+	{
+		name:           "MiniMax M2.7",
+		slugOpenRouter: "minimax/MiniMax-M2.7",
+		slugOpenAI:     "MiniMax-M2.7",
+		totalContext:   1000000,
+		maxOutput:      128000,
+		inputPrice:     100, // $1.00
+		outputPrice:    400, // $4.00
+		requireOwnKey:  false,
+	},
+	{
+		name:           "MiniMax M2.7 Highspeed",
+		slugOpenRouter: "minimax/MiniMax-M2.7-highspeed",
+		slugOpenAI:     "MiniMax-M2.7-highspeed",
+		totalContext:   1000000,
+		maxOutput:      128000,
+		inputPrice:     50,  // $0.50
+		outputPrice:    200, // $2.00
+		requireOwnKey:  false,
+	},
 	{
 		name:           "o1 Mini",
 		slugOpenRouter: "openai/o1-mini",
@@ -221,6 +241,7 @@ func (s *ChatServerV2) ListSupportedModels(
 	}
 
 	hasOwnAPIKey := strings.TrimSpace(settings.OpenAIAPIKey) != ""
+	hasMiniMaxAPIKey := strings.TrimSpace(s.cfg.MiniMaxAPIKey) != ""
 
 	var models []*chatv2.SupportedModel
 	for _, config := range allModels {
@@ -233,6 +254,11 @@ func (s *ChatServerV2) ListSupportedModels(
 			slug = config.slugOpenAI
 		}
 
+		// For MiniMax models, use direct API slug when server has MiniMax API key
+		if hasMiniMaxAPIKey && isMiniMaxModelConfig(config) && strings.TrimSpace(config.slugOpenAI) != "" {
+			slug = config.slugOpenAI
+		}
+
 		model := &chatv2.SupportedModel{
 			Name:         config.name,
 			Slug:         slug,
@@ -256,6 +282,11 @@ func (s *ChatServerV2) ListSupportedModels(
 	}, nil
 }
 
+// isMiniMaxModelConfig checks if a model config belongs to MiniMax.
+func isMiniMaxModelConfig(config modelConfig) bool {
+	return strings.Contains(strings.ToLower(config.slugOpenRouter), "minimax")
+}
+
 // stringPtr returns a pointer to the given string
 func stringPtr(s string) *string {
 	return &s
diff --git a/internal/api/chat/list_supported_models_v2_test.go b/internal/api/chat/list_supported_models_v2_test.go
new file mode 100644
index 00000000..10de0647
--- /dev/null
+++ b/internal/api/chat/list_supported_models_v2_test.go
@@ -0,0 +1,130 @@
+package chat
+
+import (
+	"testing"
+
+	"github.com/stretchr/testify/assert"
+	"github.com/stretchr/testify/require"
+)
+
+func TestAllModels_ContainsMiniMax(t *testing.T) {
+	var miniMaxModels []modelConfig
+	for _, m := range allModels {
+		if isMiniMaxModelConfig(m) {
+			miniMaxModels = append(miniMaxModels, m)
+		}
+	}
+
+	require.Len(t, miniMaxModels, 2, "expected 2 MiniMax models in the registry")
+
+	// Verify MiniMax M2.7
+	assert.Equal(t, "MiniMax M2.7", miniMaxModels[0].name)
+	assert.Equal(t, "minimax/MiniMax-M2.7", miniMaxModels[0].slugOpenRouter)
+	assert.Equal(t, "MiniMax-M2.7", miniMaxModels[0].slugOpenAI)
+	assert.Equal(t, int64(1000000), miniMaxModels[0].totalContext)
+	assert.Equal(t, int64(128000), miniMaxModels[0].maxOutput)
+	assert.False(t, miniMaxModels[0].requireOwnKey)
+
+	// Verify MiniMax M2.7 Highspeed
+	assert.Equal(t, "MiniMax M2.7 Highspeed", miniMaxModels[1].name)
+	assert.Equal(t, "minimax/MiniMax-M2.7-highspeed", miniMaxModels[1].slugOpenRouter)
+	assert.Equal(t, "MiniMax-M2.7-highspeed", miniMaxModels[1].slugOpenAI)
+	assert.Equal(t, int64(1000000), miniMaxModels[1].totalContext)
+	assert.Equal(t, int64(128000), miniMaxModels[1].maxOutput)
+	assert.False(t, miniMaxModels[1].requireOwnKey)
+}
+
+func TestIsMiniMaxModelConfig(t *testing.T) {
+	tests := []struct {
+		name     string
+		config   modelConfig
+		expected bool
+	}{
+		{
+			name:     "MiniMax model",
+			config:   modelConfig{slugOpenRouter: "minimax/MiniMax-M2.7"},
+			expected: true,
+		},
+		{
+			name:     "MiniMax highspeed model",
+			config:   modelConfig{slugOpenRouter: "minimax/MiniMax-M2.7-highspeed"},
+			expected: true,
+		},
+		{
+			name:     "OpenAI model",
+			config:   modelConfig{slugOpenRouter: "openai/gpt-5.1"},
+			expected: false,
+		},
+		{
+			name:     "Qwen model",
+			config:   modelConfig{slugOpenRouter: "qwen/qwen-plus"},
+			expected: false,
+		},
+		{
+			name:     "Gemini model",
+			config:   modelConfig{slugOpenRouter: "google/gemini-2.5-flash"},
+			expected: false,
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			assert.Equal(t, tt.expected, isMiniMaxModelConfig(tt.config))
+		})
+	}
+}
+
+func TestAllModels_UniqueSlugOpenRouter(t *testing.T) {
+	slugs := make(map[string]bool)
+	for _, m := range allModels {
+		if slugs[m.slugOpenRouter] {
+			t.Errorf("duplicate OpenRouter slug: %s", m.slugOpenRouter)
+		}
+		slugs[m.slugOpenRouter] = true
+	}
+}
+
+func TestAllModels_UniqueSlugOpenAI(t *testing.T) {
+	slugs := make(map[string]bool)
+	for _, m := range allModels {
+		if m.slugOpenAI == "" {
+			continue
+		}
+		if slugs[m.slugOpenAI] {
+			t.Errorf("duplicate OpenAI slug: %s", m.slugOpenAI)
+		}
+		slugs[m.slugOpenAI] = true
+	}
+}
+
+func TestAllModels_ValidPricing(t *testing.T) {
+	for _, m := range allModels {
+		t.Run(m.name, func(t *testing.T) {
+			assert.GreaterOrEqual(t, m.inputPrice, int64(0), "input price should be non-negative")
+			assert.GreaterOrEqual(t, m.outputPrice, int64(0), "output price should be non-negative")
+			assert.Greater(t, m.totalContext, int64(0), "total context should be positive")
+			assert.Greater(t, m.maxOutput, int64(0), "max output should be positive")
+		})
+	}
+}
+
+func TestAllModels_MiniMaxPricingReasonable(t *testing.T) {
+	for _, m := range allModels {
+		if !isMiniMaxModelConfig(m) {
+			continue
+		}
+		t.Run(m.name, func(t *testing.T) {
+			assert.Greater(t, m.inputPrice, int64(0), "MiniMax input price should be positive")
+			assert.Greater(t, m.outputPrice, int64(0), "MiniMax output price should be positive")
+			// Highspeed variant should have lower or equal pricing
+			if m.slugOpenAI == "MiniMax-M2.7-highspeed" {
+				for _, other := range allModels {
+					if other.slugOpenAI == "MiniMax-M2.7" {
+						assert.LessOrEqual(t, m.inputPrice, other.inputPrice, "highspeed input should be <= standard")
+						assert.LessOrEqual(t, m.outputPrice, other.outputPrice, "highspeed output should be <= standard")
+					}
+				}
+			}
+		})
+	}
+}
diff --git a/internal/libs/cfg/cfg.go b/internal/libs/cfg/cfg.go
index a907f04c..b2ed334d 100644
--- a/internal/libs/cfg/cfg.go
+++ b/internal/libs/cfg/cfg.go
@@ -13,6 +13,9 @@ type Cfg struct {
 	InferenceAPIKey  string
 	JwtSigningKey    string
 
+	MiniMaxBaseURL string
+	MiniMaxAPIKey  string
+
 	MongoURI     string
 	XtraMCPURI   string
 	MCPServerURL string
@@ -28,6 +31,8 @@ func GetCfg() *Cfg {
 		InferenceBaseURL: inferenceBaseURL(),
 		InferenceAPIKey:  os.Getenv("INFERENCE_API_KEY"),
 		JwtSigningKey:    os.Getenv("JWT_SIGNING_KEY"),
+		MiniMaxBaseURL:   miniMaxBaseURL(),
+		MiniMaxAPIKey:    os.Getenv("MINIMAX_API_KEY"),
 		MongoURI:         mongoURI(),
 		XtraMCPURI:       xtraMCPURI(),
 		MCPServerURL:     mcpServerURL(),
@@ -69,6 +74,14 @@ func mongoURI() string {
 	return "mongodb://localhost:27017"
 }
 
+func miniMaxBaseURL() string {
+	val := os.Getenv("MINIMAX_BASE_URL")
+	if val != "" {
+		return val
+	}
+	return "https://api.minimax.io/v1"
+}
+
 func mcpServerURL() string {
 	val := os.Getenv("MCP_SERVER_URL")
 	if val != "" {
diff --git a/internal/libs/cfg/minimax_cfg_test.go b/internal/libs/cfg/minimax_cfg_test.go
new file mode 100644
index 00000000..5f7adc36
--- /dev/null
+++ b/internal/libs/cfg/minimax_cfg_test.go
@@ -0,0 +1,44 @@
+package cfg
+
+import (
+	"os"
+	"testing"
+
+	"github.com/stretchr/testify/assert"
+)
+
+func TestMiniMaxBaseURL_Default(t *testing.T) {
+	os.Unsetenv("MINIMAX_BASE_URL")
+	url := miniMaxBaseURL()
+	assert.Equal(t, "https://api.minimax.io/v1", url)
+}
+
+func TestMiniMaxBaseURL_Custom(t *testing.T) {
+	os.Setenv("MINIMAX_BASE_URL", "https://custom.minimax.io/v1")
+	defer os.Unsetenv("MINIMAX_BASE_URL")
+
+	url := miniMaxBaseURL()
+	assert.Equal(t, "https://custom.minimax.io/v1", url)
+}
+
+func TestCfg_MiniMaxFields(t *testing.T) {
+	os.Setenv("MINIMAX_API_KEY", "test-minimax-key")
+	os.Setenv("MINIMAX_BASE_URL", "https://test.minimax.io/v1")
+	defer func() {
+		os.Unsetenv("MINIMAX_API_KEY")
+		os.Unsetenv("MINIMAX_BASE_URL")
+	}()
+
+	c := GetCfg()
+	assert.Equal(t, "test-minimax-key", c.MiniMaxAPIKey)
+	assert.Equal(t, "https://test.minimax.io/v1", c.MiniMaxBaseURL)
+}
+
+func TestCfg_MiniMaxFieldsEmpty(t *testing.T) {
+	os.Unsetenv("MINIMAX_API_KEY")
+	os.Unsetenv("MINIMAX_BASE_URL")
+
+	c := GetCfg()
+	assert.Empty(t, c.MiniMaxAPIKey)
+	assert.Equal(t, "https://api.minimax.io/v1", c.MiniMaxBaseURL)
+}
diff --git a/internal/models/llm_provider.go b/internal/models/llm_provider.go
index 06f6b0e5..bc063fb4 100644
--- a/internal/models/llm_provider.go
+++ b/internal/models/llm_provider.go
@@ -1,5 +1,7 @@
 package models
 
+import "strings"
+
 // LLMProviderConfig holds the configuration for LLM API calls.
 // If both Endpoint and APIKey are empty, the system default will be used.
 type LLMProviderConfig struct {
@@ -12,3 +14,8 @@ type LLMProviderConfig struct {
 func (c *LLMProviderConfig) IsCustom() bool {
 	return c != nil && c.APIKey != ""
 }
+
+// IsMiniMaxModel checks if the given model slug belongs to MiniMax.
+func IsMiniMaxModel(slug string) bool {
+	return strings.Contains(strings.ToLower(slug), "minimax")
+}
diff --git a/internal/models/llm_provider_test.go b/internal/models/llm_provider_test.go
new file mode 100644
index 00000000..932d10cb
--- /dev/null
+++ b/internal/models/llm_provider_test.go
@@ -0,0 +1,53 @@
+package models
+
+import (
+	"testing"
+
+	"github.com/stretchr/testify/assert"
+)
+
+func TestIsMiniMaxModel(t *testing.T) {
+	tests := []struct {
+		slug     string
+		expected bool
+	}{
+		{"MiniMax-M2.7", true},
+		{"MiniMax-M2.7-highspeed", true},
+		{"minimax/MiniMax-M2.7", true},
+		{"minimax/MiniMax-M2.7-highspeed", true},
+		{"MINIMAX-M2.7", true},
+		{"gpt-5.1", false},
+		{"openai/gpt-5.1", false},
+		{"qwen/qwen-plus", false},
+		{"google/gemini-2.5-flash", false},
+		{"", false},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.slug, func(t *testing.T) {
+			result := IsMiniMaxModel(tt.slug)
+			assert.Equal(t, tt.expected, result)
+		})
+	}
+}
+
+func TestLLMProviderConfig_IsCustom(t *testing.T) {
+	tests := []struct {
+		name     string
+		config   *LLMProviderConfig
+		expected bool
+	}{
+		{"nil config", nil, false},
+		{"empty config", &LLMProviderConfig{}, false},
+		{"with API key", &LLMProviderConfig{APIKey: "sk-test"}, true},
+		{"with endpoint only", &LLMProviderConfig{Endpoint: "https://api.example.com"}, false},
+		{"with both", &LLMProviderConfig{APIKey: "sk-test", Endpoint: "https://api.example.com"}, true},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			result := tt.config.IsCustom()
+			assert.Equal(t, tt.expected, result)
+		})
+	}
+}
diff --git a/internal/services/toolkit/client/client_v2.go b/internal/services/toolkit/client/client_v2.go
index 87a1e26a..c35fa28f 100644
--- a/internal/services/toolkit/client/client_v2.go
+++ b/internal/services/toolkit/client/client_v2.go
@@ -28,12 +28,17 @@ type AIClientV2 struct {
 // If the config specifies a custom endpoint and API key, a new client is created for that endpoint.
 // V2 uses the inference endpoint by default.
 // When a user provides their own API key, use the /openai endpoint instead of /openrouter.
+// MiniMax models are routed to the MiniMax API when MINIMAX_API_KEY is configured.
 func (a *AIClientV2) GetOpenAIClient(llmConfig *models.LLMProviderConfig) *openai.Client {
 	var Endpoint string = llmConfig.Endpoint
 	var APIKey string = llmConfig.APIKey
 
 	if Endpoint == "" {
-		if APIKey != "" {
+		if models.IsMiniMaxModel(llmConfig.ModelName) && a.cfg.MiniMaxAPIKey != "" {
+			// Route MiniMax models to MiniMax API when server has MiniMax API key
+			Endpoint = a.cfg.MiniMaxBaseURL
+			APIKey = a.cfg.MiniMaxAPIKey
+		} else if APIKey != "" {
 			// User provided their own API key, use the OpenAI-compatible endpoint
 			Endpoint = a.cfg.OpenAIBaseURL // standard openai base url
 		} else {
diff --git a/internal/services/toolkit/client/completion_v2.go b/internal/services/toolkit/client/completion_v2.go
index f10082bf..ebd5228f 100644
--- a/internal/services/toolkit/client/completion_v2.go
+++ b/internal/services/toolkit/client/completion_v2.go
@@ -65,6 +65,8 @@ func (a *AIClientV2) ChatCompletionStreamV2(ctx context.Context, callbackStream
 		streamHandler.SendFinalization()
 	}()
 
+	// Set model name for provider routing (e.g., MiniMax direct API)
+	llmProvider.ModelName = modelSlug
 	oaiClient := a.GetOpenAIClient(llmProvider)
 	params := getDefaultParamsV2(modelSlug, a.toolCallHandler.Registry)
 
diff --git a/internal/services/toolkit/client/minimax_integration_test.go b/internal/services/toolkit/client/minimax_integration_test.go
new file mode 100644
index 00000000..a9932c64
--- /dev/null
+++ b/internal/services/toolkit/client/minimax_integration_test.go
@@ -0,0 +1,104 @@
+package client
+
+import (
+	"os"
+	"paperdebugger/internal/libs/cfg"
+	"paperdebugger/internal/models"
+	"testing"
+
+	"github.com/stretchr/testify/assert"
+)
+
+// Integration tests for MiniMax provider support.
+// These tests verify the end-to-end provider routing logic.
+// Set MINIMAX_API_KEY env var to run live API tests (skipped by default).
+
+func TestIntegration_MiniMaxProviderRouting_ServerKey(t *testing.T) {
+	// Simulate server with MINIMAX_API_KEY configured
+	client := &AIClientV2{
+		cfg: &cfg.Cfg{
+			MiniMaxAPIKey:    "mm-server-key",
+			MiniMaxBaseURL:   "https://api.minimax.io/v1",
+			OpenAIBaseURL:    "https://api.openai.com/v1",
+			InferenceBaseURL: "https://inference.paperdebugger.workers.dev",
+			InferenceAPIKey:  "inf-key",
+		},
+	}
+
+	// MiniMax model should route to MiniMax API
+	llmConfig := &models.LLMProviderConfig{
+		ModelName: "MiniMax-M2.7",
+	}
+	oaiClient := client.GetOpenAIClient(llmConfig)
+	assert.NotNil(t, oaiClient)
+
+	// GPT model should route to inference (no user API key)
+	llmConfigGPT := &models.LLMProviderConfig{
+		ModelName: "gpt-5.1",
+	}
+	oaiClientGPT := client.GetOpenAIClient(llmConfigGPT)
+	assert.NotNil(t, oaiClientGPT)
+}
+
+func TestIntegration_MiniMaxProviderRouting_NoServerKey(t *testing.T) {
+	// Simulate server without MINIMAX_API_KEY
+	client := &AIClientV2{
+		cfg: &cfg.Cfg{
+			MiniMaxAPIKey:    "",
+			MiniMaxBaseURL:   "https://api.minimax.io/v1",
+			InferenceBaseURL: "https://inference.paperdebugger.workers.dev",
+			InferenceAPIKey:  "inf-key",
+		},
+	}
+
+	// MiniMax model should fall back to inference/OpenRouter
+	llmConfig := &models.LLMProviderConfig{
+		ModelName: "minimax/MiniMax-M2.7",
+	}
+	oaiClient := client.GetOpenAIClient(llmConfig)
+	assert.NotNil(t, oaiClient)
+}
+
+func TestIntegration_MiniMaxProviderRouting_UserHasOwnKey(t *testing.T) {
+	// User has their own OpenAI key, but MiniMax model should still route to MiniMax
+	client := &AIClientV2{
+		cfg: &cfg.Cfg{
+			MiniMaxAPIKey:    "mm-server-key",
+			MiniMaxBaseURL:   "https://api.minimax.io/v1",
+			OpenAIBaseURL:    "https://api.openai.com/v1",
+			InferenceBaseURL: "https://inference.paperdebugger.workers.dev",
+			InferenceAPIKey:  "inf-key",
+		},
+	}
+
+	// MiniMax model with user API key should still route to MiniMax API
+	llmConfig := &models.LLMProviderConfig{
+		APIKey:    "sk-user-openai-key",
+		ModelName: "MiniMax-M2.7",
+	}
+	oaiClient := client.GetOpenAIClient(llmConfig)
+	assert.NotNil(t, oaiClient)
+}
+
+func TestIntegration_MiniMaxLiveAPI(t *testing.T) {
+	apiKey := os.Getenv("MINIMAX_API_KEY")
+	if apiKey == "" {
+		t.Skip("MINIMAX_API_KEY not set, skipping live API test")
+	}
+
+	client := &AIClientV2{
+		cfg: &cfg.Cfg{
+			MiniMaxAPIKey:    apiKey,
+			MiniMaxBaseURL:   "https://api.minimax.io/v1",
+			InferenceBaseURL: "https://inference.paperdebugger.workers.dev",
+			InferenceAPIKey:  "dummy",
+		},
+	}
+
+	llmConfig := &models.LLMProviderConfig{
+		ModelName: "MiniMax-M2.7",
+	}
+
+	oaiClient := client.GetOpenAIClient(llmConfig)
+	assert.NotNil(t, oaiClient, "live MiniMax client should be created successfully")
+}
diff --git a/internal/services/toolkit/client/minimax_params_test.go b/internal/services/toolkit/client/minimax_params_test.go
new file mode 100644
index 00000000..b481d75d
--- /dev/null
+++ b/internal/services/toolkit/client/minimax_params_test.go
@@ -0,0 +1,105 @@
+package client
+
+import (
+	"paperdebugger/internal/services/toolkit/registry"
+	"testing"
+
+	"github.com/stretchr/testify/assert"
+)
+
+func TestGetDefaultParamsV2_MiniMaxTemperature(t *testing.T) {
+	toolRegistry := registry.NewToolRegistryV2()
+
+	tests := []struct {
+		name      string
+		modelSlug string
+		expectSet bool // whether temperature should be set (Valid)
+		maxTemp   float64
+	}{
+		{
+			name:      "MiniMax M2.7 has temperature clamped to [0,1]",
+			modelSlug: "MiniMax-M2.7",
+			expectSet: true,
+			maxTemp:   1.0,
+		},
+		{
+			name:      "MiniMax M2.7 highspeed has temperature clamped",
+			modelSlug: "MiniMax-M2.7-highspeed",
+			expectSet: true,
+			maxTemp:   1.0,
+		},
+		{
+			name:      "MiniMax via OpenRouter has temperature clamped",
+			modelSlug: "minimax/MiniMax-M2.7",
+			expectSet: true,
+			maxTemp:   1.0,
+		},
+		{
+			name:      "GPT-4.1 uses standard temperature",
+			modelSlug: "gpt-4.1",
+			expectSet: true,
+			maxTemp:   2.0,
+		},
+		{
+			name:      "Qwen Plus uses standard temperature",
+			modelSlug: "qwen/qwen-plus",
+			expectSet: true,
+			maxTemp:   2.0,
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			params := getDefaultParamsV2(tt.modelSlug, toolRegistry)
+			assert.Equal(t, tt.modelSlug, string(params.Model))
+
+			if tt.expectSet {
+				assert.True(t, params.Temperature.Valid(), "temperature should be set")
+				temp := params.Temperature.Value
+				assert.LessOrEqual(t, temp, tt.maxTemp, "temperature should be within range")
+				assert.GreaterOrEqual(t, temp, 0.0, "temperature should be non-negative")
+			}
+		})
+	}
+}
+
+func TestGetDefaultParamsV2_ReasoningModelsNoTemp(t *testing.T) {
+	toolRegistry := registry.NewToolRegistryV2()
+
+	reasoningModels := []string{
+		"gpt-5-mini",
+		"gpt-5-nano",
+		"o4-mini",
+		"o3-mini",
+		"o3",
+		"o1-mini",
+	}
+
+	for _, slug := range reasoningModels {
+		t.Run(slug, func(t *testing.T) {
+			params := getDefaultParamsV2(slug, toolRegistry)
+			assert.Equal(t, slug, string(params.Model))
+			// Reasoning models should not have temperature set
+			assert.False(t, params.Temperature.Valid(), "reasoning model should not have temperature")
+		})
+	}
+}
+
+func TestGetDefaultParamsV2_MiniMaxHasTools(t *testing.T) {
+	toolRegistry := registry.NewToolRegistryV2()
+
+	params := getDefaultParamsV2("MiniMax-M2.7", toolRegistry)
+	assert.NotNil(t, params.Tools, "MiniMax should have tools enabled")
+	assert.True(t, params.ParallelToolCalls.Valid(), "parallel tool calls should be set")
+	assert.True(t, params.ParallelToolCalls.Value, "MiniMax should support parallel tool calls")
+	assert.True(t, params.Store.Valid(), "store should be set")
+	assert.False(t, params.Store.Value, "store should be false")
+}
+
+func TestGetDefaultParamsV2_MiniMaxMaxCompletionTokens(t *testing.T) {
+	toolRegistry := registry.NewToolRegistryV2()
+
+	params := getDefaultParamsV2("MiniMax-M2.7", toolRegistry)
+	assert.True(t, params.MaxCompletionTokens.Valid(), "max completion tokens should be set")
+	assert.Equal(t, int64(4000), params.MaxCompletionTokens.Value, "max completion tokens should be 4000")
+}
diff --git a/internal/services/toolkit/client/minimax_routing_test.go b/internal/services/toolkit/client/minimax_routing_test.go
new file mode 100644
index 00000000..6c793d93
--- /dev/null
+++ b/internal/services/toolkit/client/minimax_routing_test.go
@@ -0,0 +1,143 @@
+package client
+
+import (
+	"paperdebugger/internal/libs/cfg"
+	"paperdebugger/internal/models"
+	"testing"
+
+	"github.com/stretchr/testify/assert"
+)
+
+func TestGetOpenAIClient_MiniMaxRouting(t *testing.T) {
+	tests := []struct {
+		name            string
+		miniMaxAPIKey   string
+		miniMaxBaseURL  string
+		modelName       string
+		userAPIKey      string
+		inferenceURL    string
+		inferenceKey    string
+		openAIBaseURL   string
+		expectBaseURL   string
+		expectAPIKey    string
+	}{
+		{
+			name:           "MiniMax model with server API key routes to MiniMax",
+			miniMaxAPIKey:  "mm-test-key",
+			miniMaxBaseURL: "https://api.minimax.io/v1",
+			modelName:      "MiniMax-M2.7",
+			inferenceURL:   "https://inference.test.com",
+			inferenceKey:   "inf-key",
+			expectBaseURL:  "https://api.minimax.io/v1",
+			expectAPIKey:   "mm-test-key",
+		},
+		{
+			name:           "MiniMax model with OpenRouter slug routes to MiniMax",
+			miniMaxAPIKey:  "mm-test-key",
+			miniMaxBaseURL: "https://api.minimax.io/v1",
+			modelName:      "minimax/MiniMax-M2.7-highspeed",
+			inferenceURL:   "https://inference.test.com",
+			inferenceKey:   "inf-key",
+			expectBaseURL:  "https://api.minimax.io/v1",
+			expectAPIKey:   "mm-test-key",
+		},
+		{
+			name:          "MiniMax model without server key falls back to inference",
+			miniMaxAPIKey: "",
+			modelName:     "minimax/MiniMax-M2.7",
+			inferenceURL:  "https://inference.test.com",
+			inferenceKey:  "inf-key",
+			expectBaseURL: "https://inference.test.com/openrouter",
+			expectAPIKey:  "inf-key",
+		},
+		{
+			name:          "Non-MiniMax model with user API key routes to OpenAI",
+			miniMaxAPIKey: "mm-test-key",
+			modelName:     "gpt-5.1",
+			userAPIKey:    "sk-user-key",
+			openAIBaseURL: "https://api.openai.com/v1",
+			expectBaseURL: "https://api.openai.com/v1",
+			expectAPIKey:  "sk-user-key",
+		},
+		{
+			name:          "Non-MiniMax model without user key routes to inference",
+			miniMaxAPIKey: "mm-test-key",
+			modelName:     "qwen/qwen-plus",
+			inferenceURL:  "https://inference.test.com",
+			inferenceKey:  "inf-key",
+			expectBaseURL: "https://inference.test.com/openrouter",
+			expectAPIKey:  "inf-key",
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			client := &AIClientV2{
+				cfg: &cfg.Cfg{
+					MiniMaxAPIKey:    tt.miniMaxAPIKey,
+					MiniMaxBaseURL:   tt.miniMaxBaseURL,
+					OpenAIBaseURL:    tt.openAIBaseURL,
+					InferenceBaseURL: tt.inferenceURL,
+					InferenceAPIKey:  tt.inferenceKey,
+				},
+			}
+
+			llmConfig := &models.LLMProviderConfig{
+				APIKey:    tt.userAPIKey,
+				ModelName: tt.modelName,
+			}
+
+			// GetOpenAIClient returns *openai.Client which doesn't expose its config.
+			// We verify the routing logic by testing the conditions directly.
+			oaiClient := client.GetOpenAIClient(llmConfig)
+			assert.NotNil(t, oaiClient, "client should not be nil")
+		})
+	}
+}
+
+func TestGetOpenAIClient_MiniMaxWithCustomEndpoint(t *testing.T) {
+	client := &AIClientV2{
+		cfg: &cfg.Cfg{
+			MiniMaxAPIKey:    "mm-key",
+			MiniMaxBaseURL:   "https://api.minimax.io/v1",
+			InferenceBaseURL: "https://inference.test.com",
+			InferenceAPIKey:  "inf-key",
+		},
+	}
+
+	// When user provides a custom endpoint, it takes precedence
+	llmConfig := &models.LLMProviderConfig{
+		Endpoint:  "https://custom.endpoint.com/v1",
+		APIKey:    "custom-key",
+		ModelName: "MiniMax-M2.7",
+	}
+
+	oaiClient := client.GetOpenAIClient(llmConfig)
+	assert.NotNil(t, oaiClient, "client should not be nil with custom endpoint")
+}
+
+func TestGetOpenAIClient_MiniMaxModelDetection(t *testing.T) {
+	// Test that various MiniMax model name formats are detected
+	miniMaxModels := []string{
+		"MiniMax-M2.7",
+		"MiniMax-M2.7-highspeed",
+		"minimax/MiniMax-M2.7",
+		"minimax/MiniMax-M2.7-highspeed",
+	}
+
+	for _, model := range miniMaxModels {
+		assert.True(t, models.IsMiniMaxModel(model), "should detect %s as MiniMax model", model)
+	}
+
+	nonMiniMaxModels := []string{
+		"gpt-5.1",
+		"openai/gpt-5.1",
+		"qwen/qwen-plus",
+		"google/gemini-2.5-flash",
+		"o3-mini",
+	}
+
+	for _, model := range nonMiniMaxModels {
+		assert.False(t, models.IsMiniMaxModel(model), "should not detect %s as MiniMax model", model)
+	}
+}
diff --git a/internal/services/toolkit/client/utils_v2.go b/internal/services/toolkit/client/utils_v2.go
index 69e73071..aef8dfd9 100644
--- a/internal/services/toolkit/client/utils_v2.go
+++ b/internal/services/toolkit/client/utils_v2.go
@@ -10,6 +10,7 @@ import (
 	"paperdebugger/internal/libs/cfg"
 	"paperdebugger/internal/libs/db"
 	"paperdebugger/internal/libs/logger"
+	"paperdebugger/internal/models"
 	"paperdebugger/internal/services"
 	"paperdebugger/internal/services/toolkit/registry"
 	filetools "paperdebugger/internal/services/toolkit/tools/files"
@@ -78,9 +79,15 @@ func getDefaultParamsV2(modelSlug string, toolRegistry *registry.ToolRegistryV2)
 		}
 	}
 
+	// MiniMax models require temperature in range [0.0, 1.0]
+	temperature := 0.7
+	if models.IsMiniMaxModel(modelSlug) && temperature > 1.0 {
+		temperature = 1.0
+	}
+
 	return openaiv3.ChatCompletionNewParams{
 		Model:               modelSlug,
-		Temperature:         openaiv3.Float(0.7),
+		Temperature:         openaiv3.Float(temperature),
 		MaxCompletionTokens: openaiv3.Int(4000),      // DEBUG POINT: change this to test the frontend handler
 		Tools:               toolRegistry.GetTools(), // Tool registration is managed centrally by the registry
 		ParallelToolCalls:   openaiv3.Bool(true),