Rename max_tokens to max_completion_tokens in chat completion requests

This commit is contained in:
Paulo Santos
2026-02-04 21:24:03 +00:00
committed by GitHub
parent 95f4a27227
commit 725fb1c850
2 changed files with 5 additions and 5 deletions
+3 -3
View File
@@ -72,7 +72,7 @@ describe('inference.ts', () => {
content: 'Hello, AI!', content: 'Hello, AI!',
}, },
], ],
max_tokens: 100, max_completion_tokens: 100,
model: 'gpt-4', model: 'gpt-4',
}) })
@@ -176,7 +176,7 @@ describe('inference.ts', () => {
content: 'Hello, AI!', content: 'Hello, AI!',
}, },
], ],
max_tokens: 100, max_completion_tokens: 100,
model: 'gpt-4', model: 'gpt-4',
response_format: requestWithResponseFormat.responseFormat, response_format: requestWithResponseFormat.responseFormat,
}) })
@@ -228,7 +228,7 @@ describe('inference.ts', () => {
expect(callArgs.tools).toEqual(mockMcpClient.tools) expect(callArgs.tools).toEqual(mockMcpClient.tools)
expect(callArgs.response_format).toBeUndefined() expect(callArgs.response_format).toBeUndefined()
expect(callArgs.model).toBe('gpt-4') expect(callArgs.model).toBe('gpt-4')
expect(callArgs.max_tokens).toBe(100) expect(callArgs.max_completion_tokens).toBe(100)
// Verify OpenAI client was initialized with empty custom headers // Verify OpenAI client was initialized with empty custom headers
expect(mockOpenAIClient).toHaveBeenCalledWith({ expect(mockOpenAIClient).toHaveBeenCalledWith({
+2 -2
View File
@@ -47,7 +47,7 @@ export async function simpleInference(request: InferenceRequest): Promise<string
const chatCompletionRequest: OpenAI.Chat.Completions.ChatCompletionCreateParams = { const chatCompletionRequest: OpenAI.Chat.Completions.ChatCompletionCreateParams = {
messages: request.messages as OpenAI.Chat.Completions.ChatCompletionMessageParam[], messages: request.messages as OpenAI.Chat.Completions.ChatCompletionMessageParam[],
max_tokens: request.maxTokens, max_completion_tokens: request.maxTokens,
model: request.modelName, model: request.modelName,
temperature: request.temperature, temperature: request.temperature,
top_p: request.topP, top_p: request.topP,
@@ -95,7 +95,7 @@ export async function mcpInference(
const chatCompletionRequest: OpenAI.Chat.Completions.ChatCompletionCreateParams = { const chatCompletionRequest: OpenAI.Chat.Completions.ChatCompletionCreateParams = {
messages: messages as OpenAI.Chat.Completions.ChatCompletionMessageParam[], messages: messages as OpenAI.Chat.Completions.ChatCompletionMessageParam[],
max_tokens: request.maxTokens, max_completion_tokens: request.maxTokens,
model: request.modelName, model: request.modelName,
temperature: request.temperature, temperature: request.temperature,
top_p: request.topP, top_p: request.topP,