diff --git a/relay/channel/ollama/dto.go b/relay/channel/ollama/dto.go index a954c607..c4d97c86 100644 --- a/relay/channel/ollama/dto.go +++ b/relay/channel/ollama/dto.go @@ -11,6 +11,7 @@ type OllamaRequest struct { Topp float64 `json:"top_p,omitempty"` TopK int `json:"top_k,omitempty"` Stop any `json:"stop,omitempty"` + MaxTokens uint `json:"max_tokens,omitempty"` Tools []dto.ToolCall `json:"tools,omitempty"` ResponseFormat any `json:"response_format,omitempty"` FrequencyPenalty float64 `json:"frequency_penalty,omitempty"` diff --git a/relay/channel/ollama/relay-ollama.go b/relay/channel/ollama/relay-ollama.go index 8b53fbfb..89e9c214 100644 --- a/relay/channel/ollama/relay-ollama.go +++ b/relay/channel/ollama/relay-ollama.go @@ -58,6 +58,7 @@ func requestOpenAI2Ollama(request dto.GeneralOpenAIRequest) (*OllamaRequest, err TopK: request.TopK, Stop: Stop, Tools: request.Tools, + MaxTokens: request.MaxTokens, ResponseFormat: request.ResponseFormat, FrequencyPenalty: request.FrequencyPenalty, PresencePenalty: request.PresencePenalty,