From 8910efb1da1146a52de9a300a2b9ecfeecb275d4 Mon Sep 17 00:00:00 2001 From: xy3 <120182408@qq.com> Date: Sat, 8 Feb 2025 11:54:08 +0800 Subject: [PATCH 1/2] =?UTF-8?q?=E6=9B=B4=E6=AD=A3=E7=A1=85=E5=9F=BA?= =?UTF-8?q?=E6=B5=81=E5=8A=A8=E7=9A=84SenseVoiceSmall=E6=A8=A1=E5=9E=8B?= =?UTF-8?q?=E5=90=8D=E5=AD=97?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- relay/channel/siliconflow/constant.go | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/relay/channel/siliconflow/constant.go b/relay/channel/siliconflow/constant.go index 819f4aa0..fea6fcd4 100644 --- a/relay/channel/siliconflow/constant.go +++ b/relay/channel/siliconflow/constant.go @@ -40,7 +40,7 @@ var ModelList = []string{ "Pro/meta-llama/Meta-Llama-3-8B-Instruct", "Pro/mistralai/Mistral-7B-Instruct-v0.2", "black-forest-labs/FLUX.1-schnell", - "iic/SenseVoiceSmall", + "FunAudioLLM/SenseVoiceSmall", "netease-youdao/bce-embedding-base_v1", "BAAI/bge-m3", "internlm/internlm2_5-20b-chat", From 34fdac38bf75d9e7fcf43ef3fce764c07e5f8792 Mon Sep 17 00:00:00 2001 From: HynoR <20227709+HynoR@users.noreply.github.com> Date: Sun, 9 Feb 2025 12:35:37 +0800 Subject: [PATCH 2/2] =?UTF-8?q?chore:=20=E5=90=8C=E6=AD=A5deepseek?= =?UTF-8?q?=E4=BB=B7=E6=A0=BC?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- common/model-ratio.go | 13 ++++++------- 1 file changed, 6 insertions(+), 7 deletions(-) diff --git a/common/model-ratio.go b/common/model-ratio.go index e3482ba1..bb94ad36 100644 --- a/common/model-ratio.go +++ b/common/model-ratio.go @@ -191,8 +191,9 @@ var defaultModelRatio = map[string]float64{ "command-r-plus": 1.5, "command-r-08-2024": 0.075, "command-r-plus-08-2024": 1.25, - "deepseek-chat": 0.07, - "deepseek-coder": 0.07, + "deepseek-chat": 0.27 / 2, + "deepseek-coder": 0.27 / 2, + "deepseek-reasoner": 0.55 / 2, // 0.55 / 1k tokens // Perplexity online 模型对搜索额外收费,有需要应自行调整,此处不计入搜索费用 "llama-3-sonar-small-32k-chat": 0.2 / 1000 * USD, "llama-3-sonar-small-32k-online": 0.2 / 1000 * USD, @@ -418,11 +419,9 @@ func GetCompletionRatio(name string) float64 { return 4 } } - if strings.HasPrefix(lowercaseName, "deepseek") { - if strings.HasSuffix(lowercaseName, "reasoner") || strings.HasSuffix(lowercaseName, "r1") { - return 4 - } - return 2 + // hint 只给官方上4倍率,由于开源模型供应商自行定价,不对其进行补全倍率进行强制对齐 + if lowercaseName == "deepseek-chat" || lowercaseName == "deepseek-reasoner" { + return 4 } if strings.HasPrefix(name, "ERNIE-Speed-") { return 2