Skip to content

Commit 409cc7d

Browse files
senseb and crazywoola authored
mark deprecated models in siliconflow #12399 (#12405)
Co-authored-by: crazywoola <[email protected]>
1 parent fe26be2 commit 409cc7d

9 files changed: +64 -10 lines changed

api/core/model_runtime/model_providers/siliconflow/llm/_position.yaml

-3
Original file line numberDiff line numberDiff line change
@@ -1,16 +1,13 @@
1-
- Tencent/Hunyuan-A52B-Instruct
21
- Qwen/QwQ-32B-Preview
32
- Qwen/Qwen2.5-72B-Instruct
43
- Qwen/Qwen2.5-32B-Instruct
54
- Qwen/Qwen2.5-14B-Instruct
65
- Qwen/Qwen2.5-7B-Instruct
76
- Qwen/Qwen2.5-Coder-32B-Instruct
87
- Qwen/Qwen2.5-Coder-7B-Instruct
9-
- Qwen/Qwen2.5-Math-72B-Instruct
108
- Qwen/Qwen2-VL-72B-Instruct
119
- Qwen/Qwen2-1.5B-Instruct
1210
- Pro/Qwen/Qwen2-VL-7B-Instruct
13-
- OpenGVLab/InternVL2-Llama3-76B
1411
- OpenGVLab/InternVL2-26B
1512
- Pro/OpenGVLab/InternVL2-8B
1613
- deepseek-ai/DeepSeek-V2.5

api/core/model_runtime/model_providers/siliconflow/llm/hunyuan-a52b-instruct.yaml

+1
Original file line numberDiff line numberDiff line change
@@ -82,3 +82,4 @@ pricing:
8282
output: '21'
8383
unit: '0.000001'
8484
currency: RMB
85+
deprecated: true

api/core/model_runtime/model_providers/siliconflow/llm/internvl2-llama3-76b.yaml

+1
Original file line numberDiff line numberDiff line change
@@ -82,3 +82,4 @@ pricing:
8282
output: '21'
8383
unit: '0.000001'
8484
currency: RMB
85+
deprecated: true
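
(new file; path not captured in this extract. Adds the model definition for Qwen/QVQ-72B-Preview.)

+54
Original file line numberDiff line numberDiff line change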
@@ -0,0 +1,54 @@
1+
model: Qwen/QVQ-72B-Preview
2+
label:
3+
en_US: Qwen/QVQ-72B-Preview
4+
model_type: llm
5+
features:
6+
- agent-thought
7+
- tool-call
8+
- stream-tool-call
9+
- vision
10+
model_properties:
11+
mode: chat
12+
context_size: 32768
13+
parameter_rules:
14+
- name: temperature
15+
use_template: temperature
16+
- name: max_tokens
17+
use_template: max_tokens
18+
type: int
19+
default: 8192
20+
min: 1
21+
max: 16384
22+
help:
23+
zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
24+
en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
25+
- name: top_p
26+
use_template: top_p
27+
- name: top_k
28+
label:
29+
zh_Hans: 取样数量
30+
en_US: Top k
31+
type: int
32+
help:
33+
zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
34+
en_US: Only sample from the top K options for each subsequent token.
35+
required: false
36+
- name: frequency_penalty
37+
use_template: frequency_penalty
38+
- name: response_format
39+
label:
40+
zh_Hans: 回复格式
41+
en_US: Response Format
42+
type: string
43+
help:
44+
zh_Hans: 指定模型必须输出的格式
45+
en_US: specifying the format that the model must output
46+
required: false
47+
options:
48+
- text
49+
- json_object
50+
pricing:
51+
input: '9.90'
52+
output: '9.90'
53+
unit: '0.000001'
54+
currency: RMB

api/core/model_runtime/model_providers/siliconflow/llm/qwen-qwq-32B-preview.yaml

+2-2
Original file line numberDiff line numberDiff line change
@@ -15,9 +15,9 @@ parameter_rules:
1515
- name: max_tokens
1616
use_template: max_tokens
1717
type: int
18-
default: 512
18+
default: 4096
1919
min: 1
20-
max: 4096
20+
max: 8192
2121
help:
2222
zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
2323
en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.

api/core/model_runtime/model_providers/siliconflow/llm/qwen2-vl-72b-instruct.yaml

+2-2
Original file line numberDiff line numberDiff line change
@@ -78,7 +78,7 @@ parameter_rules:
7878
- text
7979
- json_object
8080
pricing:
81-
input: '21'
82-
output: '21'
81+
input: '4.13'
82+
output: '4.13'
8383
unit: '0.000001'
8484
currency: RMB

api/core/model_runtime/model_providers/siliconflow/llm/qwen2-vl-7b-Instruct.yaml

+2-2
Original file line numberDiff line numberDiff line change
@@ -78,7 +78,7 @@ parameter_rules:
7878
- text
7979
- json_object
8080
pricing:
81-
input: '21'
82-
output: '21'
81+
input: '0.35'
82+
output: '0.35'
8383
unit: '0.000001'
8484
currency: RMB

api/core/model_runtime/model_providers/siliconflow/llm/qwen2.5-math-72b-instruct.yaml

+1
Original file line numberDiff line numberDiff line change
@@ -82,3 +82,4 @@ pricing:
8282
output: '4.13'
8383
unit: '0.000001'
8484
currency: RMB
85+
deprecated: true

docker/docker-compose-template.yaml

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
x-shared-env: &shared-api-worker-env
1+
x-shared-env: &shared-api-worker-env
22
services:
33
# API service
44
api:

0 commit comments

Comments
 (0)