Skip to content

Commit b12b845

Browse files
author
LittleMouse
committed
[chore] Update model memory usage statistics
1 parent c9304f1 commit b12b845

File tree

1 file changed

+38
-24
lines changed

1 file changed

+38
-24
lines changed

config/config.yaml

Lines changed: 38 additions & 24 deletions
Original file line number | Diff line number | Diff line change
@@ -19,59 +19,73 @@ models:
1919
base_url: https://dashscope.aliyuncs.com/compatible-mode/v1
2020
model: deepseek-r1
2121

22-
qwen2.5-0.5b:
22+
qwen2.5-0.5B-p256-ax630c:
2323
type: tcp_client
24-
host: "192.168.20.65"
24+
host: "192.168.20.56"
2525
port: 10001
26-
model_name: "qwen2.5-0.5B-prefill-20e"
26+
model_name: "qwen2.5-0.5B-p256-ax630c"
2727
object: "llm.setup"
2828
pool_size: 2
2929
max_context_length: 128
3030
response_format: "llm.utf-8.stream"
3131
input: "llm.utf-8"
32-
memory_required: 716800
32+
memory_required: 560460
3333
system_prompt: |
3434
You are a helpful assistant.
3535
36-
Qwen2.5-0.5B-w8a16:
36+
qwen2.5-1.5B-p256-ax630c:
3737
type: tcp_client
38-
host: "192.168.20.65"
38+
host: "192.168.20.56"
3939
port: 10001
40-
model_name: "Qwen2.5-0.5B-w8a16"
40+
model_name: "qwen2.5-1.5B-p256-ax630c"
4141
object: "llm.setup"
42-
pool_size: 2
43-
max_context_length: 1024
42+
pool_size: 1
43+
max_context_length: 128
4444
response_format: "llm.utf-8.stream"
4545
input: "llm.utf-8"
46-
memory_required: 716800
46+
memory_required: 1686216
4747
system_prompt: |
4848
You are a helpful assistant.
4949
50-
deepseek-r1-distill-qwen-1.5b:
50+
deepseek-r1-1.5B-p256-ax630c:
5151
type: tcp_client
52-
host: "192.168.20.65"
52+
host: "192.168.20.56"
5353
port: 10001
54-
model_name: "deepseek-r1-1.5B-ax630c"
54+
model_name: "deepseek-r1-1.5B-p256-ax630c"
5555
object: "llm.setup"
5656
pool_size: 1
57-
max_context_length: 1024
57+
max_context_length: 128
58+
response_format: "llm.utf-8.stream"
59+
input: "llm.utf-8"
60+
memory_required: 1686552
61+
system_prompt: |
62+
You are a helpful assistant.
63+
64+
llama3.2-1B-p256-ax630c:
65+
type: tcp_client
66+
host: "192.168.20.56"
67+
port: 10001
68+
model_name: "llama3.2-1B-p256-ax630c"
69+
object: "llm.setup"
70+
pool_size: 2
71+
max_context_length: 128
5872
response_format: "llm.utf-8.stream"
5973
input: "llm.utf-8"
60-
memory_required: 2097152
74+
memory_required: 1336288
6175
system_prompt: |
6276
You are a helpful assistant.
6377
6478
internvl2.5-1B-ax630c:
6579
type: tcp_client
66-
host: "192.168.20.65"
80+
host: "192.168.20.56"
6781
port: 10001
6882
model_name: "internvl2.5-1B-ax630c"
6983
object: "vlm.setup"
7084
pool_size: 2
7185
max_context_length: 256
7286
response_format: "vlm.utf-8.stream"
7387
input: "vlm.utf-8"
74-
memory_required: 1048576
88+
memory_required: 905356
7589
system_prompt: |
7690
You are a helpful assistant.
7791
@@ -85,21 +99,21 @@ models:
8599

86100
melotts:
87101
type: tts
88-
host: "192.168.20.65"
102+
host: "192.168.20.56"
89103
port: 10001
90104
model_name: "melotts_zh-cn"
91105
object: "melotts.setup"
92106
response_format: "wav.base64"
93-
memory_required: 51200
107+
memory_required: 59764
94108
input: "tts.utf-8"
95109

96-
whisper-1:
110+
whisper-tiny:
97111
type: asr
98-
host: "192.168.20.65"
112+
host: "192.168.20.56"
99113
port: 10001
100114
model_name: "whisper-tiny"
101115
object: "whisper.setup"
102116
response_format: "asr.utf-8"
103-
input: "whisper-tiny"
104-
memory_required: 20480
105-
language: "en"
117+
memory_required: 289132
118+
language: "en"
119+
input: "pcm.base64"

0 commit comments

Comments (0)