@@ -19,59 +19,73 @@ models:
1919 base_url : https://dashscope.aliyuncs.com/compatible-mode/v1
2020 model : deepseek-r1
2121
22- qwen2.5-0.5b :
22+ qwen2.5-0.5B-p256-ax630c :
2323 type : tcp_client
24- host : " 192.168.20.65 "
24+ host : " 192.168.20.56 "
2525 port : 10001
26- model_name : " qwen2.5-0.5B-prefill-20e "
26+ model_name : " qwen2.5-0.5B-p256-ax630c "
2727 object : " llm.setup"
2828 pool_size : 2
2929 max_context_length : 128
3030 response_format : " llm.utf-8.stream"
3131 input : " llm.utf-8"
32- memory_required : 716800
32+ memory_required : 560460
3333 system_prompt : |
3434 You are a helpful assistant.
3535
36- Qwen2.5-0.5B-w8a16 :
36+ qwen2.5-1.5B-p256-ax630c :
3737 type : tcp_client
38- host : " 192.168.20.65 "
38+ host : " 192.168.20.56 "
3939 port : 10001
40- model_name : " Qwen2.5-0.5B-w8a16 "
40+ model_name : " qwen2.5-1.5B-p256-ax630c "
4141 object : " llm.setup"
42- pool_size : 2
43- max_context_length : 1024
42+ pool_size : 1
43+ max_context_length : 128
4444 response_format : " llm.utf-8.stream"
4545 input : " llm.utf-8"
46- memory_required : 716800
46+ memory_required : 1686216
4747 system_prompt : |
4848 You are a helpful assistant.
4949
50- deepseek-r1-distill-qwen-1.5b :
50+ deepseek-r1-1.5B-p256-ax630c :
5151 type : tcp_client
52- host : " 192.168.20.65 "
52+ host : " 192.168.20.56 "
5353 port : 10001
54- model_name : " deepseek-r1-1.5B-ax630c"
54+ model_name : " deepseek-r1-1.5B-p256-ax630c"
5555 object : " llm.setup"
5656 pool_size : 1
57- max_context_length : 1024
57+ max_context_length : 128
58+ response_format : " llm.utf-8.stream"
59+ input : " llm.utf-8"
60+ memory_required : 1686552
61+ system_prompt : |
62+ You are a helpful assistant.
63+
64+ llama3.2-1B-p256-ax630c :
65+ type : tcp_client
66+ host : " 192.168.20.56"
67+ port : 10001
68+ model_name : " llama3.2-1B-p256-ax630c"
69+ object : " llm.setup"
70+ pool_size : 2
71+ max_context_length : 128
5872 response_format : " llm.utf-8.stream"
5973 input : " llm.utf-8"
60- memory_required : 2097152
74+ memory_required : 1336288
6175 system_prompt : |
6276 You are a helpful assistant.
6377
6478 internvl2.5-1B-ax630c :
6579 type : tcp_client
66- host : " 192.168.20.65 "
80+ host : " 192.168.20.56 "
6781 port : 10001
6882 model_name : " internvl2.5-1B-ax630c"
6983 object : " vlm.setup"
7084 pool_size : 2
7185 max_context_length : 256
7286 response_format : " vlm.utf-8.stream"
7387 input : " vlm.utf-8"
74- memory_required : 1048576
88+ memory_required : 905356
7589 system_prompt : |
7690 You are a helpful assistant.
7791
@@ -85,21 +99,21 @@ models:
8599
86100 melotts :
87101 type : tts
88- host : " 192.168.20.65 "
102+ host : " 192.168.20.56 "
89103 port : 10001
90104 model_name : " melotts_zh-cn"
91105 object : " melotts.setup"
92106 response_format : " wav.base64"
93- memory_required : 51200
107+ memory_required : 59764
94108 input : " tts.utf-8"
95109
96- whisper-1 :
110+ whisper-tiny :
97111 type : asr
98- host : " 192.168.20.65 "
112+ host : " 192.168.20.56 "
99113 port : 10001
100114 model_name : " whisper-tiny"
101115 object : " whisper.setup"
102116 response_format : " asr.utf-8"
103- input : " whisper-tiny "
104- memory_required : 20480
105- language : " en "
117+ memory_required : 289132
118+ language : " en "
119+ input : " pcm.base64 "
0 commit comments