Skip to content

Commit aa772c2

Browse files
committed
added typical_p
1 parent b8eb7c9 commit aa772c2

File tree

3 files changed

+3
-3
lines changed

3 files changed

+3
-3
lines changed

inference/text-client/text_client_utils.py

-3
Original file line number | Diff line number | Diff line change
@@ -36,11 +36,8 @@ def send_message(self, message, model_id):
3636
"content": message,
3737
"work_parameters": {
3838
"model_name": model_id,
39-
"top_k": 1024,
4039
"top_p": 0.9,
41-
"temperature": 1.0,
4240
"repetition_penalty": 1.2,
43-
"max_new_tokens": 1024,
4441
},
4542
},
4643
headers=self.auth_headers,

inference/worker/interface.py

+2
Original file line number | Diff line number | Diff line change
@@ -9,6 +9,7 @@ class GenerateStreamParameters(pydantic.BaseModel):
99
do_sample: bool | None
1010
top_k: int | None
1111
top_p: float | None
12+
typical_p: float | None
1213
temperature: float | None
1314
repetition_penalty: float | None
1415
seed: int | None
@@ -26,6 +27,7 @@ def from_work_parameters(params: inference.WorkParameters) -> "GenerateStreamPar
2627
do_sample=params.do_sample,
2728
top_k=params.top_k,
2829
top_p=params.top_p,
30+
typical_p=params.typical_p,
2931
temperature=params.temperature,
3032
repetition_penalty=params.repetition_penalty,
3133
seed=params.seed,

oasst-shared/oasst_shared/schemas/inference.py

+1
Original file line number | Diff line number | Diff line change
@@ -110,6 +110,7 @@ class WorkParametersInput(pydantic.BaseModel):
110110
model_name: str = DEFAULT_MODEL_NAME
111111
top_k: int | None = None
112112
top_p: float | None = None
113+
typical_p: float | None = None
113114
temperature: float | None = None
114115
repetition_penalty: float | None = None
115116
max_new_tokens: int | None = None

0 commit comments

Comments
 (0)