# hf_streamer.py
# Forked from LAION-AI/Open-Assistant.
import typing
import transformers
from loguru import logger
class Printer(typing.Protocol):
    """Structural type for a callback that receives one token id at a time.

    Any callable that accepts a single ``int`` and returns ``None`` satisfies
    this protocol; ``HFStreamer`` calls it with each token id it forwards.
    """

    def __call__(self, value: int) -> None:
        """Handle a single token id."""
        ...
def _unpack(value):
    """Convert a tensor-like batch of at most one sequence into a list of ids.

    Args:
        value: Object exposing ``shape``, integer indexing, ``cpu()`` and
            ``tolist()`` (presumably a ``torch.Tensor`` of token ids --
            confirm against callers).

    Returns:
        A list with the elements of ``value``. When ``value`` has more than
        one dimension, only its first row is used.

    Raises:
        ValueError: If ``value`` has more than one dimension and its leading
            dimension is larger than 1.
    """
    if len(value.shape) > 1:
        if value.shape[0] > 1:
            raise ValueError("HFStreamer only supports batch size 1")
        # Drop the leading (batch) dimension.
        value = value[0]
    token_ids = value.cpu().tolist()
    # ``tolist()`` on a 0-d value yields a bare scalar; wrap it so callers
    # can always iterate over the result.
    if not isinstance(token_ids, list):
        token_ids = [token_ids]
    return token_ids
# based on HF text streamer
class HFStreamer(transformers.generation.streamers.BaseStreamer):
    """Streamer that forwards token ids to a callback after skipping the prompt.

    The prompt ids given at construction are consumed one by one as token ids
    arrive through ``put``; only token ids that arrive after the prompt has
    been fully consumed are passed to the printer.

    NOTE(review): presumably ``generate()`` replays the prompt through
    ``put`` before emitting new tokens -- confirm against the transformers
    version in use.
    """

    def __init__(self, input_ids, printer: Printer):
        """Store the prompt ids to skip and the callback to feed.

        Args:
            input_ids: Prompt token ids; converted with ``_unpack``, which
                raises ``ValueError`` for a batch larger than one.
            printer: Callback invoked with each token id that is not consumed
                as part of the prompt.
        """
        # Kept reversed so that ``pop()`` returns the ids in original order.
        self.input_ids = _unpack(input_ids)[::-1]
        self.printer = printer

    def put(self, value):
        """Consume incoming token ids, forwarding those that follow the prompt.

        Args:
            value: Tensor-like token ids; converted with ``_unpack``.
        """
        for token_id in _unpack(value):
            if self.input_ids:
                # Still inside the prompt: consume the expected id and only
                # report a discrepancy; the token is not forwarded.
                input_id = self.input_ids.pop()
                if input_id != token_id:
                    logger.warning(f"Input id {input_id} does not match output id {token_id}")
            else:
                self.printer(token_id)

    def end(self):
        """Do nothing; no state is buffered between ``put`` calls."""
        pass