forked from LAION-AI/Open-Assistant
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathuser_chat_repository.py
326 lines (290 loc) · 13.6 KB
/
user_chat_repository.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
import fastapi
import pydantic
import sqlalchemy.orm
import sqlmodel
from loguru import logger
from oasst_inference_server import database, models
from oasst_inference_server.settings import settings
from oasst_shared.schemas import inference
class UserChatRepository(pydantic.BaseModel):
    """Wrapper around a database session providing user-specific functionality relating to chats.

    Each method either filters its queries by ``user_id`` or verifies that the
    chat it touches belongs to ``user_id`` before modifying anything.
    """

    session: database.AsyncSession
    user_id: str = pydantic.Field(..., min_length=1)

    class Config:
        # The session is not a pydantic-native type, so validation must allow it.
        arbitrary_types_allowed = True

    async def _get_own_message(self, message_id: str, role: str | None = None) -> models.DbMessage:
        """Load a message together with its chat and check that the chat is owned by this user.

        Args:
            message_id: Id of the message to load.
            role: When given, the message must also have this role.

        Returns:
            The message, with its ``chat`` relationship eagerly loaded.

        Raises:
            fastapi.HTTPException: 400 if the message's chat belongs to another user.

        The lookup uses ``.one()``, so a missing message propagates the error
        raised by the result object (SQLAlchemy's ``NoResultFound``).
        """
        query = (
            sqlmodel.select(models.DbMessage)
            .options(sqlalchemy.orm.selectinload(models.DbMessage.chat))
            .where(models.DbMessage.id == message_id)
        )
        if role is not None:
            query = query.where(models.DbMessage.role == role)

        message: models.DbMessage = (await self.session.exec(query)).one()
        if message.chat.user_id != self.user_id:
            raise fastapi.HTTPException(status_code=400, detail="Message not found")
        return message

    async def _load_message_with_thread(self, message_id: str) -> models.DbMessage:
        """Re-read a message with its chat, the chat's messages and their reports eagerly loaded."""
        query = (
            sqlmodel.select(models.DbMessage)
            .options(
                sqlalchemy.orm.selectinload(models.DbMessage.chat)
                .selectinload(models.DbChat.messages)
                .selectinload(models.DbMessage.reports),
            )
            .where(models.DbMessage.id == message_id)
        )
        return (await self.session.exec(query)).one()

    async def get_chats(
        self,
        include_hidden: bool = False,
        limit: int | None = None,
        before: str | None = None,
        after: str | None = None,
    ) -> list[models.DbChat]:
        """Return this user's chats, optionally filtered and paginated by chat id.

        Args:
            include_hidden: When false, only chats whose ``hidden`` flag is false are returned.
            limit: Maximum number of chats to return; ``None`` applies no limit.
            before: Only return chats whose id is greater than this value. When set,
                results are ordered by ascending ``created_at`` instead of descending.
            after: Only return chats whose id is less than this value.

        Raises:
            fastapi.HTTPException: 400 if both ``before`` and ``after`` are given.
        """
        if after is not None and before is not None:
            raise fastapi.HTTPException(status_code=400, detail="Cannot specify both after and before.")

        query = sqlmodel.select(models.DbChat).where(models.DbChat.user_id == self.user_id)
        if not include_hidden:
            query = query.where(models.DbChat.hidden.is_(False))
        if before is not None:
            query = query.where(models.DbChat.id > before)
        if after is not None:
            query = query.where(models.DbChat.id < after)

        ordering = models.DbChat.created_at.desc() if before is None else models.DbChat.created_at
        query = query.order_by(ordering)
        if limit is not None:
            query = query.limit(limit)

        return (await self.session.exec(query)).all()

    async def get_chat_by_id(self, chat_id: str, include_messages: bool = True) -> models.DbChat:
        """Return one of this user's chats by id.

        Args:
            chat_id: Id of the chat to load.
            include_messages: When true, the chat's messages and each message's
                reports are eagerly loaded.

        Raises:
            fastapi.HTTPException: 404 if this user has no chat with that id.
        """
        query = sqlmodel.select(models.DbChat).where(
            models.DbChat.id == chat_id,
            models.DbChat.user_id == self.user_id,
        )
        if include_messages:
            query = query.options(
                sqlalchemy.orm.selectinload(models.DbChat.messages).selectinload(models.DbMessage.reports),
            )

        chat = (await self.session.exec(query)).one_or_none()
        if chat is None:
            raise fastapi.HTTPException(status_code=404, detail="Chat not found")
        return chat

    async def get_message_by_id(self, chat_id: str, message_id: str) -> models.DbMessage:
        """Return a message of the given chat, with its reports eagerly loaded.

        The query joins the chat table and filters on this user's id. It uses
        ``.one()``, so a missing message propagates the result object's error
        instead of an HTTP error.
        """
        query = (
            sqlmodel.select(models.DbMessage)
            .where(
                models.DbMessage.id == message_id,
                models.DbMessage.chat_id == chat_id,
            )
            .options(
                sqlalchemy.orm.selectinload(models.DbMessage.reports),
            )
            .join(models.DbChat)
            .where(
                models.DbChat.user_id == self.user_id,
            )
        )
        return (await self.session.exec(query)).one()

    async def create_chat(self) -> models.DbChat:
        """Create and commit a new, empty chat for this user.

        Raises:
            fastapi.HTTPException: 404 if no user row exists for ``user_id``.
        """
        # Try to find the user first
        user: models.DbUser | None = (
            await self.session.exec(sqlmodel.select(models.DbUser).where(models.DbUser.id == self.user_id))
        ).one_or_none()
        if not user:
            raise fastapi.HTTPException(status_code=404, detail="User not found")

        chat = models.DbChat(user_id=self.user_id)
        self.session.add(chat)
        await self.session.commit()
        return chat

    async def delete_chat(self, chat_id: str) -> None:
        """Delete one of this user's chats together with its messages, reports and evaluations.

        Raises:
            fastapi.HTTPException: 404 (from ``get_chat_by_id``) if this user has no such chat.
        """
        # get_chat_by_id raises 404 for a missing or foreign chat, so the chat is always set here.
        chat = await self.get_chat_by_id(chat_id)
        logger.debug(f"Deleting {chat_id=}")
        message_ids = [message.id for message in chat.messages]

        # Rows that reference messages are removed before the messages, and the
        # messages before the chat (presumably to satisfy foreign keys).
        # delete reports associated with messages
        await self.session.exec(sqlmodel.delete(models.DbReport).where(models.DbReport.message_id.in_(message_ids)))
        # delete message evaluations associated with message
        await self.session.exec(
            sqlmodel.delete(models.DbMessageEval).where(models.DbMessageEval.selected_message_id.in_(message_ids))
        )
        # delete messages
        await self.session.exec(sqlmodel.delete(models.DbMessage).where(models.DbMessage.chat_id == chat_id))
        # delete chat
        await self.session.exec(
            sqlmodel.delete(models.DbChat).where(
                models.DbChat.id == chat_id,
                models.DbChat.user_id == self.user_id,
            )
        )
        await self.session.commit()

    async def add_prompter_message(self, chat_id: str, parent_id: str | None, content: str) -> models.DbMessage:
        """Append a prompter message to one of this user's chats.

        Args:
            chat_id: Chat to add the message to.
            parent_id: Id of the assistant message being replied to, or ``None``
                for the first message of an empty chat.
            content: Message text. It becomes the chat title when the chat has
                none and this is the first message.

        Returns:
            The stored message, re-read with its chat, the chat's messages and
            their reports eagerly loaded.

        Raises:
            fastapi.HTTPException: 413 if ``content`` exceeds
                ``settings.message_max_length`` or the chat already holds
                ``settings.chat_max_messages`` messages; 400 if ``parent_id`` is
                ``None`` for a non-empty chat, or the parent is unknown, is not
                an assistant message, or is not complete.
        """
        logger.info(f"Adding prompter message {len(content)=} to chat {chat_id}")

        if settings.message_max_length is not None and len(content) > settings.message_max_length:
            raise fastapi.HTTPException(status_code=413, detail="Message content exceeds max length")

        chat: models.DbChat = (
            await self.session.exec(
                sqlmodel.select(models.DbChat)
                .options(sqlalchemy.orm.selectinload(models.DbChat.messages))
                .where(
                    models.DbChat.id == chat_id,
                    models.DbChat.user_id == self.user_id,
                )
            )
        ).one()

        if settings.chat_max_messages is not None and len(chat.messages) >= settings.chat_max_messages:
            raise fastapi.HTTPException(status_code=413, detail="Maximum number of messages reached for this chat")

        if parent_id is None:
            if chat.messages:
                raise fastapi.HTTPException(status_code=400, detail="Trying to add first message to non-empty chat")
            if chat.title is None:
                chat.title = content
        else:
            msg_dict = chat.get_msg_dict()
            if parent_id not in msg_dict:
                raise fastapi.HTTPException(status_code=400, detail="Parent message not found")
            parent = msg_dict[parent_id]
            if parent.role != "assistant":
                raise fastapi.HTTPException(status_code=400, detail="Parent message is not an assistant message")
            if parent.state != inference.MessageState.complete:
                raise fastapi.HTTPException(status_code=400, detail="Parent message is not complete")

        message = models.DbMessage(role="prompter", chat_id=chat_id, chat=chat, parent_id=parent_id, content=content)
        self.session.add(message)
        chat.modified_at = message.created_at
        await self.session.commit()
        logger.debug(f"Added prompter message {len(content)=} to chat {chat_id}")

        return await self._load_message_with_thread(message.id)

    async def initiate_assistant_message(
        self, parent_id: str, work_parameters: inference.WorkParameters, worker_compat_hash: str
    ) -> models.DbMessage:
        """Create a pending assistant message as a reply to a prompter message.

        Before creating it, every other pending assistant message of this user
        (any chat, different parent) is marked as cancelled.

        Args:
            parent_id: Id of the prompter message being answered.
            work_parameters: Stored on the new message.
            worker_compat_hash: Stored on the new message.

        Returns:
            The new pending message, re-read with its chat, the chat's messages
            and their reports eagerly loaded.

        Raises:
            fastapi.HTTPException: 400 if the parent's chat belongs to another
                user; 413 if the chat already holds
                ``settings.chat_max_messages`` messages.
        """
        logger.info(f"Adding stub assistant message to {parent_id=}")

        # find and cancel all pending messages by this user
        pending_msg_query = (
            sqlmodel.select(models.DbMessage)
            .where(
                models.DbMessage.role == "assistant",
                models.DbMessage.state == inference.MessageState.pending,
                models.DbMessage.parent_id != parent_id,  # Prevent draft messages from cancelling each other
            )
            .join(models.DbChat)
            .where(
                models.DbChat.user_id == self.user_id,
            )
        )
        pending_msgs: list[models.DbMessage] = (await self.session.exec(pending_msg_query)).all()
        for pending_msg in pending_msgs:
            logger.warning(
                f"User {self.user_id} has a pending message {pending_msg.id} in chat {pending_msg.chat_id}. Cancelling..."
            )
            pending_msg.state = inference.MessageState.cancelled
        if pending_msgs:
            # One commit covers all cancellations instead of one round-trip per message.
            await self.session.commit()
            for pending_msg in pending_msgs:
                logger.debug(f"Cancelled message {pending_msg.id} in chat {pending_msg.chat_id}.")

        parent = await self._get_own_message(parent_id, role="prompter")

        if settings.chat_max_messages is not None:
            count_query = sqlmodel.select(sqlmodel.func.count(models.DbMessage.id)).where(
                models.DbMessage.chat_id == parent.chat.id
            )
            num_msgs: int = (await self.session.exec(count_query)).one()
            if num_msgs >= settings.chat_max_messages:
                raise fastapi.HTTPException(status_code=413, detail="Maximum number of messages reached for this chat")

        message = models.DbMessage(
            role="assistant",
            chat_id=parent.chat_id,
            chat=parent.chat,
            parent_id=parent_id,
            state=inference.MessageState.pending,
            work_parameters=work_parameters,
            worker_compat_hash=worker_compat_hash,
        )
        self.session.add(message)
        await self.session.commit()
        logger.debug(f"Initiated assistant message of {parent_id=}")

        return await self._load_message_with_thread(message.id)

    async def update_score(self, message_id: str, score: int) -> models.DbMessage:
        """Set the score of one of this user's assistant messages.

        Args:
            message_id: Id of the assistant message to score.
            score: New score; must be -1, 0 or 1.

        Raises:
            fastapi.HTTPException: 400 if ``score`` is out of range or the
                message's chat belongs to another user.
        """
        if score < -1 or score > 1:
            raise fastapi.HTTPException(status_code=400, detail="Invalid score")

        logger.info(f"Updating message score to {message_id=}: {score=}")
        message = await self._get_own_message(message_id, role="assistant")
        message.score = score
        await self.session.commit()
        return message

    async def add_message_eval(self, message_id: str, inferior_message_ids: list[str]):
        """Record that a message was selected over the given inferior messages.

        Raises:
            fastapi.HTTPException: 400 if the message's chat belongs to another user.
        """
        logger.info(f"Adding message evaluation to {message_id=}: {inferior_message_ids=}")
        message = await self._get_own_message(message_id)
        message_eval = models.DbMessageEval(
            chat_id=message.chat_id,
            user_id=message.chat.user_id,
            selected_message_id=message.id,
            inferior_message_ids=inferior_message_ids,
        )
        self.session.add(message_eval)
        await self.session.commit()

    async def add_report(self, message_id: str, reason: str, report_type: inference.ReportType) -> models.DbReport:
        """Attach a report to one of this user's assistant messages and return it.

        Raises:
            fastapi.HTTPException: 400 if the message's chat belongs to another user.
        """
        logger.info(f"Adding report to {message_id=}: {reason=}")
        message = await self._get_own_message(message_id, role="assistant")
        report = models.DbReport(message_id=message.id, reason=reason, report_type=report_type)
        self.session.add(report)
        await self.session.commit()
        await self.session.refresh(report)
        return report

    async def update_chat(
        self,
        chat_id: str,
        title: str | None = None,
        hidden: bool | None = None,
        allow_data_use: bool | None = None,
        active_thread_tail_message_id: str | None = None,
    ) -> None:
        """Update selected attributes of one of this user's chats.

        Only arguments that are not ``None`` are written; the change is then committed.

        Raises:
            fastapi.HTTPException: 404 (from ``get_chat_by_id``) if this user has no such chat.
        """
        logger.info(f"Updating chat {chat_id=}: {title=} {hidden=} {active_thread_tail_message_id=}")
        chat = await self.get_chat_by_id(chat_id=chat_id, include_messages=False)

        if title is not None:
            logger.info(f"Updating title of chat {chat_id=}: {title=}")
            chat.title = title

        if hidden is not None:
            logger.info(f"Setting chat {chat_id=} to {'hidden' if hidden else 'visible'}")
            chat.hidden = hidden

        if allow_data_use is not None:
            logger.info(f"Updating allow_data_use of chat {chat_id=}: {allow_data_use=}")
            chat.allow_data_use = allow_data_use

        if active_thread_tail_message_id is not None:
            logger.info(f"Updating active_thread_tail_message_id of chat {chat_id=}: {active_thread_tail_message_id=}")
            chat.active_thread_tail_message_id = active_thread_tail_message_id

        await self.session.commit()