mirror of
https://github.com/wassname/Open-Assistant.git
synced 2026-07-02 17:00:28 +08:00
a5bc9bf492
* add dupe checks to store_text_reply() & store_text_labels * remove test export file * add user_id to protocol.ConversationMessage * add show_on_leaderboard ot protocol.FrontEndUser
61 lines
1.9 KiB
Python
61 lines
1.9 KiB
Python
import re
|
|
from uuid import UUID
|
|
|
|
from oasst_backend.models import Message
|
|
from oasst_shared.schemas import protocol
|
|
|
|
|
|
def prepare_message(m: Message) -> protocol.Message:
|
|
return protocol.Message(
|
|
id=m.id,
|
|
frontend_message_id=m.frontend_message_id,
|
|
parent_id=m.parent_id,
|
|
user_id=m.user_id,
|
|
text=m.text,
|
|
lang=m.lang,
|
|
is_assistant=(m.role == "assistant"),
|
|
created_date=m.created_date,
|
|
emojis=m.emojis or {},
|
|
user_emojis=m.user_emojis or [],
|
|
review_result=m.review_result,
|
|
review_count=m.review_count,
|
|
)
|
|
|
|
|
|
def prepare_message_list(messages: list[Message]) -> list[protocol.Message]:
|
|
return [prepare_message(m) for m in messages]
|
|
|
|
|
|
def prepare_conversation_message(message: Message) -> protocol.ConversationMessage:
|
|
return protocol.ConversationMessage(
|
|
id=message.id,
|
|
user_id=message.user_id,
|
|
frontend_message_id=message.frontend_message_id,
|
|
text=message.text,
|
|
lang=message.lang,
|
|
is_assistant=(message.role == "assistant"),
|
|
emojis=message.emojis or {},
|
|
user_emojis=message.user_emojis or [],
|
|
)
|
|
|
|
|
|
def prepare_conversation_message_list(messages: list[Message]) -> list[protocol.ConversationMessage]:
|
|
return [prepare_conversation_message(message) for message in messages]
|
|
|
|
|
|
def prepare_conversation(messages: list[Message]) -> protocol.Conversation:
|
|
return protocol.Conversation(messages=prepare_conversation_message_list(messages))
|
|
|
|
|
|
def prepare_tree(tree: list[Message], tree_id: UUID) -> protocol.MessageTree:
|
|
tree_messages = []
|
|
for message in tree:
|
|
tree_messages.append(prepare_message(message))
|
|
|
|
return protocol.MessageTree(id=tree_id, messages=tree_messages)
|
|
|
|
|
|
split_uuid_pattern = re.compile(
|
|
r"^([0-9a-fA-F]{8}-[0-9a-fA-F]{4}-[0-9a-fA-F]{4}-[0-9a-fA-F]{4}-[0-9a-fA-F]{12})\$(.*)$"
|
|
)
|