mirror of
https://github.com/wassname/Open-Assistant.git
synced 2026-07-02 17:00:28 +08:00
c2fa476904
* add disposition to text labeling tasks
* add emoji stats to ConversationMessage
* add user emoji augmentation for message queries
* add auth_method,username to message queries (query emoji status)
* add auth_method+username for single message
* fix param name typo
* only join rows when message.emojis != JSON.NULL
* formatting
* make sure emojis and user_emojis default to {}, []
* remove init_user(), use fresh empty default collections
56 lines
1.6 KiB
Python
56 lines
1.6 KiB
Python
import re
|
|
from uuid import UUID
|
|
|
|
from oasst_backend.models import Message
|
|
from oasst_shared.schemas import protocol
|
|
|
|
|
|
def prepare_message(m: Message) -> protocol.Message:
|
|
return protocol.Message(
|
|
id=m.id,
|
|
frontend_message_id=m.frontend_message_id,
|
|
parent_id=m.parent_id,
|
|
text=m.text,
|
|
lang=m.lang,
|
|
is_assistant=(m.role == "assistant"),
|
|
created_date=m.created_date,
|
|
emojis=m.emojis or {},
|
|
user_emojis=m.user_emojis or [],
|
|
)
|
|
|
|
|
|
def prepare_message_list(messages: list[Message]) -> list[protocol.Message]:
|
|
return [prepare_message(m) for m in messages]
|
|
|
|
|
|
def prepare_conversation_message_list(messages: list[Message]) -> list[protocol.ConversationMessage]:
|
|
return [
|
|
protocol.ConversationMessage(
|
|
id=message.id,
|
|
frontend_message_id=message.frontend_message_id,
|
|
text=message.text,
|
|
lang=message.lang,
|
|
is_assistant=(message.role == "assistant"),
|
|
emojis=message.emojis or {},
|
|
user_emojis=message.user_emojis or [],
|
|
)
|
|
for message in messages
|
|
]
|
|
|
|
|
|
def prepare_conversation(messages: list[Message]) -> protocol.Conversation:
|
|
return protocol.Conversation(messages=prepare_conversation_message_list(messages))
|
|
|
|
|
|
def prepare_tree(tree: list[Message], tree_id: UUID) -> protocol.MessageTree:
|
|
tree_messages = []
|
|
for message in tree:
|
|
tree_messages.append(prepare_message(message))
|
|
|
|
return protocol.MessageTree(id=tree_id, messages=tree_messages)
|
|
|
|
|
|
split_uuid_pattern = re.compile(
|
|
r"^([0-9a-fA-F]{8}-[0-9a-fA-F]{4}-[0-9a-fA-F]{4}-[0-9a-fA-F]{4}-[0-9a-fA-F]{12})\$(.*)$"
|
|
)
|