from dataclasses import dataclass

from pandas import Timestamp
from pydantic import BaseModel


@dataclass
class ChatMessage:
    """Record holding the fields of a single chat message.

    Declared as a dataclass so instances can be built positionally or by
    keyword, and compared field by field. Field order is part of the
    positional constructor signature and must not be rearranged.
    """

    id: int
    MsgSvrID: int  # presumably the server-side message id - TODO confirm
    type_name: str  # message type label; presumably matched against skip_type_list - confirm
    is_sender: int  # presumably a 0/1 flag for "sent by the account owner" - TODO confirm
    talker: str
    room_name: str
    msg: str
    src: str
    CreateTime: Timestamp


@dataclass
class CutMessage:
    """Lightweight record with a sender flag, a cut type and a timestamp.

    NOTE(review): presumably a marker inserted where a conversation is cut
    (e.g. at a skipped message) - confirm against the code that creates it.
    """

    is_sender: int  # presumably a 0/1 flag, as on ChatMessage - TODO confirm
    cut_type: str
    CreateTime: Timestamp


@dataclass
class QaPair:
    """Record for one question/answer sample with its context and a score.

    NOTE(review): the field names suggest an instruction-tuning sample
    (system prompt, instruction, output, prior turns) - confirm with the
    code that builds and consumes these records.
    """

    id: int
    system: str
    instruction: str
    output: str
    history: list[list[str]]  # presumably earlier [instruction, output] turns - TODO confirm
    time: Timestamp
    score: int


# Pydantic model carrying an integer id together with an integer score.
# Documented with comments rather than a class docstring on purpose:
# pydantic copies a model's docstring into its generated JSON schema
# ("description"), so adding one would change the schema output.
# NOTE(review): presumably `id` refers to QaPair.id - confirm with callers.
class QaPairScore(BaseModel):
    id: int
    score: int


# Message type names to skip.
# NOTE(review): presumably compared against ChatMessage.type_name while
# filtering messages - confirm against the code that reads this list.
# Kept as a plain list (not a set) so existing list-style usage keeps working.
skip_type_list = [
    "添加好友",
    "推荐公众号",
    "动画表情",
    "位置",
    "文件",
    "位置共享",
    "接龙",
    "引用回复",
    "视频号直播或直播回放",
    "用户上传的GIF表情",
    "文件(猜)",
    "群公告",
    "视频号直播或直播回放等",
    "游戏相关",
    "转账",
    "赠送红包封面",
    "语音通话",
    "企业微信打招呼(猜)",
    "企业微信添加好友(猜)",
    "系统通知",
    "消息撤回1",
    "拍一拍",
    "消息撤回5",
    "消息撤回6",
    "消息撤回33",
    "消息撤回36",
    "消息撤回57",
    "邀请加群",
    "未知-11000,0",
]

# Message types that are not handled yet (starts empty).
unprocessed_type_list = []