-
Notifications
You must be signed in to change notification settings - Fork 27
/
Copy pathmain.py
326 lines (287 loc) · 15 KB
/
main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
# encoding:utf-8
import json
import os,re
import time
from bot import bot_factory
from bridge.bridge import Bridge
from bridge.context import ContextType
from bridge.reply import Reply, ReplyType
from channel.chat_channel import check_contain, check_prefix
from channel.chat_message import ChatMessage
from config import conf
import plugins
from plugins import *
from common.log import logger
from common import const
import sqlite3
from chatgpt_tool_hub.chains.llm import LLMChain
from chatgpt_tool_hub.models import build_model_params
from chatgpt_tool_hub.models.model_factory import ModelFactory
from chatgpt_tool_hub.prompts import PromptTemplate
# Prompt template used to have the LLM turn a free-form user request into a
# JSON command ("summary" with optional "duration_in_seconds"/"count" args,
# or "do_nothing"). It is passed to PromptTemplate with "input" as its only
# input variable, so `{input}` is the single placeholder.
# NOTE(review): the doubled braces `{{ }}` are presumably escapes that render
# as literal braces when the template is formatted -- confirm against the
# PromptTemplate implementation.
TRANSLATE_PROMPT = '''
You are now the following python function:
```# {{translate text to commands}}"
def translate_text(text: str) -> str:
```
Only respond with your `return` value, Don't reply anything else.
Commands:
{{Summary chat logs}}: "summary", args: {{("duration_in_seconds"): <integer>, ("count"): <integer>}}
{{Do Nothing}}:"do_nothing", args: {{}}
argument in brackets means optional argument.
You should only respond in JSON format as described below.
Response Format:
{{
"name": "command name",
"args": {{"arg name": "value"}}
}}
Ensure the response can be parsed by Python json.loads.
Input: {input}
'''
def find_json(json_string):
    """Extract a JSON object embedded in free-form text.

    The text is scanned for each ``{`` in turn and the first substring that
    decodes as valid JSON is returned. This keeps stray braces elsewhere in
    the text (for example in chatter around the model's answer) from
    corrupting the result.

    If no position decodes as JSON, the function falls back to the greedy
    span from the first ``{`` to the last ``}``, so callers that run
    ``json.loads`` on the result still see a parse error for malformed input.

    Args:
        json_string: Arbitrary text that may contain a JSON object.

    Returns:
        The extracted substring, or ``""`` when the text has no ``{...}``
        span at all.
    """
    decoder = json.JSONDecoder()
    start = json_string.find("{")
    while start != -1:
        try:
            # raw_decode tolerates trailing text and reports where the
            # decoded document ends.
            _, end = decoder.raw_decode(json_string, start)
        except ValueError:
            start = json_string.find("{", start + 1)
        else:
            return json_string[start:end]

    # Nothing decoded cleanly: keep the legacy greedy behaviour.
    greedy_match = re.search(r"\{[\s\S]*\}", json_string)
    return greedy_match.group(0) if greedy_match else ""
@plugins.register(name="summary", desire_priority=-1, desc="A simple plugin to summary messages", version="0.3.2", author="lanvent")
class Summary(Plugin):
    """Plugin that records chat messages in SQLite and summarizes them on demand.

    Every received message is stored in the ``chat_records`` table of a
    ``chat.db`` file located next to this module. When a text message starts
    with the plugin trigger prefix and its first word contains "总结", the
    stored records of the current session are summarized through the
    configured chat bot.

    Rows of ``chat_records`` are tuples laid out as
    ``(sessionid, msgid, user, content, type, timestamp, is_triggered)``.
    """

    def __init__(self):
        """Open the database, migrate the schema if needed and register handlers.

        Raises:
            Exception: if the configured chat bot type is not one of the
                supported ones.
        """
        super().__init__()
        curdir = os.path.dirname(__file__)
        db_path = os.path.join(curdir, "chat.db")
        self.conn = sqlite3.connect(db_path, check_same_thread=False)
        c = self.conn.cursor()
        c.execute('''CREATE TABLE IF NOT EXISTS chat_records
                    (sessionid TEXT, msgid INTEGER, user TEXT, content TEXT, type TEXT, timestamp INTEGER, is_triggered INTEGER,
                    PRIMARY KEY (sessionid, msgid))''')

        # The is_triggered column was added later; this is a transitional
        # migration for older databases and is meant to be removed some day.
        c = c.execute("PRAGMA table_info(chat_records);")
        column_exists = False
        for column in c.fetchall():
            logger.debug("[Summary] column: {}" .format(column))
            if column[1] == 'is_triggered':
                column_exists = True
                break
        if not column_exists:
            self.conn.execute("ALTER TABLE chat_records ADD COLUMN is_triggered INTEGER DEFAULT 0;")
            self.conn.execute("UPDATE chat_records SET is_triggered = 0;")

        self.conn.commit()

        btype = Bridge().btype['chat']
        if btype not in [const.OPEN_AI, const.CHATGPT, const.CHATGPTONAZURE, const.LINKAI]:
            # Do not leave the connection open when initialisation is aborted.
            self.conn.close()
            raise Exception("[Summary] init failed, not supported bot type")
        self.bot = bot_factory.create_bot(btype)
        self.handlers[Event.ON_HANDLE_CONTEXT] = self.on_handle_context
        self.handlers[Event.ON_RECEIVE_MESSAGE] = self.on_receive_message
        logger.info("[Summary] inited")

    @staticmethod
    def _session_id_for(msg):
        """Return the key under which the records of ``msg``'s chat are stored."""
        # The itchat channel id is not stable, so on the 'wx' channel the
        # nickname (the group name for group chats) is used as session id.
        if conf().get('channel_type', 'wx') == 'wx' and msg.from_user_nickname is not None:
            return msg.from_user_nickname
        return msg.from_user_id

    def _insert_record(self, session_id, msg_id, user, content, msg_type, timestamp, is_triggered = 0):
        """Insert one message row, replacing any row with the same (session, msg) key."""
        c = self.conn.cursor()
        logger.debug("[Summary] insert record: {} {} {} {} {} {} {}" .format(session_id, msg_id, user, content, msg_type, timestamp, is_triggered))
        c.execute("INSERT OR REPLACE INTO chat_records VALUES (?,?,?,?,?,?,?)", (session_id, msg_id, user, content, msg_type, timestamp, is_triggered))
        self.conn.commit()

    def _get_records(self, session_id, start_timestamp=0, limit=9999):
        """Fetch up to ``limit`` rows of a session newer than ``start_timestamp``.

        Returns:
            A list of row tuples ordered newest first.
        """
        c = self.conn.cursor()
        c.execute("SELECT * FROM chat_records WHERE sessionid=? and timestamp>? ORDER BY timestamp DESC LIMIT ?", (session_id, start_timestamp, limit))
        return c.fetchall()

    def on_receive_message(self, e_context: EventContext):
        """Store the received message, flagging whether it triggers the bot."""
        context = e_context['context']
        cmsg: ChatMessage = context['msg']
        is_group = context.get("isgroup", False)
        session_id = self._session_id_for(cmsg)

        # Prefer the nickname of the sender, fall back to the raw id.
        if is_group:
            username = cmsg.actual_user_nickname
            if username is None:
                username = cmsg.actual_user_id
        else:
            username = cmsg.from_user_nickname
            if username is None:
                username = cmsg.from_user_id

        is_triggered = False
        content = context.content
        if is_group:  # group chat
            # Check the configured prefixes / keywords.
            match_prefix = check_prefix(content, conf().get('group_chat_prefix'))
            match_contain = check_contain(content, conf().get('group_chat_keyword'))
            if match_prefix is not None or match_contain is not None:
                is_triggered = True
            if cmsg.is_at and not conf().get("group_at_off", False):
                is_triggered = True
        else:  # private chat
            match_prefix = check_prefix(content, conf().get('single_chat_prefix',['']))
            if match_prefix is not None:
                is_triggered = True

        self._insert_record(session_id, cmsg.msg_id, username, context.content, str(context.type), cmsg.create_time, int(is_triggered))

    def _translate_text_to_commands(self, text):
        """Ask the LLM to translate ``text`` into a command, returning its raw reply."""
        llm = ModelFactory().create_llm_model(**build_model_params({
            "openai_api_key": conf().get("open_ai_api_key", ""),
            "proxy": conf().get("proxy", ""),
        }))

        prompt = PromptTemplate(
            input_variables=["input"],
            template=TRANSLATE_PROMPT,
        )
        bot = LLMChain(llm=llm, prompt=prompt)
        content = bot.run(text)
        return content

    def _check_tokens(self, records, max_tokens=3600):
        """Build a summarization session for ``records`` if it fits the token budget.

        Args:
            records: Row tuples, newest first (as returned by ``_get_records``).
            max_tokens: Maximum value of ``session.calc_tokens()`` allowed.

        Returns:
            The session holding the prompt and the chat log, or ``None`` when
            ``records`` is empty or the session exceeds ``max_tokens``.
        """
        if not records:
            # Nothing to summarize; also avoids indexing records[0] below.
            return None

        sentences = []
        for record in records[::-1]:  # oldest first, so the log reads chronologically
            username = record[2]
            content = record[3]
            is_triggered = record[6]
            if record[4] in [str(ContextType.IMAGE),str(ContextType.VOICE)]:
                # Image / voice payloads are replaced by a "[type]" placeholder.
                content = f"[{record[4]}]"

            sentence = f'{username}: "{content}"'
            if is_triggered:
                sentence += " <T>"
            sentences.append(sentence)
        query = "".join("\n\n" + sentence for sentence in sentences)

        prompt = "你是一位群聊机器人,需要对聊天记录进行简明扼要的总结,用列表的形式输出。\n聊天记录格式:[x]是emoji表情或者是对图片和声音文件的说明,消息最后出现<T>表示消息触发了群聊机器人的回复,内容通常是提问,若带有特殊符号如#和$则是触发你无法感知的某个插件功能,聊天记录中不包含你对这类消息的回复,可降低这些消息的权重。请不要在回复中包含聊天记录格式中出现的符号。\n"

        firstmsg_id = records[0][1]
        session = self.bot.sessions.build_session(firstmsg_id, prompt)

        session.add_query("需要你总结的聊天记录如下:%s"%query)
        if session.calc_tokens() > max_tokens:
            return None
        return session

    def _largest_fitting_prefix(self, records, max_tokens):
        """Find the longest prefix of ``records`` that fits into ``max_tokens``.

        Must only be called when the full list is known not to fit. Assumes
        that adding records never lowers the token count.

        Returns:
            ``(session, size)`` where ``size`` is the number of leading
            records used, or ``(None, 0)`` if not even one record fits.
        """
        # Invariant: records[:fits] is within budget (trivially for 0),
        # records[:too_big] is not.
        fits, too_big = 0, len(records)
        while too_big - fits > 1:
            mid = (fits + too_big) // 2
            logger.debug("[Summary] left: %d, right: %d, mid: %d" % (fits, too_big, mid))
            if self._check_tokens(records[:mid], max_tokens) is None:
                too_big = mid
            else:
                fits = mid
        if fits == 0:
            return None, 0
        # Rebuild the session for the final size instead of reusing a probe
        # result: every probe uses the same first message id, so sessions
        # from earlier probes may be shared with later ones (the session
        # store is not visible from here).
        return self._check_tokens(records[:fits], max_tokens), fits

    def _split_messages_to_summarys(self, records, max_tokens_persession=3600 , max_summarys=8):
        """Summarize ``records`` in chunks that each fit the token budget.

        Chunks are taken from the front of ``records`` (newest messages
        first), so the returned summaries are ordered newest chunk first.

        Args:
            records: Row tuples, newest first.
            max_tokens_persession: Token budget of a single summarization request.
            max_summarys: Maximum number of chunk summaries to produce.

        Returns:
            ``(count, summarys)``: the number of messages covered and the list
            of summary texts. If the very first bot reply reports zero
            completion tokens, ``(0, reply_content)`` is returned instead,
            with the bot's reply text as a ``str``.
        """
        summarys = []
        count = 0
        self.bot.args["max_tokens"] = 400

        while len(records) > 0 and len(summarys) < max_summarys:
            session = self._check_tokens(records, max_tokens_persession)
            if session is None:
                # Too large as a whole: take the biggest prefix that fits.
                session, last = self._largest_fitting_prefix(records, max_tokens_persession)
                logger.debug("[Summary] summary %d messages" % (last))
            else:
                last = len(records)
                logger.debug("[Summary] summary all %d messages" % (len(records)))
            if session is None:
                logger.debug("[Summary] summary failed, session is None")
                break
            logger.debug("[Summary] session query: %s, prompt_tokens: %d" % (session.messages, session.calc_tokens()))
            result = self.bot.reply_text(session)
            total_tokens, completion_tokens, reply_content = result['total_tokens'], result['completion_tokens'], result['content']
            logger.debug("[Summary] total_tokens: %d, completion_tokens: %d, reply_content: %s" % (total_tokens, completion_tokens, reply_content))
            if completion_tokens == 0:
                # Zero completion tokens is treated as a failed request.
                if len(summarys) == 0:
                    return count,reply_content
                break
            summarys.append(reply_content)
            # Advance by exactly the number of records that were summarized.
            records = records[last:]
            count += last
        return count,summarys

    def on_handle_context(self, e_context: EventContext):
        """Handle the "<prefix>总结" command and reply with a chat summary.

        Non-text messages, empty messages and messages whose first word does
        not start with the trigger prefix or does not contain "总结" are
        ignored (the event is left untouched).
        """
        if e_context['context'].type != ContextType.TEXT:
            return

        content = e_context['context'].content
        logger.debug("[Summary] on_handle_context. content: %s" % content)
        trigger_prefix = conf().get('plugin_trigger_prefix', "$")
        clist = content.split()
        # An empty / whitespace-only message has no first word to inspect.
        if not clist or not clist[0].startswith(trigger_prefix):
            return
        if "总结" not in clist[0]:
            return

        limit = 99
        duration = -1

        # Fast path: exactly "<prefix>总结" optionally followed by a number.
        flag = False
        if clist[0] == trigger_prefix+"总结":
            flag = True
            if len(clist) > 1:
                try:
                    limit = int(clist[1])
                    logger.debug("[Summary] limit: %d" % limit)
                except ValueError:
                    flag = False

        if not flag:
            # Anything else is handed to the LLM to be parsed into a command.
            text = content.split(trigger_prefix,maxsplit=1)[1]
            try:
                command_json = find_json(self._translate_text_to_commands(text))
                command = json.loads(command_json)
                name = command["name"]
                if name.lower() == "summary":
                    limit = int(command["args"].get("count", 99))
                    if limit < 0:
                        limit = 299
                    duration = int(command["args"].get("duration_in_seconds", -1))
                    logger.debug("[Summary] limit: %d, duration: %d seconds" % (limit, duration))
            except Exception as e:
                logger.error("[Summary] translate failed: %s" % e)
                return

        # A positive duration restricts the time window; otherwise no lower bound.
        if duration > 0:
            start_time = int(time.time()) - duration
        else:
            start_time = 0

        msg: ChatMessage = e_context['context']['msg']
        session_id = self._session_id_for(msg)
        records = self._get_records(session_id, start_time, limit)
        for i, row in enumerate(records):
            record = list(row)
            # If the content contains a "- - - - - - - - -" separator line,
            # keep only the part after the first separator. Non-text content
            # is left untouched.
            if isinstance(record[3], str):
                parts = re.split(r'\n- - - - - - - - -.*?\n', record[3])
                if len(parts) > 1:
                    record[3] = parts[1]
            records[i] = tuple(record)

        if len(records) <= 1:
            reply = Reply(ReplyType.INFO, "无聊天记录可供总结")
            e_context['reply'] = reply
            e_context.action = EventAction.BREAK_PASS
            return

        max_tokens_persession = 3600

        count, summarys = self._split_messages_to_summarys(records, max_tokens_persession)
        if count == 0 :
            # A str result carries the bot's own reply text for the failed request.
            if isinstance(summarys,str):
                reply = Reply(ReplyType.ERROR, summarys)
            else:
                reply = Reply(ReplyType.ERROR, "总结聊天记录失败")
            e_context['reply'] = reply
            e_context.action = EventAction.BREAK_PASS
            return

        if len(summarys) == 1:
            reply = Reply(ReplyType.TEXT, f"本次总结了{count}条消息。\n\n"+summarys[0])
            e_context['reply'] = reply
            e_context.action = EventAction.BREAK_PASS
            return

        # Several chunk summaries: merge them with one more request.
        self.bot.args["max_tokens"] = None
        # Chunks were produced newest first; reverse them into chronological order.
        query = "".join(summary + "\n----------------\n\n" for summary in reversed(summarys))
        prompt = "你是一位群聊机器人,聊天记录已经在你的大脑中被你总结成多段摘要总结,你需要对它们进行摘要总结,最后输出一篇完整的摘要总结,用列表的形式输出。\n"

        session = self.bot.sessions.build_session(session_id, prompt)
        session.add_query(query)
        result = self.bot.reply_text(session)
        total_tokens, completion_tokens, reply_content = result['total_tokens'], result['completion_tokens'], result['content']
        logger.debug("[Summary] total_tokens: %d, completion_tokens: %d, reply_content: %s" % (total_tokens, completion_tokens, reply_content))
        if completion_tokens == 0:
            reply = Reply(ReplyType.ERROR, "合并摘要失败,"+reply_content+"\n原始多段摘要如下:\n"+query)
        else:
            reply = Reply(ReplyType.TEXT, f"本次总结了{count}条消息。\n\n"+reply_content)
        e_context['reply'] = reply
        e_context.action = EventAction.BREAK_PASS  # end the event and skip the default context handling

    def get_help_text(self, verbose = False, **kwargs):
        """Return the plugin help text; usage examples are added when ``verbose``."""
        help_text = "聊天记录总结插件。\n"
        if not verbose:
            return help_text
        trigger_prefix = conf().get('plugin_trigger_prefix', "$")
        help_text += f"使用方法:输入\"{trigger_prefix}总结 最近消息数量\",我会帮助你总结聊天记录。\n例如:\"{trigger_prefix}总结 100\",我会总结最近100条消息。\n\n你也可以直接输入\"{trigger_prefix}总结前99条信息\"或\"{trigger_prefix}总结3小时内的最近10条消息\"\n我会尽可能理解你的指令。"
        return help_text