ali_qwen_bot.py 10.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226
  1. # encoding:utf-8
  2. import json
  3. import time
  4. from typing import List, Tuple
  5. import openai
  6. import openai.error
  7. import broadscope_bailian
  8. from broadscope_bailian import ChatQaMessage
  9. from bot.bot import Bot
  10. from bot.ali.ali_qwen_session import AliQwenSession
  11. from bot.openai.open_ai_image import OpenAIImage
  12. from bot.openai.open_ai_vision import OpenAIVision
  13. from bot.session_manager import SessionManager
  14. from bridge.context import ContextType
  15. from bridge.reply import Reply, ReplyType
  16. from common.log import logger
  17. from common import const
  18. from config import conf, load_config
  19. class AliQwenBot(Bot, OpenAIImage, OpenAIVision):
  20. def __init__(self):
  21. super().__init__()
  22. self.api_key_expired_time = self.set_api_key()
  23. self.sessions = SessionManager(AliQwenSession, model=conf().get("model", const.QWEN))
  24. def api_key_client(self):
  25. return broadscope_bailian.AccessTokenClient(access_key_id=self.access_key_id(), access_key_secret=self.access_key_secret())
  26. def access_key_id(self):
  27. return conf().get("qwen_access_key_id")
  28. def access_key_secret(self):
  29. return conf().get("qwen_access_key_secret")
  30. def agent_key(self):
  31. return conf().get("qwen_agent_key")
  32. def app_id(self):
  33. return conf().get("qwen_app_id")
  34. def node_id(self):
  35. return conf().get("qwen_node_id", "")
  36. def temperature(self):
  37. return conf().get("temperature", 0.2 )
  38. def top_p(self):
  39. return conf().get("top_p", 1)
  40. def reply(self, query, context=None):
  41. # acquire reply content
  42. if context.type == ContextType.TEXT:
  43. logger.info("[QWEN] query={}".format(query))
  44. session_id = context["session_id"]
  45. reply = None
  46. clear_memory_commands = conf().get("clear_memory_commands", ["#清除记忆"])
  47. if query in clear_memory_commands:
  48. self.sessions.clear_session(session_id)
  49. reply = Reply(ReplyType.INFO, "记忆已清除")
  50. elif query == "#清除所有":
  51. self.sessions.clear_all_session()
  52. reply = Reply(ReplyType.INFO, "所有人记忆已清除")
  53. elif query == "#更新配置":
  54. load_config()
  55. reply = Reply(ReplyType.INFO, "配置已更新")
  56. if reply:
  57. return reply
  58. session = self.sessions.session_query(query, session_id)
  59. logger.debug("[QWEN] session query={}".format(session.messages))
  60. reply_content = self.reply_text(session_id, session)
  61. logger.debug(
  62. "[QWEN] new_query={}, session_id={}, reply_cont={}, completion_tokens={}".format(
  63. session.messages,
  64. session_id,
  65. reply_content["content"],
  66. reply_content["completion_tokens"],
  67. )
  68. )
  69. if reply_content["completion_tokens"] == 0 and len(reply_content["content"]) > 0:
  70. reply = Reply(ReplyType.ERROR, reply_content["content"])
  71. elif reply_content["completion_tokens"] > 0:
  72. self.sessions.session_reply(reply_content["content"], session_id, reply_content["total_tokens"])
  73. reply = Reply(ReplyType.TEXT, reply_content["content"])
  74. else:
  75. reply = Reply(ReplyType.ERROR, reply_content["content"])
  76. logger.debug("[QWEN] reply {} used 0 tokens.".format(reply_content))
  77. return reply
  78. elif context.type == ContextType.IMAGE_CREATE and conf().get("text_to_image", False):
  79. ok, retstring = self.create_img(query, 0, context=context)
  80. reply = None
  81. if ok:
  82. reply = Reply(ReplyType.IMAGE_URL, retstring)
  83. else:
  84. reply = Reply(ReplyType.ERROR, retstring)
  85. return reply
  86. else:
  87. reply = Reply(ReplyType.ERROR, "Bot不支持处理{}类型的消息".format(context.type))
  88. return reply
  89. def reply_text(self, session_id: str, session: AliQwenSession, retry_count=0) -> dict:
  90. """
  91. call bailian's ChatCompletion to get the answer
  92. :param session: a conversation session
  93. :param retry_count: retry count
  94. :return: {}
  95. """
  96. try:
  97. res = self.do_vision_completion_if_need(session_id, session.messages[-1]['content'])
  98. if res:
  99. return res
  100. prompt, history = self.convert_messages_format(session.messages)
  101. self.update_api_key_if_expired()
  102. # NOTE 阿里百炼的call()函数未提供temperature参数,考虑到temperature和top_p参数作用相同,取两者较小的值作为top_p参数传入,详情见文档 https://help.aliyun.com/document_detail/2587502.htm
  103. response = broadscope_bailian.Completions().call(app_id=self.app_id(), prompt=prompt, history=history, top_p=min(self.temperature(), self.top_p()))
  104. completion_content = self.get_completion_content(response, self.node_id())
  105. completion_tokens, total_tokens = self.calc_tokens(session.messages, completion_content)
  106. return {
  107. "total_tokens": total_tokens,
  108. "completion_tokens": completion_tokens,
  109. "content": completion_content,
  110. }
  111. except Exception as e:
  112. need_retry = retry_count < 2
  113. result = {"completion_tokens": 0, "content": "我现在有点累了,等会再来吧"}
  114. if isinstance(e, openai.error.RateLimitError):
  115. logger.warn("[QWEN] RateLimitError: {}".format(e))
  116. result["content"] = "提问太快啦,请休息一下再问我吧"
  117. if need_retry:
  118. time.sleep(20)
  119. elif isinstance(e, openai.error.Timeout):
  120. logger.warn("[QWEN] Timeout: {}".format(e))
  121. result["content"] = "我没有收到你的消息"
  122. if need_retry:
  123. time.sleep(5)
  124. elif isinstance(e, openai.error.APIError):
  125. logger.warn("[QWEN] Bad Gateway: {}".format(e))
  126. result["content"] = "请再问我一次"
  127. if need_retry:
  128. time.sleep(10)
  129. elif isinstance(e, openai.error.APIConnectionError):
  130. logger.warn("[QWEN] APIConnectionError: {}".format(e))
  131. need_retry = False
  132. result["content"] = "我连接不到你的网络"
  133. else:
  134. logger.exception("[QWEN] Exception: {}".format(e))
  135. need_retry = False
  136. self.sessions.clear_session(session.session_id)
  137. if need_retry:
  138. logger.warn("[QWEN] 第{}次重试".format(retry_count + 1))
  139. return self.reply_text(session_id, session, retry_count + 1)
  140. else:
  141. return result
  142. def set_api_key(self):
  143. api_key, expired_time = self.api_key_client().create_token(agent_key=self.agent_key())
  144. broadscope_bailian.api_key = api_key
  145. return expired_time
  146. def update_api_key_if_expired(self):
  147. if time.time() > self.api_key_expired_time:
  148. self.api_key_expired_time = self.set_api_key()
  149. def convert_messages_format(self, messages) -> Tuple[str, List[ChatQaMessage]]:
  150. history = []
  151. user_content = ''
  152. assistant_content = ''
  153. system_content = ''
  154. for message in messages:
  155. role = message.get('role')
  156. if role == 'user':
  157. user_content += message.get('content')
  158. elif role == 'assistant':
  159. assistant_content = message.get('content')
  160. history.append(ChatQaMessage(user_content, assistant_content))
  161. user_content = ''
  162. assistant_content = ''
  163. elif role =='system':
  164. system_content += message.get('content')
  165. if user_content == '':
  166. raise Exception('no user message')
  167. if system_content != '':
  168. # NOTE 模拟系统消息,测试发现人格描述以"你需要扮演ChatGPT"开头能够起作用,而以"你是ChatGPT"开头模型会直接否认
  169. system_qa = ChatQaMessage(system_content, '好的,我会严格按照你的设定回答问题')
  170. history.insert(0, system_qa)
  171. logger.debug("[QWEN] converted qa messages: {}".format([item.to_dict() for item in history]))
  172. logger.debug("[QWEN] user content as prompt: {}".format(user_content))
  173. return user_content, history
  174. def get_completion_content(self, response, node_id):
  175. if not response['Success']:
  176. return f"[ERROR]\n{response['Code']}:{response['Message']}"
  177. text = response['Data']['Text']
  178. if node_id == '':
  179. return text
  180. # TODO: 当使用流程编排创建大模型应用时,响应结构如下,最终结果在['finalResult'][node_id]['response']['text']中,暂时先这么写
  181. # {
  182. # 'Success': True,
  183. # 'Code': None,
  184. # 'Message': None,
  185. # 'Data': {
  186. # 'ResponseId': '9822f38dbacf4c9b8daf5ca03a2daf15',
  187. # 'SessionId': 'session_id',
  188. # 'Text': '{"finalResult":{"LLM_T7islK":{"params":{"modelId":"qwen-plus-v1","prompt":"${systemVars.query}${bizVars.Text}"},"response":{"text":"作为一个AI语言模型,我没有年龄,因为我没有生日。\n我只是一个程序,没有生命和身体。"}}}}',
  189. # 'Thoughts': [],
  190. # 'Debug': {},
  191. # 'DocReferences': []
  192. # },
  193. # 'RequestId': '8e11d31551ce4c3f83f49e6e0dd998b0',
  194. # 'Failed': None
  195. # }
  196. text_dict = json.loads(text)
  197. completion_content = text_dict['finalResult'][node_id]['response']['text']
  198. return completion_content
  199. def calc_tokens(self, messages, completion_content):
  200. completion_tokens = len(completion_content)
  201. prompt_tokens = 0
  202. for message in messages:
  203. prompt_tokens += len(message["content"])
  204. return completion_tokens, prompt_tokens + completion_tokens