"""WeChat Official Account webhook that relays user messages to an AI model.

The Flask endpoint ``/api/wx`` answers WeChat's signature handshake (GET) and
handles incoming messages (POST).  Because the model call can take longer than
a single webhook round trip, each user message is submitted to a thread pool
and the user polls for the result by sending '查询'.  Long text answers are cut
into parts that the user pages through by sending '继续'; '新对话' resets the
conversation.
"""

import asyncio
import base64
import hashlib
import hmac
import json
import logging
import os
import queue
import random
import re
import secrets
import string
import struct
import threading
import time
import uuid
import xml.etree.ElementTree as ET
from concurrent.futures import ThreadPoolExecutor
from datetime import datetime

import requests
from Crypto.Cipher import AES
from dotenv import load_dotenv
from flask import Flask, request, make_response
from markdown import markdown
from openai import OpenAI

logging.basicConfig(
    level=logging.INFO,
    format='%(asctime)s - %(levelname)s - %(message)s',
    handlers=[
        logging.FileHandler('wechat_service.log'),
        logging.StreamHandler()
    ]
)

load_dotenv()

app = Flask(__name__)

# Configuration
TOKEN = os.getenv('TOKEN')
ENCODING_AES_KEY = os.getenv('ENCODING_AES_KEY')
APPID = os.getenv('APPID')
APPSECRET = os.getenv('APPSECRET')  # AppSecret, used to obtain access tokens
API_KEY = os.getenv("API_KEY")
BASE_URL = os.getenv("OPENAI_BASE_URL")
IMAGE_MODEL_URL = os.getenv("IMAGE_MODEL_URL")
IMAGE_MODEL_KEY = os.getenv("IMAGE_MODEL_KEY")

# Timeouts (seconds) for outbound HTTP calls.  Without them a stalled peer
# would block a worker thread (or the token lock) indefinitely.
HTTP_TIMEOUT = 30
IMAGE_GENERATION_TIMEOUT = 300

# Maximum number of characters sent to the user in one text reply.
MAX_PART_LENGTH = 500

# WeChat error codes after which the upload is retried with a fresh token.
# NOTE(review): 40001 was the only code handled originally; 40014 and 42001
# are taken from WeChat's global return-code table - confirm.
_TOKEN_ERROR_CODES = (40001, 40014, 42001)

_ALPHANUMERIC = string.ascii_letters + string.digits

client = OpenAI(api_key=API_KEY, base_url=BASE_URL)
executor = ThreadPoolExecutor(max_workers=10)

# Define tools for image generation
TOOLS = [
    {
        "type": "function",
        "function": {
            "name": "generate_image",
            "description": "Generate an image based on text description",
            "parameters": {
                "type": "object",
                "properties": {
                    "prompt": {
                        "type": "string",
                        "description": "The description of the image to generate"
                    }
                },
                "required": ["prompt"]
            }
        }
    }
]


class AccessTokenManager:
    """Fetch and cache the WeChat API access token behind a lock."""

    def __init__(self):
        self._access_token = None
        self._expires_at = 0
        self._lock = threading.Lock()

    def get_token(self):
        """Return a cached access token, fetching a new one when needed.

        Raises:
            ValueError: the token endpoint answered without ``access_token``.
            Exception: any error raised by the HTTP request is logged and
                re-raised.
        """
        with self._lock:
            now = time.time()
            # Refresh 5 minutes early so the token is still valid when used.
            if self._access_token and now < (self._expires_at - 300):
                return self._access_token

            try:
                url = "https://api.weixin.qq.com/cgi-bin/token"
                params = {
                    "grant_type": "client_credential",
                    "appid": APPID,
                    "secret": APPSECRET
                }
                logging.info("开始获取新的access_token")
                response = requests.get(url, params=params, timeout=HTTP_TIMEOUT)
                response.raise_for_status()
                result = response.json()

                if "access_token" not in result:
                    error_msg = f"获取access_token失败: {result}"
                    logging.error(error_msg)
                    raise ValueError(error_msg)

                self._access_token = result["access_token"]
                self._expires_at = now + result["expires_in"]
                logging.info("成功获取新的access_token")
                return self._access_token
            except Exception as e:
                error_msg = f"获取access_token时发生错误: {str(e)}"
                logging.error(error_msg)
                raise

    def refresh_token(self):
        """Discard the cached token and return a freshly fetched one."""
        with self._lock:
            self._access_token = None
        # get_token() acquires the same non-reentrant lock, so it must be
        # called only after the lock above has been released.
        return self.get_token()


class WeChatCrypto:
    """AES-CBC encrypt/decrypt helper for WeChat message bodies.

    The plaintext layout handled here is: 16 random bytes, a 4-byte
    big-endian message length, the message, then the app id, padded to a
    multiple of 32 bytes with bytes whose value is the pad length.
    """

    def __init__(self, key, app_id):
        self.key = base64.b64decode(key + '=')
        self.app_id = app_id

    def encrypt(self, text):
        """Return ``text`` encrypted and base64-encoded as a ``str``."""
        random_str = ''.join(secrets.choice(_ALPHANUMERIC) for _ in range(16))
        text_bytes = text.encode('utf-8')
        msg_len = struct.pack('>I', len(text_bytes))
        message = random_str.encode('utf-8') + msg_len + text_bytes + self.app_id.encode('utf-8')

        pad_len = 32 - (len(message) % 32)
        message += bytes([pad_len]) * pad_len

        cipher = AES.new(self.key, AES.MODE_CBC, self.key[:16])
        encrypted = cipher.encrypt(message)
        return base64.b64encode(encrypted).decode('utf-8')

    def decrypt(self, encrypted_text):
        """Return the XML carried in a base64-encoded encrypted message.

        Raises:
            ValueError: the padding is malformed or the trailing app id does
                not match ``self.app_id``.
        """
        encrypted_data = base64.b64decode(encrypted_text)
        cipher = AES.new(self.key, AES.MODE_CBC, self.key[:16])
        decrypted = cipher.decrypt(encrypted_data)

        pad_len = decrypted[-1] if decrypted else 0
        # encrypt() always pads with 1..32 bytes; anything else is corrupt.
        if not 1 <= pad_len <= 32:
            raise ValueError('Invalid padding')

        # Skip the 16 random leading bytes and strip the padding.
        content = decrypted[16:-pad_len]
        msg_len = struct.unpack('>I', content[:4])[0]
        xml_content = content[4:msg_len + 4].decode('utf-8')
        app_id = content[msg_len + 4:].decode('utf-8')

        if app_id != self.app_id:
            raise ValueError('Invalid AppID')
        return xml_content


class AsyncResponse:
    """State of one background AI request."""

    def __init__(self):
        self.status = "processing"
        self.result = None
        self.error = None
        self.create_time = time.time()
        self.timeout = 3600
        self.response_type = "text"  # Can be "text" or "image"
        self.media_id = None  # For image responses

    def is_expired(self):
        """Return True once more than ``timeout`` seconds have passed."""
        return time.time() - self.create_time > self.timeout


class UserSession:
    """Conversation history and pending work for a single user."""

    def __init__(self):
        self.messages = [{"role": "system", "content": "你是HXIAO公众号的智能助手,这一个用来分享与学习人工智能的公众号,我们的目标是专注AI应用的简单研究与实践。致力于分享切实可行的技术方案,希望让复杂的技术变得简单易懂。也喜欢用通俗的语言来解释专业概念,让技术真正服务于每个学习者"}]
        self.pending_parts = []
        self.last_active = time.time()
        self.current_task = None
        self.response_queue = {}
        self.session_timeout = 3600

    def is_expired(self):
        """Return True when the session has been idle past its timeout."""
        return time.time() - self.last_active > self.session_timeout

    def cleanup_expired_tasks(self):
        """Drop expired tasks and clear ``current_task`` if it was one."""
        expired_tasks = [
            task_id for task_id, response in self.response_queue.items()
            if response.is_expired()
        ]
        for task_id in expired_tasks:
            del self.response_queue[task_id]
            if self.current_task == task_id:
                self.current_task = None


class SessionManager:
    """Registry of ``UserSession`` objects keyed by user id."""

    def __init__(self):
        self.sessions = {}
        self._lock = threading.Lock()
        self.crypto = WeChatCrypto(ENCODING_AES_KEY, APPID)

    def get_session(self, user_id):
        """Return the user's session, replacing it if missing or expired.

        A live session has its expired tasks removed; in every case
        ``last_active`` is updated to the current time.
        """
        with self._lock:
            current_time = time.time()
            session = self.sessions.get(user_id)
            if session is None or session.is_expired():
                session = UserSession()
            else:
                session.cleanup_expired_tasks()

            session.last_active = current_time
            self.sessions[user_id] = session
            return session

    def clear_session(self, user_id):
        """Replace an existing session for ``user_id`` with a fresh one."""
        with self._lock:
            if user_id in self.sessions:
                self.sessions[user_id] = UserSession()

    def cleanup_expired_sessions(self):
        """Delete every expired session and log each removal."""
        with self._lock:
            expired_users = [
                user_id for user_id, session in self.sessions.items()
                if session.is_expired()
            ]
            for user_id in expired_users:
                del self.sessions[user_id]
                logging.info(f"已清理过期会话: {user_id}")


def convert_markdown_to_wechat(md_text):
    """Rewrite common Markdown syntax into plain-text markers.

    Falsy input is returned unchanged.
    """
    if not md_text:
        return md_text

    md_text = re.sub(r'^# (.*?)$', r'【标题】\1', md_text, flags=re.MULTILINE)
    md_text = re.sub(r'^## (.*?)$', r'【子标题】\1', md_text, flags=re.MULTILINE)
    md_text = re.sub(r'^### (.*?)$', r'【小标题】\1', md_text, flags=re.MULTILINE)
    md_text = re.sub(r'\*\*(.*?)\*\*', r'『\1』', md_text)
    md_text = re.sub(r'\*(.*?)\*', r'「\1」', md_text)
    # Fenced code blocks must be handled before inline code: the inline rule
    # would otherwise consume the fence's own backticks and the fence rule
    # could never match.
    md_text = re.sub(r'```[\w]*\n(.*?)```', r'【代码开始】\n\1\n【代码结束】', md_text, flags=re.DOTALL)
    md_text = re.sub(r'`(.*?)`', r'「\1」', md_text)
    md_text = re.sub(r'^\- ', '• ', md_text, flags=re.MULTILINE)
    # \d+ so that items numbered 10 and above are converted too.
    md_text = re.sub(r'^\d+\. ', '○ ', md_text, flags=re.MULTILINE)
    md_text = re.sub(r'^> (.*?)$', r'▎\1', md_text, flags=re.MULTILINE)
    md_text = re.sub(r'^-{3,}$', r'—————————', md_text, flags=re.MULTILINE)
    md_text = re.sub(r'\[(.*?)\]\((.*?)\)', r'\1(\2)', md_text)
    md_text = re.sub(r'\n{3,}', '\n\n', md_text)
    return md_text


def _sha1_signature(*parts):
    """Return the SHA-1 hex digest of ``parts`` sorted and concatenated."""
    return hashlib.sha1(''.join(sorted(parts)).encode('utf-8')).hexdigest()


def _signature_matches(expected_parts, signature):
    """Compare ``signature`` with the digest of ``expected_parts``.

    Returns False instead of raising when any value is missing, and compares
    in constant time.
    """
    if not signature or not all(expected_parts):
        return False
    expected = _sha1_signature(*expected_parts)
    return hmac.compare_digest(expected.encode('utf-8'), signature.encode('utf-8'))


def verify_signature(signature, timestamp, nonce, token):
    """Return True when ``signature`` matches token, timestamp and nonce."""
    return _signature_matches([token, timestamp, nonce], signature)


def verify_msg_signature(msg_signature, timestamp, nonce, token, encrypt_msg):
    """Return True when ``msg_signature`` matches the encrypted message."""
    return _signature_matches([token, timestamp, nonce, encrypt_msg], msg_signature)


def _required_text(root, tag):
    """Return the text of child ``tag`` or raise ValueError if it is absent."""
    node = root.find(tag)
    if node is None:
        raise ValueError(f'Missing <{tag}> element in message XML')
    return node.text


def parse_xml_message(xml_content):
    """Parse a message XML document into a dict of its fields.

    ``content`` and ``msg_id`` default to ``''`` when the element is missing
    or empty; the other fields are required.

    Raises:
        ValueError: a required element is missing.
        xml.etree.ElementTree.ParseError: the document is not well-formed.
    """
    # NOTE(review): this parses data received over HTTP with the stdlib
    # ElementTree parser; consider a hardened parser for untrusted XML.
    root = ET.fromstring(xml_content)
    return {
        'content': root.findtext('Content') or '',
        'from_user': _required_text(root, 'FromUserName'),
        'to_user': _required_text(root, 'ToUserName'),
        'msg_id': root.findtext('MsgId') or '',
        'create_time': _required_text(root, 'CreateTime'),
        'msg_type': _required_text(root, 'MsgType')
    }


def _cdata(text):
    """Wrap ``text`` in a CDATA section, splitting any embedded ``]]>``."""
    text = '' if text is None else str(text)
    return '<![CDATA[' + text.replace(']]>', ']]]]><![CDATA[>') + ']]>'


def generate_response_xml(to_user, from_user, content, response_type='text', media_id=None, encrypt_type='aes'):
    """Build the Flask response carrying a reply message.

    Args:
        to_user: recipient id placed in ``ToUserName``.
        from_user: sender id placed in ``FromUserName``.
        content: reply text; Markdown is converted before sending.
        response_type: ``'image'`` sends ``media_id`` instead of text.
        media_id: id of an uploaded image, used when ``response_type`` is
            ``'image'``.
        encrypt_type: ``'aes'`` wraps the reply in an encrypted, signed
            envelope; any other value sends it in plaintext.

    Returns:
        A Flask response with content type ``application/xml``.
    """
    timestamp = str(int(time.time()))
    nonce = ''.join(secrets.choice(_ALPHANUMERIC) for _ in range(10))

    # NOTE(review): the element layout below follows WeChat's passive-reply
    # and encrypted-envelope formats - confirm against the deployed version.
    if response_type == 'image' and media_id:
        xml_content = (
            '<xml>'
            f'<ToUserName>{_cdata(to_user)}</ToUserName>'
            f'<FromUserName>{_cdata(from_user)}</FromUserName>'
            f'<CreateTime>{timestamp}</CreateTime>'
            '<MsgType><![CDATA[image]]></MsgType>'
            f'<Image><MediaId>{_cdata(media_id)}</MediaId></Image>'
            '</xml>'
        )
    else:
        formatted_content = convert_markdown_to_wechat(content)
        xml_content = (
            '<xml>'
            f'<ToUserName>{_cdata(to_user)}</ToUserName>'
            f'<FromUserName>{_cdata(from_user)}</FromUserName>'
            f'<CreateTime>{timestamp}</CreateTime>'
            '<MsgType><![CDATA[text]]></MsgType>'
            f'<Content>{_cdata(formatted_content)}</Content>'
            '</xml>'
        )

    if encrypt_type == 'aes':
        encrypted = session_manager.crypto.encrypt(xml_content)
        msg_signature = _sha1_signature(TOKEN, timestamp, nonce, encrypted)
        response_xml = (
            '<xml>'
            f'<Encrypt>{_cdata(encrypted)}</Encrypt>'
            f'<MsgSignature>{_cdata(msg_signature)}</MsgSignature>'
            f'<TimeStamp>{timestamp}</TimeStamp>'
            f'<Nonce>{_cdata(nonce)}</Nonce>'
            '</xml>'
        )
    else:
        response_xml = xml_content

    response = make_response(response_xml)
    response.content_type = 'application/xml'
    return response


# Global token manager instance
token_manager = AccessTokenManager()


def _post_media(access_token, image_data):
    """POST ``image_data`` to the media upload endpoint; return parsed JSON."""
    upload_url = f'https://api.weixin.qq.com/cgi-bin/media/upload?access_token={access_token}&type=image'
    files = {'media': ('image.jpg', image_data, 'image/jpeg')}
    response = requests.post(upload_url, files=files, timeout=HTTP_TIMEOUT)
    response.raise_for_status()
    return response.json()


def upload_image_to_wechat(image_data):
    """Upload an image to the WeChat server and return its media_id.

    If the first attempt is rejected with an access-token error code, the
    token is refreshed and the upload is retried once.

    Raises:
        ValueError: the final response contains no ``media_id``.
        Exception: any error from the HTTP calls is logged and re-raised.
    """
    try:
        access_token = token_manager.get_token()
        logging.info("开始上传图片到微信服务器")
        result = _post_media(access_token, image_data)

        if 'media_id' not in result and result.get('errcode') in _TOKEN_ERROR_CODES:
            # The access token may have expired: refresh it and retry once.
            logging.info("access_token已过期,正在刷新并重试")
            access_token = token_manager.refresh_token()
            result = _post_media(access_token, image_data)

        if 'media_id' not in result:
            error_msg = f"上传图片失败: {result}"
            logging.error(error_msg)
            raise ValueError(error_msg)

        logging.info("图片上传成功,获取到media_id")
        return result['media_id']
    except Exception as e:
        error_msg = f"上传图片过程中发生错误: {str(e)}"
        logging.error(error_msg)
        raise


def _generate_and_upload_image(prompt):
    """Generate an image for ``prompt``, upload it, and return its media_id."""
    image_response = requests.post(
        IMAGE_MODEL_URL,
        headers={
            'Content-Type': 'application/json',
            'Authorization': f'Bearer {IMAGE_MODEL_KEY}'
        },
        json={
            "model": "grok-latest-image",
            "messages": [{
                "role": "user",
                "content": prompt
            }]
        },
        timeout=IMAGE_GENERATION_TIMEOUT
    )
    image_response.raise_for_status()
    result = image_response.json()
    logging.info("图片生成成功,准备下载图片")

    # Extract the URL from the markdown-formatted reply.
    markdown_content = result['choices'][0]['message']['content']
    url_match = re.search(r'\!\[image\]\((.*?)\)', markdown_content or '')
    if url_match is None:
        raise ValueError('Image model response contains no image URL')
    image_url = url_match.group(1)
    logging.info(f"提取到图片URL: {image_url}")

    img_response = requests.get(image_url, timeout=HTTP_TIMEOUT)
    img_response.raise_for_status()
    return upload_image_to_wechat(img_response.content)


def process_long_running_task(messages):
    """Call the chat model and return its answer as a result dict.

    Returns:
        ``{"type": "image", "media_id": ...}`` when the model's first tool
        call is ``generate_image``; otherwise
        ``{"type": "text", "content": ...}``.

    Raises:
        Exception: any failure is logged and re-raised.
    """
    try:
        logging.info("开始调用AI服务")
        response = client.chat.completions.create(
            model="o3-mini",
            messages=messages,
            tools=TOOLS,
            tool_choice="auto",
            timeout=60
        )
        logging.info("AI服务响应成功")

        reply = response.choices[0].message
        if reply.tool_calls:
            logging.info("检测到tool调用")
            tool_call = reply.tool_calls[0]
            if tool_call.function.name == "generate_image":
                logging.info("开始处理图片生成请求")
                args = json.loads(tool_call.function.arguments)
                media_id = _generate_and_upload_image(args['prompt'])
                return {
                    "type": "image",
                    "media_id": media_id
                }

        logging.info("返回文本响应")
        return {
            "type": "text",
            # Content may be None (e.g. an unhandled tool call); callers
            # measure and split the text, so normalise it to a string.
            "content": reply.content or ""
        }
    except Exception as e:
        logging.error(f"API调用错误: {str(e)}")
        raise


def handle_async_task(session, task_id, messages):
    """Run one AI request in the background and record its outcome.

    Args:
        session: the ``UserSession`` that owns ``task_id``.
        task_id: key of the ``AsyncResponse`` in ``session.response_queue``.
        messages: snapshot of the conversation to send to the model.
    """
    try:
        logging.info(f"开始处理异步任务: {task_id}")
        if task_id not in session.response_queue:
            return

        result = process_long_running_task(messages)

        task = session.response_queue.get(task_id)
        if task is None or task.is_expired():
            return

        if result["type"] == "image":
            task.media_id = result["media_id"]
            task.result = None
            assistant_text = "图片已生成"
        else:
            task.result = result["content"]
            assistant_text = result["content"]
        task.response_type = result.get("type", "text")

        # Record the reply in the session history; ``messages`` is only a
        # snapshot, so appending to it would lose the assistant turn.
        session.messages.append({"role": "assistant", "content": assistant_text})

        # Publish the status last so a concurrent poll never observes a
        # "completed" task whose result has not been stored yet.
        task.status = "completed"
    except Exception as e:
        logging.error(f"异步任务处理失败: {str(e)}")
        task = session.response_queue.get(task_id)
        if task is not None:
            task.error = str(e)
            task.status = "failed"


def generate_initial_response():
    """Return the acknowledgement sent while a request is processed."""
    return "您的请求正在处理中,请回复'查询'获取结果(生图需要时间)"


def split_message(message, max_length=MAX_PART_LENGTH):
    """Split ``message`` into consecutive chunks of ``max_length`` chars."""
    return [message[i:i + max_length] for i in range(0, len(message), max_length)]


def append_status_message(content, has_pending_parts=False, is_processing=False):
    """Append the footer that tells the user which commands are available."""
    if "您的请求正在处理中" in content:
        return content + "\n\n-------------------\n发送'新对话'开始新的对话"

    status_message = "\n\n-------------------"
    if is_processing:
        status_message += "\n请回复'查询'获取结果"
    elif has_pending_parts:
        status_message += "\n当前消息已截断,发送'继续'查看后续内容"
    status_message += "\n发送'新对话'开始新的对话"
    return content + status_message


session_manager = SessionManager()


def _handle_continue(session, reply):
    """Send the next pending part of a long answer, if any."""
    if session.pending_parts:
        next_part = session.pending_parts.pop(0)
        has_more = bool(session.pending_parts)
        return reply(append_status_message(next_part, has_more))
    return reply(append_status_message('没有更多内容了。请继续您的问题。'))


def _handle_query(session, reply):
    """Report the state of the user's current background task."""
    task_id = session.current_task
    task = session.response_queue.get(task_id) if task_id else None
    if not task:
        return reply(append_status_message('没有正在处理的请求。'))

    expired = task.is_expired()
    if not expired and task.status not in ("completed", "failed"):
        return reply(append_status_message('正在处理中,请稍后再次查询。(生图需要时间)', is_processing=True))

    # Every remaining outcome is final, so the task is forgotten first.
    session.response_queue.pop(task_id, None)
    session.current_task = None

    if expired:
        return reply(append_status_message('请求已过期,请重新提问。'))
    if task.status == "failed":
        return reply(append_status_message('处理过程中出现错误,请重新提问。'))
    if task.response_type == "image":
        logging.info("返回图片响应")
        return reply("", response_type="image", media_id=task.media_id)

    text = task.result or ''
    if len(text) > MAX_PART_LENGTH:
        first_part, *remaining = split_message(text)
        session.pending_parts = remaining
        return reply(append_status_message(first_part, True))
    return reply(append_status_message(text))


@app.route('/api/wx', methods=['GET', 'POST'])
def wechatai():
    """Webhook endpoint: GET verifies the server, POST handles a message."""
    if request.method == 'GET':
        signature = request.args.get('signature')
        timestamp = request.args.get('timestamp')
        nonce = request.args.get('nonce')
        echostr = request.args.get('echostr')

        if verify_signature(signature, timestamp, nonce, TOKEN):
            return echostr or ''
        return 'error', 403

    # Bound before the try block so the error handler can always use them.
    encrypt_type = request.args.get('encrypt_type', '')
    message_data = None

    try:
        if encrypt_type == 'aes':
            msg_signature = request.args.get('msg_signature')
            timestamp = request.args.get('timestamp')
            nonce = request.args.get('nonce')

            xml_tree = ET.fromstring(request.data)
            encrypted_text = xml_tree.findtext('Encrypt')

            if not verify_msg_signature(msg_signature, timestamp, nonce, TOKEN, encrypted_text):
                return 'Invalid signature', 403

            decrypted_xml = session_manager.crypto.decrypt(encrypted_text)
            message_data = parse_xml_message(decrypted_xml)
        else:
            message_data = parse_xml_message(request.data)

        user_content = message_data['content'].strip()
        from_user = message_data['from_user']
        to_user = message_data['to_user']

        logging.info(f"收到用户({from_user})消息: {user_content}")

        def reply(content, **kwargs):
            # The reply goes back to the sender, so the ids are swapped.
            return generate_response_xml(
                from_user, to_user, content, encrypt_type=encrypt_type, **kwargs
            )

        session = session_manager.get_session(from_user)

        if user_content == '新对话':
            session_manager.clear_session(from_user)
            return reply(append_status_message('已开始新的对话。请描述您的问题。'))

        if user_content == '继续':
            return _handle_continue(session, reply)

        if user_content == '查询':
            return _handle_query(session, reply)

        session.messages.append({"role": "user", "content": user_content})
        task_id = str(uuid.uuid4())
        session.current_task = task_id
        session.response_queue[task_id] = AsyncResponse()

        executor.submit(handle_async_task, session, task_id, session.messages.copy())

        logging.info("返回初始响应")
        return reply(append_status_message(generate_initial_response(), is_processing=True))

    except Exception as e:
        logging.exception(f"处理请求时出错: {str(e)}")
        if message_data is None:
            # The message could not be parsed, so there is nobody to address
            # a reply to; acknowledge with the plain "success" body.
            return 'success'
        return generate_response_xml(
            message_data['from_user'],
            message_data['to_user'],
            append_status_message('抱歉,系统暂时出现问题,请稍后重试。'),
            encrypt_type=encrypt_type
        )


def cleanup_sessions():
    """Remove expired sessions forever, once per hour."""
    while True:
        time.sleep(3600)  # Clean up once per hour
        try:
            session_manager.cleanup_expired_sessions()
        except Exception as e:
            logging.error(f"清理会话时出错: {str(e)}")


if __name__ == '__main__':
    cleanup_thread = threading.Thread(target=cleanup_sessions, daemon=True)
    cleanup_thread.start()
    # The interactive debugger must not be reachable on a publicly bound
    # port, so debug mode is opt-in through the FLASK_DEBUG variable.
    debug_enabled = os.getenv('FLASK_DEBUG', '').lower() in ('1', 'true')
    app.run(host='0.0.0.0', port=7860, debug=debug_enabled)