Spaces:
Running
Running
import asyncio | |
import atexit | |
import base64 | |
import glob | |
import io | |
import json | |
import os | |
import queue | |
import re | |
import shutil | |
import signal | |
import subprocess | |
import sys | |
import time | |
import uuid | |
from pathlib import Path | |
from typing import Dict, Optional | |
import matplotlib | |
import PIL.Image | |
from jupyter_client import BlockingKernelClient | |
sys.path.insert(0, str(Path(__file__).absolute().parent.parent.parent)) # NOQA | |
from qwen_agent.log import logger # NOQA | |
from qwen_agent.utils.utils import extract_code, print_traceback # NOQA | |
WORK_DIR = os.getenv('M6_CODE_INTERPRETER_WORK_DIR', '/tmp/m6_ci_workspace') | |
STATIC_URL = os.getenv('M6_CODE_INTERPRETER_STATIC_URL', | |
'http://127.0.0.1:7866/static') | |
LAUNCH_KERNEL_PY = """ | |
from ipykernel import kernelapp as app | |
app.launch_new_instance() | |
""" | |
INIT_CODE_FILE = str( | |
Path(__file__).absolute().parent / 'resource' / | |
'code_interpreter_init_kernel.py') | |
ALIB_FONT_FILE = str( | |
Path(__file__).absolute().parent / 'resource' / | |
'AlibabaPuHuiTi-3-45-Light.ttf') | |
_KERNEL_CLIENTS: Dict[int, BlockingKernelClient] = {} | |
def _start_kernel(pid) -> BlockingKernelClient: | |
connection_file = os.path.join(WORK_DIR, | |
f'kernel_connection_file_{pid}.json') | |
launch_kernel_script = os.path.join(WORK_DIR, f'launch_kernel_{pid}.py') | |
for f in [connection_file, launch_kernel_script]: | |
if os.path.exists(f): | |
logger.info(f'WARNING: {f} already exists') | |
os.remove(f) | |
os.makedirs(WORK_DIR, exist_ok=True) | |
with open(launch_kernel_script, 'w') as fout: | |
fout.write(LAUNCH_KERNEL_PY) | |
kernel_process = subprocess.Popen([ | |
sys.executable, | |
launch_kernel_script, | |
'--IPKernelApp.connection_file', | |
connection_file, | |
'--matplotlib=inline', | |
'--quiet', | |
], | |
cwd=WORK_DIR) | |
logger.info(f"INFO: kernel process's PID = {kernel_process.pid}") | |
# Wait for kernel connection file to be written | |
while True: | |
if not os.path.isfile(connection_file): | |
time.sleep(0.1) | |
else: | |
# Keep looping if JSON parsing fails, file may be partially written | |
try: | |
with open(connection_file, 'r') as fp: | |
json.load(fp) | |
break | |
except json.JSONDecodeError: | |
pass | |
# Client | |
kc = BlockingKernelClient(connection_file=connection_file) | |
asyncio.set_event_loop_policy(asyncio.DefaultEventLoopPolicy()) | |
kc.load_connection_file() | |
kc.start_channels() | |
kc.wait_for_ready() | |
return kc | |
def _kill_kernels(): | |
for v in _KERNEL_CLIENTS.values(): | |
v.shutdown() | |
for k in list(_KERNEL_CLIENTS.keys()): | |
del _KERNEL_CLIENTS[k] | |
atexit.register(_kill_kernels) | |
signal.signal(signal.SIGTERM, _kill_kernels) | |
signal.signal(signal.SIGINT, _kill_kernels) | |
def _serve_image(image_base64: str) -> str: | |
image_file = f'{uuid.uuid4()}.png' | |
local_image_file = os.path.join(WORK_DIR, image_file) | |
png_bytes = base64.b64decode(image_base64) | |
assert isinstance(png_bytes, bytes) | |
bytes_io = io.BytesIO(png_bytes) | |
PIL.Image.open(bytes_io).save(local_image_file, 'png') | |
image_url = f'{STATIC_URL}/{image_file}' | |
return image_url | |
def _escape_ansi(line: str) -> str: | |
ansi_escape = re.compile(r'(?:\x1B[@-_]|[\x80-\x9F])[0-?]*[ -/]*[@-~]') | |
return ansi_escape.sub('', line) | |
def _execute_code(kc: BlockingKernelClient, code: str) -> str: | |
kc.wait_for_ready() | |
kc.execute(code) | |
result = '' | |
image_idx = 0 | |
while True: | |
text = '' | |
image = '' | |
finished = False | |
msg_type = 'error' | |
try: | |
msg = kc.get_iopub_msg() | |
msg_type = msg['msg_type'] | |
if msg_type == 'status': | |
if msg['content'].get('execution_state') == 'idle': | |
finished = True | |
elif msg_type == 'execute_result': | |
text = msg['content']['data'].get('text/plain', '') | |
if 'image/png' in msg['content']['data']: | |
image_b64 = msg['content']['data']['image/png'] | |
image_url = _serve_image(image_b64) | |
image_idx += 1 | |
image = '![fig-%03d](%s)' % (image_idx, image_url) | |
elif msg_type == 'display_data': | |
if 'image/png' in msg['content']['data']: | |
image_b64 = msg['content']['data']['image/png'] | |
image_url = _serve_image(image_b64) | |
image_idx += 1 | |
image = '![fig-%03d](%s)' % (image_idx, image_url) | |
else: | |
text = msg['content']['data'].get('text/plain', '') | |
elif msg_type == 'stream': | |
msg_type = msg['content']['name'] # stdout, stderr | |
text = msg['content']['text'] | |
elif msg_type == 'error': | |
text = _escape_ansi('\n'.join(msg['content']['traceback'])) | |
if 'M6_CODE_INTERPRETER_TIMEOUT' in text: | |
text = 'Timeout: Code execution exceeded the time limit.' | |
except queue.Empty: | |
text = 'Timeout: Code execution exceeded the time limit.' | |
finished = True | |
except Exception: | |
text = 'The code interpreter encountered an unexpected error.' | |
print_traceback() | |
finished = True | |
if text: | |
result += f'\n\n{msg_type}:\n\n```\n{text}\n```' | |
if image: | |
result += f'\n\n{image}' | |
if finished: | |
break | |
result = result.lstrip('\n') | |
return result | |
def _fix_matplotlib_cjk_font_issue(): | |
ttf_name = os.path.basename(ALIB_FONT_FILE) | |
local_ttf = os.path.join( | |
os.path.abspath( | |
os.path.join(matplotlib.matplotlib_fname(), os.path.pardir)), | |
'fonts', 'ttf', ttf_name) | |
if not os.path.exists(local_ttf): | |
try: | |
shutil.copy(ALIB_FONT_FILE, local_ttf) | |
font_list_cache = os.path.join(matplotlib.get_cachedir(), | |
'fontlist-*.json') | |
for cache_file in glob.glob(font_list_cache): | |
with open(cache_file) as fin: | |
cache_content = fin.read() | |
if ttf_name not in cache_content: | |
os.remove(cache_file) | |
except Exception: | |
print_traceback() | |
def code_interpreter(action_input: str, timeout: Optional[int] = 30) -> str: | |
code = extract_code(action_input) | |
if not code.strip(): | |
return '' | |
pid: int = os.getpid() | |
if pid in _KERNEL_CLIENTS: | |
kc = _KERNEL_CLIENTS[pid] | |
else: | |
_fix_matplotlib_cjk_font_issue() | |
kc = _start_kernel(pid) | |
with open(INIT_CODE_FILE) as fin: | |
start_code = fin.read() | |
start_code = start_code.replace('{{M6_FONT_PATH}}', | |
repr(ALIB_FONT_FILE)[1:-1]) | |
logger.info(_execute_code(kc, start_code)) | |
_KERNEL_CLIENTS[pid] = kc | |
if timeout: | |
code = f'_M6CountdownTimer.start({timeout})\n{code}' | |
fixed_code = [] | |
for line in code.split('\n'): | |
fixed_code.append(line) | |
if line.startswith('sns.set_theme('): | |
fixed_code.append( | |
'plt.rcParams["font.family"] = _m6_font_prop.get_name()') | |
fixed_code = '\n'.join(fixed_code) | |
result = _execute_code(kc, fixed_code) | |
if timeout: | |
_execute_code(kc, '_M6CountdownTimer.cancel()') | |
return result | |
def _get_multiline_input(hint: str) -> str: | |
logger.info( | |
'// Press ENTER to make a new line. Press CTRL-D to end input.') | |
lines = [] | |
while True: | |
try: | |
line = input() | |
except EOFError: # CTRL-D | |
break | |
lines.append(line) | |
logger.info('// Input received.') | |
if lines: | |
return '\n'.join(lines) | |
else: | |
return '' | |
if __name__ == '__main__': | |
while True: | |
logger.info( | |
code_interpreter(_get_multiline_input('Enter python code:'))) | |