File size: 6,343 Bytes
cff82fa d62232c 0b0a2f7 b8a7df8 1ddc959 d62232c 1ddc959 1af48fa d62232c 1af48fa 0b0a2f7 1af48fa d62232c 1ddc959 82c93cf 783c658 1ddc959 0b0a2f7 3f0a3dd 1af48fa 3e3ea9a 1af48fa d37cc67 1af48fa 60cf2f7 1af48fa 7158ded b54a508 7158ded 60cf2f7 1af48fa 52bcfe4 1af48fa 3f0a3dd 52bcfe4 9d7f082 3f0a3dd 9410047 52bcfe4 9410047 b8a7df8 9410047 783c658 e86d80a fc14950 b8a7df8 9410047 e86d80a 9410047 3f0a3dd 9410047 3f0a3dd b54a508 3f0a3dd b3ed199 0b0a2f7 b3ed199 3f0a3dd b3ed199 9d7f082 3f0a3dd 1af48fa 3f0a3dd f0d6a67 1af48fa 9d7f082 b3ed199 3f0a3dd 0b0a2f7 9410047 3790bd8 b8a7df8 60cf2f7 783c658 60cf2f7 783c658 0b0a2f7 1ddc959 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 |
import json
import traceback
import httpx
import secrets
from contextlib import asynccontextmanager
from fastapi import FastAPI, HTTPException, Depends
from models import RequestModel
from utils import config, api_keys_db, api_list, error_handling_wrapper, get_all_models, verify_api_key
from request import get_payload
from response import fetch_response, fetch_response_stream
from typing import List, Dict
from urllib.parse import urlparse
from fastapi.responses import StreamingResponse
@asynccontextmanager
async def lifespan(app: FastAPI):
    """Create the shared HTTP client on startup and close it on shutdown.

    The client is stored on ``app.state.client`` so the rest of the
    application can reach it through the app object.
    """
    # Startup: build one AsyncClient with explicit per-phase timeouts.
    timeout = httpx.Timeout(connect=15.0, read=5.0, write=30.0, pool=30.0)
    app.state.client = httpx.AsyncClient(timeout=timeout)
    try:
        yield
    finally:
        # Shutdown: the finally clause also runs when an exception is thrown
        # into the generator at the yield, so the client is always closed.
        await app.state.client.aclose()
# Application instance; `lifespan` runs the startup and shutdown code around it.
app = FastAPI(lifespan=lifespan)
async def process_request(request: RequestModel, provider: Dict):
    """Send one request to a single provider and return its response.

    The engine is first guessed from the provider's base URL. It is then
    forced to "openrouter" when the provider's mapped model name contains
    none of "claude", "gpt" or "gemini", and finally replaced by the
    provider's own "engine" entry when that entry is truthy.

    Streaming requests are returned as a StreamingResponse with the
    "text/event-stream" media type; all other requests return the awaited
    result of fetch_response.
    """
    print("provider: ", provider['provider'])
    base_url = provider['base_url']
    location = urlparse(base_url)

    # First guess: choose the engine from the endpoint's host (or path).
    host = location.netloc
    if host == 'generativelanguage.googleapis.com':
        engine = "gemini"
    elif host == 'api.anthropic.com' or location.path.endswith("v1/messages"):
        engine = "claude"
    elif host == 'openrouter.ai':
        engine = "openrouter"
    else:
        engine = "gpt"

    # Mapped model names outside the three known families use "openrouter".
    mapped_model = provider['model'][request.model]
    known_families = ("claude", "gpt", "gemini")
    if not any(family in mapped_model for family in known_families):
        engine = "openrouter"

    # A truthy "engine" entry on the provider overrides every guess above.
    explicit_engine = provider.get("engine")
    if explicit_engine:
        engine = explicit_engine
    print("engine", engine)

    url, headers, payload = await get_payload(request, engine, provider)

    if not request.stream:
        return await fetch_response(app.state.client, url, headers, payload)

    model = provider['model'][request.model]
    generator = fetch_response_stream(app.state.client, url, headers, payload, engine, model)
    wrapped_generator = await error_handling_wrapper(generator, status_code=500)
    return StreamingResponse(wrapped_generator, media_type="text/event-stream")
class ModelRequestHandler:
    """Pick the providers that can serve a model and dispatch requests to them."""

    def __init__(self):
        # Index of the provider used by the most recent attempt; -1 until
        # try_all_providers has made its first attempt.
        self.last_provider_index = -1

    def get_matching_providers(self, model_name, token):
        """Return the configured providers that may serve ``model_name``.

        The API key's ``model`` list is scanned for entries containing "/".
        The part before the first "/" names a provider; that provider is
        added to the allow-list when it offers ``model_name``. If no entry
        produces an allow-list, every provider offering ``model_name`` is
        returned.

        Raises:
            ValueError: if ``token`` is not present in ``api_list``.
        """
        api_index = api_list.index(token)

        provider_rules = []
        for rule in config['api_keys'][api_index]['model']:
            if "/" not in rule:
                continue
            parts = rule.split("/")
            provider_name, rule_model = parts[0], parts[1]
            # NOTE(review): the model part of the rule only has to be
            # non-empty; it is never compared with model_name. Confirm that
            # this is the intended matching rule.
            if not rule_model:
                continue
            for provider in config['providers']:
                if provider['provider'] == provider_name and model_name in provider['model']:
                    provider_rules.append(provider_name)

        # An empty allow-list means "no restriction".
        return [
            provider
            for provider in config['providers']
            if model_name in provider['model']
            and (not provider_rules or provider['provider'] in provider_rules)
        ]

    async def request_model(self, request: RequestModel, token: str):
        """Resolve the providers for ``request.model`` and forward the request.

        Raises:
            HTTPException: 404 when no provider matches the requested model.
        """
        model_name = request.model
        matching_providers = self.get_matching_providers(model_name, token)
        # NOTE(review): this prints the full provider entries; if they hold
        # credentials, those end up in the process output. Confirm.
        print("matching_providers", json.dumps(matching_providers, indent=4, ensure_ascii=False))
        if not matching_providers:
            raise HTTPException(status_code=404, detail="No matching model found")

        # Check whether round-robin is enabled for this API key.
        api_index = api_list.index(token)
        preferences = config['api_keys'][api_index].get("preferences")
        use_round_robin = preferences.get("USE_ROUND_ROBIN") if preferences else False

        return await self.try_all_providers(request, matching_providers, use_round_robin)

    async def try_all_providers(self, request: RequestModel, providers: List[Dict], use_round_robin: bool):
        """Try ``providers`` in order and return the first successful response.

        With ``use_round_robin`` falsy, the first failure is reported
        immediately. With it truthy, a failure moves on to the next provider.

        Raises:
            HTTPException: 500 when the current provider fails and
                ``use_round_robin`` is falsy, when every attempt fails, or
                when ``providers`` is empty.
        """
        num_providers = len(providers)
        if num_providers == 0:
            # Without this guard the modulo below raises ZeroDivisionError.
            raise HTTPException(status_code=500, detail="All providers failed")

        # The loop runs one extra iteration, so after every provider has
        # failed once the first provider is attempted a second time.
        for i in range(num_providers + 1):
            self.last_provider_index = i % num_providers
            provider = providers[self.last_provider_index]
            try:
                return await process_request(request, provider)
            except Exception as e:
                # Print the failure in red, then restore the terminal colour.
                print('\033[31m')
                print(f"Error with provider {provider['provider']}: {str(e)}")
                traceback.print_exc()
                print('\033[0m')
                if not use_round_robin:
                    raise HTTPException(
                        status_code=500,
                        detail="Error: Current provider response failed!",
                    ) from e

        raise HTTPException(status_code=500, detail="All providers failed")
# Module-level handler instance used by the chat-completions endpoint.
model_handler = ModelRequestHandler()
# Chat-completions endpoint: the token comes from the verify_api_key
# dependency, and the request is handed to the module-level model_handler.
@app.post("/v1/chat/completions")
async def request_model(request: RequestModel, token: str = Depends(verify_api_key)):
    return await model_handler.request_model(request, token)
# Model listing for the authenticated API key. OpenAI-style clients fetch the
# model list with GET, so GET is registered alongside the original POST route
# (POST is kept so existing callers keep working).
@app.get("/v1/models")
@app.post("/v1/models")
async def list_models(token: str = Depends(verify_api_key)):
    models = get_all_models(token)
    return {
        "object": "list",
        "data": models,
    }
# Return a freshly generated random key of the form "sk-<url-safe token>".
# The key is only handed back to the caller; this function does not store it.
@app.get("/generate-api-key")
def generate_api_key():
    token = secrets.token_urlsafe(32)
    return {"api_key": f"sk-{token}"}
# async def on_fetch(request, env):
# import asgi
# return await asgi.fetch(app, request, env)
if __name__ == '__main__':
    # When executed as a script, serve the app with uvicorn on port 8000
    # with auto-reload enabled.
    import uvicorn
    uvicorn.run("__main__:app", host="0.0.0.0", port=8000, reload=True)