File size: 11,185 Bytes
319a292
f84a20c
03ed2e0
64cb25e
03ed2e0
64cb25e
d02c5c6
d18a95c
319a292
64cb25e
 
aea29cb
64cb25e
 
03ed2e0
319a292
 
 
 
 
f84a20c
319a292
d18a95c
 
 
319a292
 
 
 
d18a95c
64cb25e
d18a95c
 
319a292
 
 
 
 
 
 
 
b5bc6a9
319a292
 
 
 
64cb25e
 
 
 
 
 
 
 
 
 
 
 
319a292
b5bc6a9
319a292
b5bc6a9
64cb25e
b5bc6a9
64cb25e
 
319a292
3504513
 
64cb25e
 
 
f173552
03ed2e0
 
 
 
 
64cb25e
03ed2e0
 
 
 
 
 
 
 
64cb25e
03ed2e0
 
 
 
 
64cb25e
03ed2e0
64cb25e
03ed2e0
 
64cb25e
03ed2e0
 
319a292
a58952e
64cb25e
319a292
b5bc6a9
04f810c
64cb25e
 
 
 
 
 
3e20aa7
64cb25e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3e20aa7
f564ebf
64cb25e
f564ebf
64cb25e
f564ebf
 
 
64cb25e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
a58952e
f564ebf
64cb25e
 
 
 
 
 
 
 
 
 
 
 
 
 
e86e33b
 
64cb25e
 
 
 
 
 
 
 
 
 
 
 
 
 
aea29cb
d18a95c
64cb25e
 
 
 
 
 
 
 
 
 
 
 
 
aea29cb
3e20aa7
64cb25e
3e20aa7
319a292
64cb25e
d18a95c
319a292
64cb25e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
d706a96
 
64cb25e
a58952e
319a292
aea29cb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
import os
import json
import uuid
import requests
import threading
import logging
from fastapi import FastAPI, HTTPException
from pydantic import BaseModel
from google.cloud import storage
from google.auth import exceptions
from transformers import pipeline
from dotenv import load_dotenv
import uvicorn
import io

load_dotenv()

API_KEY = os.getenv("API_KEY")
GCS_BUCKET_NAME = os.getenv("GCS_BUCKET_NAME")
GOOGLE_APPLICATION_CREDENTIALS_JSON = os.getenv("GOOGLE_APPLICATION_CREDENTIALS_JSON")
HF_API_TOKEN = os.getenv("HF_API_TOKEN")

logging.basicConfig(level=logging.DEBUG, format='%(asctime)s - %(levelname)s - %(message)s')
logger = logging.getLogger(__name__)

try:
    credentials_info = json.loads(GOOGLE_APPLICATION_CREDENTIALS_JSON)
    storage_client = storage.Client.from_service_account_info(credentials_info)
    bucket = storage_client.bucket(GCS_BUCKET_NAME)
    logger.info(f"Conexión con Google Cloud Storage exitosa. Bucket: {GCS_BUCKET_NAME}")
except (exceptions.DefaultCredentialsError, json.JSONDecodeError, KeyError, ValueError) as e:
    logger.error(f"Error al cargar las credenciales o bucket: {e}")
    raise RuntimeError(f"Error al cargar las credenciales o bucket: {e}")

app = FastAPI()

class DownloadModelRequest(BaseModel):
    model_name: str
    pipeline_task: str
    input_text: str

class GCSHandler:
    def __init__(self, bucket_name):
        self.bucket = storage_client.bucket(bucket_name)

    def file_exists(self, blob_name):
        exists = self.bucket.blob(blob_name).exists()
        logger.debug(f"Comprobando existencia de archivo '{blob_name}': {exists}")
        return exists

    def upload_file(self, blob_name, file_stream):
        blob = self.bucket.blob(blob_name)
        try:
            blob.upload_from_file(file_stream)
            logger.info(f"Archivo '{blob_name}' subido exitosamente a GCS.")
        except Exception as e:
            logger.error(f"Error subiendo el archivo '{blob_name}' a GCS: {e}")
            raise HTTPException(status_code=500, detail=f"Error subiendo archivo '{blob_name}' a GCS")

    def download_file(self, blob_name):
        blob = self.bucket.blob(blob_name)
        if not blob.exists():
            logger.error(f"Archivo '{blob_name}' no encontrado en GCS.")
            raise HTTPException(status_code=404, detail=f"File '{blob_name}' not found.")
        logger.debug(f"Descargando archivo '{blob_name}' de GCS.")
        return blob.open("rb")  # Abre el archivo en modo lectura de bytes

    def generate_signed_url(self, blob_name, expiration=3600):
        blob = self.bucket.blob(blob_name)
        url = blob.generate_signed_url(expiration=expiration)
        logger.debug(f"Generada URL firmada para '{blob_name}': {url}")
        return url

def download_model_from_huggingface(model_name):
    url = f"https://huggingface.co/{model_name}/tree/main"
    headers = {"Authorization": f"Bearer {HF_API_TOKEN}"}
    
    try:
        logger.info(f"Descargando el modelo '{model_name}' desde Hugging Face...")
        response = requests.get(url, headers=headers)
        if response.status_code == 200:
            model_files = [
                "pytorch_model.bin",
                "config.json",
                "tokenizer.json",
                "model.safetensors",
            ]
            for file_name in model_files:
                file_url = f"https://huggingface.co/{model_name}/resolve/main/{file_name}"
                file_content = requests.get(file_url).content
                blob_name = f"{model_name}/{file_name}"
                blob = bucket.blob(blob_name)
                blob.upload_from_string(file_content)
                logger.info(f"Archivo '{file_name}' subido exitosamente al bucket GCS.")
        else:
            logger.error(f"Error al acceder al árbol de archivos de Hugging Face para '{model_name}'.")
            raise HTTPException(status_code=404, detail="Error al acceder al árbol de archivos de Hugging Face.")
    except Exception as e:
        logger.error(f"Error descargando archivos de Hugging Face: {e}")
        raise HTTPException(status_code=500, detail=f"Error descargando archivos de Hugging Face: {e}")

@app.post("/predict/")
async def predict(request: DownloadModelRequest):
    logger.info(f"Iniciando predicción para el modelo '{request.model_name}' con tarea '{request.pipeline_task}'...")
    try:
        gcs_handler = GCSHandler(GCS_BUCKET_NAME)
        model_prefix = request.model_name
        model_files = [
            "pytorch_model.bin",
            "config.json",
            "tokenizer.json",
            "model.safetensors",
        ]
        
        model_files_exist = all(gcs_handler.file_exists(f"{model_prefix}/{file}") for file in model_files)
        
        if not model_files_exist:
            logger.info(f"Modelos no encontrados en GCS, descargando '{model_prefix}' desde Hugging Face...")
            download_model_from_huggingface(model_prefix)
        
        model_files_streams = {file: gcs_handler.download_file(f"{model_prefix}/{file}") for file in model_files if gcs_handler.file_exists(f"{model_prefix}/{file}")}
        
        config_stream = model_files_streams.get("config.json")
        tokenizer_stream = model_files_streams.get("tokenizer.json")
        model_stream = model_files_streams.get("pytorch_model.bin")
        
        if not config_stream or not tokenizer_stream or not model_stream:
            logger.error(f"Faltan archivos necesarios para el modelo '{model_prefix}'.")
            raise HTTPException(status_code=500, detail="Required model files missing.")
        
        if request.pipeline_task in ["text-generation", "translation", "summarization"]:
            pipe = pipeline(request.pipeline_task, model=model_stream, tokenizer=tokenizer_stream)
            result = pipe(request.input_text)
            logger.info(f"Resultado generado para la tarea '{request.pipeline_task}': {result[0]}")
            return {"response": result[0]}

        elif request.pipeline_task == "image-generation":
            try:
                pipe = pipeline("image-generation", model=model_stream)
                images = pipe(request.input_text)
                image = images[0]
                image_filename = f"{uuid.uuid4().hex}.png"
                image_path = f"images/{image_filename}"
                image.save(image_path)
                
                gcs_handler.upload_file(image_path, open(image_path, "rb"))
                image_url = gcs_handler.generate_signed_url(image_path)
                logger.info(f"Imagen generada y subida correctamente con URL: {image_url}")
                return {"response": {"image_url": image_url}}
            except Exception as e:
                logger.error(f"Error generando la imagen: {e}")
                raise HTTPException(status_code=400, detail="Error generando la imagen.")

        elif request.pipeline_task == "image-editing":
            try:
                pipe = pipeline("image-editing", model=model_stream)
                edited_images = pipe(request.input_text)
                edited_image = edited_images[0]
                edited_image_filename = f"{uuid.uuid4().hex}_edited.png"
                edited_image.save(edited_image_filename)

                gcs_handler.upload_file(f"images/{edited_image_filename}", open(edited_image_filename, "rb"))
                edited_image_url = gcs_handler.generate_signed_url(f"images/{edited_image_filename}")
                logger.info(f"Imagen editada y subida correctamente con URL: {edited_image_url}")
                return {"response": {"edited_image_url": edited_image_url}}
            except Exception as e:
                logger.error(f"Error editando la imagen: {e}")
                raise HTTPException(status_code=400, detail="Error editando la imagen.")

        elif request.pipeline_task == "image-to-image":
            try:
                pipe = pipeline("image-to-image", model=model_stream)
                transformed_images = pipe(request.input_text)
                transformed_image = transformed_images[0]
                transformed_image_filename = f"{uuid.uuid4().hex}_transformed.png"
                transformed_image.save(transformed_image_filename)

                gcs_handler.upload_file(f"images/{transformed_image_filename}", open(transformed_image_filename, "rb"))
                transformed_image_url = gcs_handler.generate_signed_url(f"images/{transformed_image_filename}")
                logger.info(f"Imagen transformada y subida correctamente con URL: {transformed_image_url}")
                return {"response": {"transformed_image_url": transformed_image_url}}
            except Exception as e:
                logger.error(f"Error transformando la imagen: {e}")
                raise HTTPException(status_code=400, detail="Error transformando la imagen.")

        elif request.pipeline_task == "text-to-3d":
            try:
                model_3d_filename = f"{uuid.uuid4().hex}.obj"
                model_3d_path = f"3d-models/{model_3d_filename}"
                with open(model_3d_path, "w") as f:
                    f.write("Simulated 3D model data")

                gcs_handler.upload_file(f"3d-models/{model_3d_filename}", open(model_3d_path, "rb"))
                model_3d_url = gcs_handler.generate_signed_url(f"3d-models/{model_3d_filename}")
                logger.info(f"Modelo 3D generado y subido con URL: {model_3d_url}")
                return {"response": {"model_3d_url": model_3d_url}}
            except Exception as e:
                logger.error(f"Error generando el modelo 3D: {e}")
                raise HTTPException(status_code=400, detail="Error generando el modelo 3D.")

    except HTTPException as e:
        logger.error(f"HTTPException: {e.detail}")
        raise e
    except Exception as e:
        logger.error(f"Error inesperado: {e}")
        raise HTTPException(status_code=500, detail=f"Error: {e}")

def download_all_models_in_background():
    models_url = "https://huggingface.co/api/models"
    try:
        logger.info("Obteniendo lista de modelos desde Hugging Face...")
        response = requests.get(models_url)
        if response.status_code != 200:
            logger.error("Error al obtener la lista de modelos de Hugging Face.")
            raise HTTPException(status_code=500, detail="Error al obtener la lista de modelos.")
        
        models = response.json()
        for model in models:
            model_name = model["id"]
            logger.info(f"Descargando el modelo '{model_name}' desde Hugging Face...")
            download_model_from_huggingface(model_name)
    except Exception as e:
        logger.error(f"Error al descargar modelos en segundo plano: {e}")
        raise HTTPException(status_code=500, detail="Error al descargar modelos en segundo plano.")

def run_in_background():
    logger.info("Iniciando la descarga de modelos en segundo plano...")
    threading.Thread(target=download_all_models_in_background, daemon=True).start()

@app.on_event("startup")
async def startup_event():
    run_in_background()

if __name__ == "__main__":
    uvicorn.run(app, host="0.0.0.0", port=7860)