hiddenFront's picture
Update app.py
e66afc2 verified
raw
history blame
2.35 kB
from fastapi import FastAPI, Request
from transformers import AutoTokenizer
from huggingface_hub import hf_hub_download
import torch
import pickle
import os
import psutil
import sys
# --- Application and inference device -------------------------------------
app = FastAPI()
device = torch.device("cpu")  # Space runs on CPU; keep all tensors there

# Model artifact location on the Hugging Face Hub.
HF_MODEL_REPO_ID = "hiddenFront/TextClassifier"
HF_MODEL_FILENAME = "textClassifierModel.pt"


def _rss_mb() -> float:
    """Return this process's resident set size in megabytes."""
    return psutil.Process(os.getpid()).memory_info().rss / (1024 * 1024)


# --- Label map: category.pkl must sit next to this script ------------------
try:
    with open("category.pkl", "rb") as f:
        category = pickle.load(f)
    print("βœ… category.pkl λ‘œλ“œ 성곡.")
except FileNotFoundError:
    print("❌ Error: category.pkl νŒŒμΌμ„ 찾을 수 μ—†μŠ΅λ‹ˆλ‹€. ν”„λ‘œμ νŠΈ λ£¨νŠΈμ— μžˆλŠ”μ§€ ν™•μΈν•˜μ„Έμš”.")
    sys.exit(1)

# --- Tokenizer -------------------------------------------------------------
tokenizer = AutoTokenizer.from_pretrained("skt/kobert-base-v1")
print("βœ… ν† ν¬λ‚˜μ΄μ € λ‘œλ“œ 성곡.")

# --- Model download + load, with RSS reported at each stage ----------------
mem_before = _rss_mb()
print(f"πŸ“¦ λͺ¨λΈ λ‹€μš΄λ‘œλ“œ μ „ λ©”λͺ¨λ¦¬ μ‚¬μš©λŸ‰: {mem_before:.2f} MB")

try:
    model_path = hf_hub_download(repo_id=HF_MODEL_REPO_ID, filename=HF_MODEL_FILENAME)
    print(f"βœ… λͺ¨λΈ 파일 λ‹€μš΄λ‘œλ“œ 성곡: {model_path}")

    mem_after_dl = _rss_mb()
    print(f"πŸ“¦ λͺ¨λΈ λ‹€μš΄λ‘œλ“œ ν›„ λ©”λͺ¨λ¦¬ μ‚¬μš©λŸ‰: {mem_after_dl:.2f} MB")

    # NOTE(review): this unpickles a full model object from the Hub —
    # torch.load on a pickled checkpoint executes arbitrary code if the
    # file is tampered with; only load artifacts you trust.
    model = torch.load(model_path, map_location=device)
    model.eval()  # inference mode: disable dropout/batch-norm updates

    mem_after_load = _rss_mb()
    print(f"πŸ“¦ λͺ¨λΈ λ‘œλ“œ ν›„ λ©”λͺ¨λ¦¬ μ‚¬μš©λŸ‰: {mem_after_load:.2f} MB")
    print("βœ… λͺ¨λΈ λ‘œλ“œ 성곡")
except Exception as e:
    print(f"❌ Error: λͺ¨λΈ λ‹€μš΄λ‘œλ“œ λ˜λŠ” λ‘œλ“œ 쀑 였λ₯˜ λ°œμƒ: {e}")
    sys.exit(1)
# 예츑 API
@app.post("/predict")
async def predict_api(request: Request):
    """Classify the JSON body's "text" field with the loaded model.

    Expects ``{"text": "..."}``; responds with the input text and the
    predicted category label, or an error object when no text is given.
    """
    payload = await request.json()
    text = payload.get("text")

    # Guard clause: missing or empty text short-circuits with an error.
    if not text:
        return {"error": "No text provided", "classification": "null"}

    # Tokenize to a fixed 64-token window (padded/truncated as needed).
    encoded = tokenizer.encode_plus(
        text,
        max_length=64,
        padding='max_length',
        truncation=True,
        return_tensors='pt',
    )

    # Inference only — no gradient bookkeeping.
    with torch.no_grad():
        logits = model(**encoded).logits

    probabilities = torch.nn.functional.softmax(logits, dim=1)
    predicted_index = torch.argmax(probabilities, dim=1).item()

    # Labels come from the insertion order of the category mapping.
    label = list(category)[predicted_index]
    return {"text": text, "classification": label}