Spaces:
Running
Running
Update config.py
Browse files
config.py
CHANGED
|
@@ -4,6 +4,7 @@ import json
|
|
| 4 |
from datetime import datetime
|
| 5 |
import time
|
| 6 |
import threading
|
|
|
|
| 7 |
|
| 8 |
ARENA_NAME = "# 🏆 The GPU-Poor LLM Gladiator Arena 🏆 v25.10"
|
| 9 |
|
|
@@ -61,6 +62,10 @@ def load_approved_models():
|
|
| 61 |
MODEL_REFRESH_INTERVAL = 3600 # Check every 1 hour
|
| 62 |
_last_model_check = 0 # Track last check time
|
| 63 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 64 |
def get_approved_models():
|
| 65 |
"""Get the current list of approved models with periodic refresh."""
|
| 66 |
global _last_model_check
|
|
@@ -72,7 +77,7 @@ def get_approved_models():
|
|
| 72 |
get_approved_models._models = load_approved_models()
|
| 73 |
_last_model_check = current_time
|
| 74 |
|
| 75 |
-
return get_approved_models._models
|
| 76 |
|
| 77 |
def refresh_approved_models():
|
| 78 |
"""Force refresh of the approved models list."""
|
|
@@ -80,6 +85,9 @@ def refresh_approved_models():
|
|
| 80 |
delattr(get_approved_models, '_models')
|
| 81 |
return get_approved_models()
|
| 82 |
|
|
|
|
|
|
|
|
|
|
| 83 |
# Keep FALLBACK_MODELS as a safety net
|
| 84 |
FALLBACK_MODELS = [
|
| 85 |
("hf.co/unsloth/Qwen3-4B-Instruct-2507-GGUF:Q8_K_XL", "Qwen 3 Instruct 2507 Unsloth (4B, 8-bit)")
|
|
|
|
| 4 |
from datetime import datetime
|
| 5 |
import time
|
| 6 |
import threading
|
| 7 |
+
import leaderboard
|
| 8 |
|
| 9 |
ARENA_NAME = "# 🏆 The GPU-Poor LLM Gladiator Arena 🏆 v25.10"
|
| 10 |
|
|
|
|
| 62 |
MODEL_REFRESH_INTERVAL = 3600 # Check every 1 hour
|
| 63 |
_last_model_check = 0 # Track last check time
|
| 64 |
|
| 65 |
+
# Model archiving configuration
|
| 66 |
+
ARCHIVE_BATTLE_THRESHOLD = int(os.environ.get("ARCHIVE_BATTLE_THRESHOLD", 150))
|
| 67 |
+
ARCHIVED_MODELS_PATH = os.environ.get("NEXTCLOUD_ARCHIVED_MODELS_PATH", "/gpu_poor_archived_models.json")
|
| 68 |
+
|
| 69 |
def get_approved_models():
|
| 70 |
"""Get the current list of approved models with periodic refresh."""
|
| 71 |
global _last_model_check
|
|
|
|
| 77 |
get_approved_models._models = load_approved_models()
|
| 78 |
_last_model_check = current_time
|
| 79 |
|
| 80 |
+
return [model for model in get_approved_models._models if model[0] not in leaderboard.load_archived_models()]
|
| 81 |
|
| 82 |
def refresh_approved_models():
|
| 83 |
"""Force refresh of the approved models list."""
|
|
|
|
| 85 |
delattr(get_approved_models, '_models')
|
| 86 |
return get_approved_models()
|
| 87 |
|
| 88 |
+
# Maximum tokens for model generation to prevent timeouts
|
| 89 |
+
MAX_TOKENS = int(os.environ.get("MAX_TOKENS", 2048)) # Increased to 2048 based on feedback
|
| 90 |
+
|
| 91 |
# Keep FALLBACK_MODELS as a safety net
|
| 92 |
FALLBACK_MODELS = [
|
| 93 |
("hf.co/unsloth/Qwen3-4B-Instruct-2507-GGUF:Q8_K_XL", "Qwen 3 Instruct 2507 Unsloth (4B, 8-bit)")
|