SmolFactory / config /train_smollm3_no_think_test.py
Tonic's picture
adds no think tag correctly
32fca7d verified
raw
history blame contribute delete
914 Bytes
"""
SmolLM3 Training Configuration with /no_think tag
Test configuration to verify /no_think tag functionality
"""
from config.train_smollm3 import SmolLM3Config
config = SmolLM3Config(
# Model configuration
model_name="HuggingFaceTB/SmolLM3-3B",
max_seq_length=4096,
use_flash_attention=True,
use_gradient_checkpointing=True,
# Training configuration
batch_size=2,
gradient_accumulation_steps=4,
learning_rate=2e-5,
weight_decay=0.01,
warmup_steps=100,
max_iters=100, # Short test run
# Mixed precision
fp16=True,
bf16=False,
# Logging and saving
save_steps=50,
eval_steps=25,
logging_steps=10,
# Chat template configuration with /no_think tag
use_chat_template=True,
chat_template_kwargs={
"add_generation_prompt": True,
"no_think_system_message": True # Enable /no_think tag
}
)