sunkencity committed on
Commit
4d6ed12
·
verified ·
1 Parent(s): 5c34124

Upload train_aviation.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. train_aviation.py +9 -17
train_aviation.py CHANGED
@@ -25,25 +25,17 @@ from peft import LoraConfig, prepare_model_for_kbit_training, get_peft_model
25
  from trl import SFTTrainer, SFTConfig
26
  from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, AutoConfig
27
 
28
- # Register 'ministral3' config if needed
29
  print("🔧 Registering ministral3 config...")
30
  try:
31
- # Try to find Mistral3Config (available in very recent transformers)
32
- from transformers import Mistral3Config
33
- AutoConfig.register("ministral3", Mistral3Config)
34
- print(" Registered ministral3 -> Mistral3Config")
35
- except ImportError:
36
- try:
37
- # Fallback to internal path if not exposed
38
- from transformers.models.mistral3.configuration_mistral3 import Mistral3Config
39
- AutoConfig.register("ministral3", Mistral3Config)
40
- print(" Registered ministral3 -> Mistral3Config (internal)")
41
- except ImportError:
42
- # Fallback to standard MistralConfig
43
- print(" Mistral3Config not found, falling back to MistralConfig")
44
- from transformers import MistralConfig
45
- AutoConfig.register("ministral3", MistralConfig)
46
- print(" Registered ministral3 -> MistralConfig")
47
 
48
  # Model ID
49
  # model_id defined above
 
25
  from trl import SFTTrainer, SFTConfig
26
  from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, AutoConfig
27
 
28
+ # Register 'ministral3' config to handle nested text_config
29
  print("🔧 Registering ministral3 config...")
30
  try:
31
+ from transformers import MistralConfig
32
+ class MinistralConfig(MistralConfig):
33
+ model_type = "ministral3"
34
+
35
+ AutoConfig.register("ministral3", MinistralConfig)
36
+ print(" Registered ministral3 -> MinistralConfig (subclass)")
37
+ except Exception as e:
38
+ print(f" ❌ Failed to register ministral3 config: {e}")
 
 
 
 
 
 
 
 
39
 
40
  # Model ID
41
  # model_id defined above