Upload folder using huggingface_hub

Files changed (13) hide show

.locks/models--psd401--llama3-2-1b-Solutions/ef85b799c596b5809377eb3268cd9f789c037ce4.lock ADDED Viewed

File without changes

models--psd401--llama3-2-1b-Solutions/.no_exist/8813c4cef407330136f13ab6ed5b83fd989f093e/README.md ADDED Viewed

File without changes

models--psd401--llama3-2-1b-Solutions/.no_exist/8813c4cef407330136f13ab6ed5b83fd989f093e/adapter_config.json ADDED Viewed

File without changes

models--psd401--llama3-2-1b-Solutions/.no_exist/8813c4cef407330136f13ab6ed5b83fd989f093e/adapter_model.safetensors ADDED Viewed

File without changes

models--psd401--llama3-2-1b-Solutions/.no_exist/8813c4cef407330136f13ab6ed5b83fd989f093e/config.json ADDED Viewed

File without changes

models--psd401--llama3-2-1b-Solutions/.no_exist/8813c4cef407330136f13ab6ed5b83fd989f093e/generation_config.json ADDED Viewed

File without changes

models--psd401--llama3-2-1b-Solutions/.no_exist/8813c4cef407330136f13ab6ed5b83fd989f093e/special_tokens_map.json ADDED Viewed

File without changes

models--psd401--llama3-2-1b-Solutions/.no_exist/8813c4cef407330136f13ab6ed5b83fd989f093e/tokenizer.json ADDED Viewed

File without changes

models--psd401--llama3-2-1b-Solutions/.no_exist/8813c4cef407330136f13ab6ed5b83fd989f093e/tokenizer_config.json ADDED Viewed

File without changes

models--psd401--llama3-2-1b-Solutions/.no_exist/8813c4cef407330136f13ab6ed5b83fd989f093e/training_args.bin ADDED Viewed

File without changes

models--psd401--llama3-2-1b-Solutions/blobs/ef85b799c596b5809377eb3268cd9f789c037ce4 ADDED Viewed

+{
+    "model": "meta-llama/Llama-3.2-1B-Instruct",
+    "project_name": "llama3-2-1b-Solutions",
+    "data_path": "psd401/PSD401SolutionsData",
+    "train_split": "train",
+    "valid_split": null,
+    "add_eos_token": true,
+    "block_size": -1,
+    "model_max_length": 2048,
+    "padding": "right",
+    "trainer": "sft",
+    "use_flash_attention_2": false,
+    "log": "tensorboard",
+    "disable_gradient_checkpointing": false,
+    "logging_steps": -1,
+    "eval_strategy": "epoch",
+    "save_total_limit": 1,
+    "auto_find_batch_size": false,
+    "mixed_precision": "bf16",
+    "lr": 0.00001,
+    "epochs": 3,
+    "batch_size": 1,
+    "warmup_ratio": 0.1,
+    "gradient_accumulation": 8,
+    "optimizer": "paged_adamw_8bit",
+    "scheduler": "cosine",
+    "weight_decay": 0.0,
+    "max_grad_norm": 1.0,
+    "seed": 42,
+    "chat_template": "tokenizer",
+    "quantization": "int8",
+    "target_modules": "all-linear",
+    "merge_adapter": true,
+    "peft": true,
+    "lora_r": 16,
+    "lora_alpha": 32,
+    "lora_dropout": 0.05,
+    "model_ref": null,
+    "dpo_beta": 0.1,
+    "max_prompt_length": 128,
+    "max_completion_length": null,
+    "prompt_text_column": null,
+    "text_column": "messages",
+    "rejected_text_column": null,
+    "push_to_hub": false,
+    "username": null,
+    "token": null,
+    "unsloth": false,
+    "distributed_backend": null
+}

models--psd401--llama3-2-1b-Solutions/refs/main CHANGED Viewed

	@@ -1 +1 @@
1	- ~~94115ce35647c6da6fdd605765875b74579ba563~~


1	+ 8813c4cef407330136f13ab6ed5b83fd989f093e

models--psd401--llama3-2-1b-Solutions/snapshots/8813c4cef407330136f13ab6ed5b83fd989f093e/training_params.json ADDED Viewed

+{
+    "model": "meta-llama/Llama-3.2-1B-Instruct",
+    "project_name": "llama3-2-1b-Solutions",
+    "data_path": "psd401/PSD401SolutionsData",
+    "train_split": "train",
+    "valid_split": null,
+    "add_eos_token": true,
+    "block_size": -1,
+    "model_max_length": 2048,
+    "padding": "right",
+    "trainer": "sft",
+    "use_flash_attention_2": false,
+    "log": "tensorboard",
+    "disable_gradient_checkpointing": false,
+    "logging_steps": -1,
+    "eval_strategy": "epoch",
+    "save_total_limit": 1,
+    "auto_find_batch_size": false,
+    "mixed_precision": "bf16",
+    "lr": 0.00001,
+    "epochs": 3,
+    "batch_size": 1,
+    "warmup_ratio": 0.1,
+    "gradient_accumulation": 8,
+    "optimizer": "paged_adamw_8bit",
+    "scheduler": "cosine",
+    "weight_decay": 0.0,
+    "max_grad_norm": 1.0,
+    "seed": 42,
+    "chat_template": "tokenizer",
+    "quantization": "int8",
+    "target_modules": "all-linear",
+    "merge_adapter": true,
+    "peft": true,
+    "lora_r": 16,
+    "lora_alpha": 32,
+    "lora_dropout": 0.05,
+    "model_ref": null,
+    "dpo_beta": 0.1,
+    "max_prompt_length": 128,
+    "max_completion_length": null,
+    "prompt_text_column": null,
+    "text_column": "messages",
+    "rejected_text_column": null,
+    "push_to_hub": false,
+    "username": null,
+    "token": null,
+    "unsloth": false,
+    "distributed_backend": null
+}