Oimos
/

llm-jp-3-13b-it_lora

text-generation-inference

Inference Endpoints

Model card Files and versions Community

Oimos committed on Dec 16, 2024

Commit

5f73776

·

verified ·

1 Parent(s): b735d84

Update README.md

Files changed (1) hide show

README.md +5 -7

README.md CHANGED Viewed

@@ -60,9 +60,9 @@ if torch.cuda.get_device_capability()[0] >= 8:
 from unsloth import FastLanguageModel
 import torch
-# max_seq_length = 512 # unslothではRoPEをサポートしているのでコンテキスト長は自由に設定可能
 # 1024に増やしてみる
-max_seq_length = 1024
 dtype = None # Noneにしておけば自動で設定
 load_in_4bit = True # 今回は13Bモデルを扱うためTrue
@@ -120,7 +120,6 @@ prompt = """### 指示
 ### 回答
 {}"""
 """
 formatting_prompts_func: 各データをプロンプトに合わせた形式に合わせる
 """
@@ -135,7 +134,7 @@ pass
 # # 各データにフォーマットを適用
 dataset = dataset.map(
     formatting_prompts_func,
-    num_proc= 4, # 並列処理数を指定
 )
 dataset
@@ -143,7 +142,6 @@ dataset
 # データを確認
 print(dataset["train"]["formatted_text"][3])
-"""
 """
 training_arguments: 学習の設定
@@ -218,9 +216,9 @@ trainer = SFTTrainer(
     args = TrainingArguments(
         per_device_train_batch_size = 2,
         gradient_accumulation_steps = 4,
-        # num_train_epochs = 1,
         # epochを増やす
-        num_train_epochs = 5,
         logging_steps = 10,
         warmup_steps = 10,
         save_steps=100,

 from unsloth import FastLanguageModel
 import torch
+max_seq_length = 512 # unslothではRoPEをサポートしているのでコンテキスト長は自由に設定可能
 # 1024に増やしてみる
+# max_seq_length = 1024
 dtype = None # Noneにしておけば自動で設定
 load_in_4bit = True # 今回は13Bモデルを扱うためTrue
 ### 回答
 {}"""
 """
 formatting_prompts_func: 各データをプロンプトに合わせた形式に合わせる
 """
 # # 各データにフォーマットを適用
 dataset = dataset.map(
     formatting_prompts_func,
+    # num_proc= 4, # 並列処理数を指定
 )
 dataset
 # データを確認
 print(dataset["train"]["formatted_text"][3])
 """
 training_arguments: 学習の設定
     args = TrainingArguments(
         per_device_train_batch_size = 2,
         gradient_accumulation_steps = 4,
+        num_train_epochs = 1,
         # epochを増やす
+        # num_train_epochs = 5,
         logging_steps = 10,
         warmup_steps = 10,
         save_steps=100,