tricktreat committed on
Commit
a4a02e4
1 Parent(s): c0ed9c6

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +22 -1
README.md CHANGED
@@ -1,8 +1,29 @@
1
  ---
2
  library_name: peft
3
- base_model: guanaco_Llama-2-7b-chat-hf_freeze_embed_tokens_q_v_proj
 
4
  ---
5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6
  # Model Card for Model ID
7
 
8
  <!-- Provide a quick summary of what the model is/does. -->
 
1
  ---
2
  library_name: peft
3
+ base_model: tricktreat/Llama-2-7b-chat-hf-guanaco-freeze-embed-tokens-q-v-proj
4
+ license: apache-2.0
5
  ---
6
 
7
+ # Training
8
+
9
+ ```bash
10
+ deepspeed --include=node-0:3 --master_port=12001 sft_prompt_tuning.py --deepspeed dp_zero0.json \
11
+ --model_name_or_path="guanaco_Llama-2-7b-chat-hf_freeze_embed_tokens_q_v_proj" \
12
+ --dataset_name="timdettmers/openassistant-guanaco" \
13
+ --dataset_text_field="text" \
14
+ --report_to="tensorboard" \
15
+ --learning_rate=1e-5 \
16
+ --per_device_train_batch_size=32 \
17
+ --gradient_accumulation_steps=4 \
18
+ --output_dir="guanaco_Llama-2-7b-chat-hf_freeze_embed_tokens_q_v_projs_prompttuning" \
19
+ --logging_steps=1 \
20
+ --num_train_epochs=15 \
21
+ --max_steps=-1 \
22
+ --save_steps=0.3 \
23
+ --gradient_checkpointing \
24
+ --fp16
25
+ ```
26
+
27
  # Model Card for Model ID
28
 
29
  <!-- Provide a quick summary of what the model is/does. -->