Nekochu committed on
Commit
04c031f
·
1 Parent(s): d42aa91

Update defaults: LR 3e-4, rank 32 (slider max raised from 64 to 128), alpha = 2 × rank (per Side-Step author)

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -546,7 +546,7 @@ def gradio_main():
546
  epochs=epochs,
547
  lr=lr,
548
  rank=rank,
549
- alpha=rank,
550
  dropout=0.0,
551
  batch_size=1,
552
  gradient_accumulation_steps=4,
@@ -716,10 +716,10 @@ def gradio_main():
716
  label="Epochs", minimum=1, maximum=1000,
717
  value=3, step=1,
718
  )
719
- train_lr = gr.Number(label="Learning Rate", value=1e-4)
720
  train_rank = gr.Slider(
721
- label="Rank (r)", minimum=1, maximum=64,
722
- value=16, step=1,
723
  )
724
 
725
  with gr.Row(elem_classes="compact-row"):
 
546
  epochs=epochs,
547
  lr=lr,
548
  rank=rank,
549
+ alpha=rank * 2,
550
  dropout=0.0,
551
  batch_size=1,
552
  gradient_accumulation_steps=4,
 
716
  label="Epochs", minimum=1, maximum=1000,
717
  value=3, step=1,
718
  )
719
+ train_lr = gr.Number(label="Learning Rate", value=3e-4)
720
  train_rank = gr.Slider(
721
+ label="Rank (r)", minimum=1, maximum=128,
722
+ value=32, step=1,
723
  )
724
 
725
  with gr.Row(elem_classes="compact-row"):