Spaces:
Running
Running
Update defaults: learning rate 3e-4, rank 32, alpha = 2 × rank (per Side-Step author)
Browse files
app.py
CHANGED
|
@@ -546,7 +546,7 @@ def gradio_main():
|
|
| 546 |
epochs=epochs,
|
| 547 |
lr=lr,
|
| 548 |
rank=rank,
|
| 549 |
-
alpha=rank,
|
| 550 |
dropout=0.0,
|
| 551 |
batch_size=1,
|
| 552 |
gradient_accumulation_steps=4,
|
|
@@ -716,10 +716,10 @@ def gradio_main():
|
|
| 716 |
label="Epochs", minimum=1, maximum=1000,
|
| 717 |
value=3, step=1,
|
| 718 |
)
|
| 719 |
-
train_lr = gr.Number(label="Learning Rate", value=
|
| 720 |
train_rank = gr.Slider(
|
| 721 |
-
label="Rank (r)", minimum=1, maximum=
|
| 722 |
-
value=
|
| 723 |
)
|
| 724 |
|
| 725 |
with gr.Row(elem_classes="compact-row"):
|
|
|
|
| 546 |
epochs=epochs,
|
| 547 |
lr=lr,
|
| 548 |
rank=rank,
|
| 549 |
+
alpha=rank * 2,
|
| 550 |
dropout=0.0,
|
| 551 |
batch_size=1,
|
| 552 |
gradient_accumulation_steps=4,
|
|
|
|
| 716 |
label="Epochs", minimum=1, maximum=1000,
|
| 717 |
value=3, step=1,
|
| 718 |
)
|
| 719 |
+
train_lr = gr.Number(label="Learning Rate", value=3e-4)
|
| 720 |
train_rank = gr.Slider(
|
| 721 |
+
label="Rank (r)", minimum=1, maximum=128,
|
| 722 |
+
value=32, step=1,
|
| 723 |
)
|
| 724 |
|
| 725 |
with gr.Row(elem_classes="compact-row"):
|