We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 280e2a1 · commit f5e51ba · Copy full SHA for f5e51ba
src/thunder/config/adaptation/lora.yaml
@@ -5,6 +5,6 @@ lora_alpha: 16
5
# Hyperparameters
6
batch_size: 2
7
num_workers: 2
8
-lr: [1e-5, 1e-6, 1e-7]
+lr: [1e-3, 1e-4, 1e-5]
9
weight_decay: [0.0, 1e-3, 1e-4]
10
epochs: 20
src/thunder/models/adapters.py
@@ -114,7 +114,7 @@ def __init__(
114
std = torch.sqrt(torch.tensor(rank).float())
115
self.A = torch.nn.Parameter(torch.randn(in_dim, rank) / std)
116
self.B = torch.nn.Parameter(torch.zeros(rank, out_dim))
117
- self.alpha = alpha
+ self.alpha = alpha / rank
118
119
def forward(self, src: torch.Tensor) -> torch.Tensor:
120
"""
0 commit comments