We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 1ec7804, commit a1bfee9 (Copy full SHA for a1bfee9)
sweeps/transformer.yaml
@@ -12,15 +12,15 @@ metric:
12
name: Val/loss
13
parameters:
14
trainer.max_epochs:
15
- value: 35000
+ value: 50000
16
model.dim_model:
17
- value: 8
+ value: 10
18
model.num_heads:
19
- value: 4
+ value: 5
20
model.dim_feedforward:
21
value: 1024
22
model.num_decoder_layers:
23
- value: 3
24
model.dropout_p:
25
value: 0.1
26
model.test_prompt_length:
@@ -31,6 +31,10 @@ parameters:
31
value: 0.002
32
model.layer_norm_eps:
33
value: 6e-3
34
+ model.adversarial_training:
35
+ value: false
36
+ model.extrapolation_training:
37
38
data.max_length:
39
value: 256
40
data.batch_size:
0 commit comments