-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathresults_torch_substrate_softmax.json
More file actions
79 lines (79 loc) · 1.69 KB
/
results_torch_substrate_softmax.json
File metadata and controls
79 lines (79 loc) · 1.69 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
{
"results": {
"softmax": {
"train": [
3.286557741165161,
3.1191217947006225,
2.883688154220581
],
"val": [
3.343192450205485,
2.996395452817281,
2.9558159987131756
],
"n_params": 33793,
"train_mean": 3.096455896695455,
"val_mean": 3.098467967245314,
"val_std": 0.2129066167218368
},
"smod": {
"train": [
3.1185076236724854,
3.2255805063247682,
2.633924136161804
],
"val": [
3.19204466342926,
3.0865708192189536,
2.620266048113505
],
"n_params": 33793,
"train_mean": 2.9926707553863525,
"val_mean": 2.9662938435872395,
"val_std": 0.3042739051963452
},
"ssnap": {
"train": [
3.285893063545227,
3.2220983839035036,
2.802310576438904
],
"val": [
3.342144997914632,
3.0825433492660523,
2.8597730795542398
],
"n_params": 33793,
"train_mean": 3.103434007962545,
"val_mean": 3.094820475578308,
"val_std": 0.24142019960752362
},
"srank": {
"train": [
3.2800048542022706,
3.232453718185425,
3.2827095651626585
],
"val": [
3.340387765566508,
3.091373840967814,
3.3481504599253338
],
"n_params": 33793,
"train_mean": 3.265056045850118,
"val_mean": 3.259970688819885,
"val_std": 0.14606073286536667
}
},
"config": {
"seeds": "42,7,123",
"steps": 1500,
"lr": 0.005,
"seq_len": 32,
"d_model": 32,
"n_heads": 4,
"ff_dim": 64,
"n_blocks": 4,
"out": "results_torch_substrate_softmax.json"
}
}