-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathresults_torch_q_unfrozen.json
More file actions
89 lines (89 loc) · 1.88 KB
/
Copy pathresults_torch_q_unfrozen.json
File metadata and controls
89 lines (89 loc) · 1.88 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
{
"results": {
"L0": {
"train": [
0.1095681644976139,
0.12120531469583512,
0.09855730962008238
],
"val": [
0.1069627777673304,
0.12103371061384678,
0.1112413645721972
],
"n_params": 11617,
"train_mean": 0.10977692960451046,
"val_mean": 0.11307928431779146
},
"L1": {
"train": [
0.10707426002249122,
0.10433656617999076,
0.09862479900941253
],
"val": [
0.09411124289035797,
0.11662751976400614,
0.10126861715689302
],
"n_params": 10593,
"train_mean": 0.10334520840396484,
"val_mean": 0.10400245993708572
},
"L3": {
"train": [
2.5881427192687987,
2.5479656267166138,
2.5295474338531494
],
"val": [
2.5645218968391417,
2.625992774963379,
2.5610082149505615
],
"n_params": 8545,
"train_mean": 2.5552185932795206,
"val_mean": 2.583840962251027
},
"L5": {
"train": [
0.7723635441064834,
2.5342285442352295,
2.5166834115982057
],
"val": [
0.7477515071630478,
2.635182094573975,
2.543583881855011
],
"n_params": 9569,
"train_mean": 1.9410918333133063,
"val_mean": 1.9755058278640112
},
"L6": {
"train": [
0.6715569049119949,
2.519856564998627,
2.505311279296875
],
"val": [
0.6756465345621109,
2.6699543237686156,
2.536313998699188
],
"n_params": 9570,
"train_mean": 1.8989082497358323,
"val_mean": 1.9606382856766382
}
},
"config": {
"seeds": "42,7,123",
"steps": 1500,
"lr": 0.005,
"seq_len": 32,
"d_model": 32,
"ff_dim": 64,
"variants": "L0,L1,L3,L5,L6",
"out": "results_torch_q_unfrozen.json"
}
}