ribesstefano commited on
Commit
1a52d24
·
verified ·
1 Parent(s): 3e0993c

Training in progress, step 5000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:66aa69c6aaea9c3f43fcbb61232c4f6be0ad63939e2948af761ca5ed8f362f49
3
  size 409608164
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afe9292cb16f6f6dee824dc08aadbb1c611c31986da611344faf125b15d5879d
3
  size 409608164
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91541c07eb7e3bf0aa7fc5915be7e455c4f07451374b81c7cd866d04ea8fd962
3
  size 814647162
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d970277ab277da4a302ec9754c9012b105fa92af9c6209062f67c3e4a508d75b
3
  size 814647162
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f294bf906f6c9e7b32fccab7328465e8e4b434c32a973d1cc6684f0187d99dd4
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbe8ab180daf6fea30575d831f91f1de7eb9d7b789eecb0d5221fe9efa820f08
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4da18a6f8a6db8955c278a8d0efe2d6193cd4355e0f3807dd771856fd055aa46
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c3af5bdcc9c194cb334426a90ed6c0eb206e307298871d9d80a97054340126b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,278 +1,124 @@
1
  {
2
- "best_metric": 0.19496243923994697,
3
- "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_cosine_restarts-opt25/trial-number=24-learning_rate=1.2e-05-warmup_ratio=0.020-num_cycles=9/checkpoint-10000",
4
- "epoch": 0.9863878477017163,
5
  "eval_steps": 2500,
6
- "global_step": 10000,
7
- "is_hyper_param_search": true,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.049319392385085814,
13
- "grad_norm": 1.1682956218719482,
14
- "learning_rate": 8.609489056175177e-06,
15
- "loss": 2.1752,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.09863878477017163,
20
- "grad_norm": 1.1533381938934326,
21
- "learning_rate": 9.656008727064383e-07,
22
- "loss": 0.672,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.14795817715525744,
27
- "grad_norm": 0.9731566905975342,
28
- "learning_rate": 1.0065956095929134e-05,
29
- "loss": 0.5459,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.19727756954034326,
34
- "grad_norm": 0.7106562256813049,
35
- "learning_rate": 2.0993649965972538e-06,
36
- "loss": 0.3736,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.24659696192542907,
41
- "grad_norm": 0.980603039264679,
42
- "learning_rate": 1.1199720219819944e-05,
43
- "loss": 0.3217,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.2959163543105149,
48
- "grad_norm": 0.6568108201026917,
49
- "learning_rate": 3.555832036351209e-06,
50
- "loss": 0.2471,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.3452357466956007,
55
- "grad_norm": 0.583015501499176,
56
- "learning_rate": 1.1918930601284844e-05,
57
- "loss": 0.2145,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 0.3945551390806865,
62
- "grad_norm": 0.5566324591636658,
63
- "learning_rate": 5.2170076943504535e-06,
64
- "loss": 0.1804,
65
  "step": 4000
66
  },
67
  {
68
  "epoch": 0.4438745314657723,
69
- "grad_norm": 0.5157020092010498,
70
- "learning_rate": 1.2165321092526382e-05,
71
- "loss": 0.155,
72
  "step": 4500
73
  },
74
  {
75
  "epoch": 0.49319392385085814,
76
- "grad_norm": 0.516018271446228,
77
- "learning_rate": 6.948313398175921e-06,
78
- "loss": 0.1403,
79
  "step": 5000
80
  },
81
  {
82
  "epoch": 0.49319392385085814,
83
- "eval_all_ligands_equal": 0.006098099867432612,
84
- "eval_e3_equal": 0.43163941670349093,
85
- "eval_e3_graph_edit_distance": 9.999999999999999e+63,
86
- "eval_e3_graph_edit_distance_norm": 1.0,
87
- "eval_e3_has_attachment_point(s)": 0.9950508174988952,
88
- "eval_e3_heavy_atoms_difference": -0.6882015024304021,
89
- "eval_e3_heavy_atoms_difference_norm": -0.043577084852665905,
90
  "eval_e3_tanimoto_similarity": 0.0,
91
- "eval_e3_valid": 0.9950508174988952,
92
- "eval_has_all_attachment_points": 0.9637649138311976,
93
- "eval_has_three_substructures": 0.996464869642068,
94
- "eval_heavy_atoms_difference": 16.120282810428634,
95
- "eval_heavy_atoms_difference_norm": 0.20922444422385186,
96
- "eval_linker_equal": 0.023862129916040652,
97
- "eval_linker_graph_edit_distance": 9.999999999999999e+63,
98
- "eval_linker_graph_edit_distance_norm": 1.0,
99
- "eval_linker_has_attachment_point(s)": 0.9878921785240831,
100
- "eval_linker_heavy_atoms_difference": 3.8430402121078213,
101
- "eval_linker_heavy_atoms_difference_norm": 0.15478254398680125,
102
  "eval_linker_tanimoto_similarity": 0.0,
103
- "eval_linker_valid": 0.9878921785240831,
104
- "eval_loss": 0.33513495326042175,
105
- "eval_num_fragments": 2.9966416261599647,
106
- "eval_poi_equal": 0.41555457357490055,
107
- "eval_poi_graph_edit_distance": 9.999999999999999e+63,
108
- "eval_poi_graph_edit_distance_norm": 1.0,
109
- "eval_poi_has_attachment_point(s)": 0.8372072470172338,
110
- "eval_poi_heavy_atoms_difference": 5.426336721166593,
111
- "eval_poi_heavy_atoms_difference_norm": 0.16311688485735315,
112
  "eval_poi_tanimoto_similarity": 0.0,
113
- "eval_poi_valid": 0.8372072470172338,
114
- "eval_reassembly": 0.0061864781263809105,
115
- "eval_reassembly_nostereo": 0.00821917808219178,
116
- "eval_runtime": 1598.5131,
117
- "eval_samples_per_second": 7.078,
118
- "eval_steps_per_second": 0.111,
119
  "eval_tanimoto_similarity": 0.0,
120
- "eval_valid": 0.830490499337163,
121
  "step": 5000
122
- },
123
- {
124
- "epoch": 0.542513316235944,
125
- "grad_norm": 0.4676644504070282,
126
- "learning_rate": 2.46390491241543e-07,
127
- "loss": 0.1194,
128
- "step": 5500
129
- },
130
- {
131
- "epoch": 0.5918327086210298,
132
- "grad_norm": 0.4235730469226837,
133
- "learning_rate": 8.609489056175182e-06,
134
- "loss": 0.1113,
135
- "step": 6000
136
- },
137
- {
138
- "epoch": 0.6411521010061156,
139
- "grad_norm": 0.36409395933151245,
140
- "learning_rate": 9.656008727064383e-07,
141
- "loss": 0.0943,
142
- "step": 6500
143
- },
144
- {
145
- "epoch": 0.6904714933912014,
146
- "grad_norm": 0.45415812730789185,
147
- "learning_rate": 1.0065956095929123e-05,
148
- "loss": 0.0884,
149
- "step": 7000
150
- },
151
- {
152
- "epoch": 0.7397908857762873,
153
- "grad_norm": 0.2938048243522644,
154
- "learning_rate": 2.0993649965972457e-06,
155
- "loss": 0.0749,
156
- "step": 7500
157
- },
158
- {
159
- "epoch": 0.7397908857762873,
160
- "eval_all_ligands_equal": 0.07954043305346885,
161
- "eval_e3_equal": 0.5972602739726027,
162
- "eval_e3_graph_edit_distance": 9.999999999999999e+63,
163
- "eval_e3_graph_edit_distance_norm": 1.0,
164
- "eval_e3_has_attachment_point(s)": 0.9971718957136544,
165
- "eval_e3_heavy_atoms_difference": -0.43817940786566506,
166
- "eval_e3_heavy_atoms_difference_norm": -0.031709951383128494,
167
- "eval_e3_tanimoto_similarity": 0.0,
168
- "eval_e3_valid": 0.9971718957136544,
169
- "eval_has_all_attachment_points": 0.9825011047282368,
170
- "eval_has_three_substructures": 0.9985859478568272,
171
- "eval_heavy_atoms_difference": 9.341935483870968,
172
- "eval_heavy_atoms_difference_norm": 0.12436168186436197,
173
- "eval_linker_equal": 0.14891736632788333,
174
- "eval_linker_graph_edit_distance": 9.999999999999999e+63,
175
- "eval_linker_graph_edit_distance_norm": 1.0,
176
- "eval_linker_has_attachment_point(s)": 0.9946973044631021,
177
- "eval_linker_heavy_atoms_difference": 1.7425541316836057,
178
- "eval_linker_heavy_atoms_difference_norm": 0.0540184783099769,
179
- "eval_linker_tanimoto_similarity": 0.0,
180
- "eval_linker_valid": 0.9946973044631021,
181
- "eval_loss": 0.3053259253501892,
182
- "eval_num_fragments": 2.999646486964207,
183
- "eval_poi_equal": 0.5743703049049934,
184
- "eval_poi_graph_edit_distance": 9.999999999999999e+63,
185
- "eval_poi_graph_edit_distance_norm": 1.0,
186
- "eval_poi_has_attachment_point(s)": 0.8965090587715422,
187
- "eval_poi_heavy_atoms_difference": 3.1149801148917367,
188
- "eval_poi_heavy_atoms_difference_norm": 0.09925725919495766,
189
- "eval_poi_tanimoto_similarity": 0.0,
190
- "eval_poi_valid": 0.8965090587715422,
191
- "eval_reassembly": 0.08166151126822802,
192
- "eval_reassembly_nostereo": 0.09863013698630137,
193
- "eval_runtime": 1544.4861,
194
- "eval_samples_per_second": 7.326,
195
- "eval_steps_per_second": 0.115,
196
- "eval_tanimoto_similarity": 0.0,
197
- "eval_valid": 0.8929739284136102,
198
- "step": 7500
199
- },
200
- {
201
- "epoch": 0.789110278161373,
202
- "grad_norm": 0.38644686341285706,
203
- "learning_rate": 1.1199720219819944e-05,
204
- "loss": 0.0697,
205
- "step": 8000
206
- },
207
- {
208
- "epoch": 0.8384296705464589,
209
- "grad_norm": 0.2929253578186035,
210
- "learning_rate": 3.5558320363512003e-06,
211
- "loss": 0.0612,
212
- "step": 8500
213
- },
214
- {
215
- "epoch": 0.8877490629315447,
216
- "grad_norm": 0.5124661326408386,
217
- "learning_rate": 1.1918930601284838e-05,
218
- "loss": 0.0554,
219
- "step": 9000
220
- },
221
- {
222
- "epoch": 0.9370684553166305,
223
- "grad_norm": 0.2770146429538727,
224
- "learning_rate": 5.217007694350461e-06,
225
- "loss": 0.0511,
226
- "step": 9500
227
- },
228
- {
229
- "epoch": 0.9863878477017163,
230
- "grad_norm": 0.29158660769462585,
231
- "learning_rate": 0.0,
232
- "loss": 0.0448,
233
- "step": 10000
234
- },
235
- {
236
- "epoch": 0.9863878477017163,
237
- "eval_all_ligands_equal": 0.19496243923994697,
238
- "eval_e3_equal": 0.6822801590808661,
239
- "eval_e3_graph_edit_distance": 9.999999999999999e+63,
240
- "eval_e3_graph_edit_distance_norm": 1.0,
241
- "eval_e3_has_attachment_point(s)": 0.9961997348652232,
242
- "eval_e3_heavy_atoms_difference": -0.20821917808219179,
243
- "eval_e3_heavy_atoms_difference_norm": -0.020312192895071864,
244
- "eval_e3_tanimoto_similarity": 0.0,
245
- "eval_e3_valid": 0.9961997348652232,
246
- "eval_has_all_attachment_points": 0.9850640742377376,
247
- "eval_has_three_substructures": 0.9984975695978789,
248
- "eval_heavy_atoms_difference": 7.780291648254529,
249
- "eval_heavy_atoms_difference_norm": 0.10405481436831165,
250
- "eval_linker_equal": 0.30746796288113126,
251
- "eval_linker_graph_edit_distance": 9.999999999999999e+63,
252
- "eval_linker_graph_edit_distance_norm": 1.0,
253
- "eval_linker_has_attachment_point(s)": 0.9946973044631021,
254
- "eval_linker_heavy_atoms_difference": 1.0045956694653115,
255
- "eval_linker_heavy_atoms_difference_norm": 0.020478695715494242,
256
- "eval_linker_tanimoto_similarity": 0.0,
257
- "eval_linker_valid": 0.9946973044631021,
258
- "eval_loss": 0.29711082577705383,
259
- "eval_num_fragments": 3.0000883782589485,
260
- "eval_poi_equal": 0.6341140079540433,
261
- "eval_poi_graph_edit_distance": 9.999999999999999e+63,
262
- "eval_poi_graph_edit_distance_norm": 1.0,
263
- "eval_poi_has_attachment_point(s)": 0.9104728236853734,
264
- "eval_poi_heavy_atoms_difference": 2.697923110914715,
265
- "eval_poi_heavy_atoms_difference_norm": 0.08519220092920521,
266
- "eval_poi_tanimoto_similarity": 0.0,
267
- "eval_poi_valid": 0.9104728236853734,
268
- "eval_reassembly": 0.19902783915156871,
269
- "eval_reassembly_nostereo": 0.22315510384445428,
270
- "eval_runtime": 1514.5071,
271
- "eval_samples_per_second": 7.471,
272
- "eval_steps_per_second": 0.117,
273
- "eval_tanimoto_similarity": 0.0,
274
- "eval_valid": 0.9057003977021653,
275
- "step": 10000
276
  }
277
  ],
278
  "logging_steps": 500,
@@ -287,17 +133,13 @@
287
  "should_evaluate": false,
288
  "should_log": false,
289
  "should_save": true,
290
- "should_training_stop": true
291
  },
292
  "attributes": {}
293
  }
294
  },
295
- "total_flos": 8.663036348367667e+16,
296
  "train_batch_size": 128,
297
- "trial_name": "trial-number=24-learning_rate=1.2e-05-warmup_ratio=0.020-num_cycles=9",
298
- "trial_params": {
299
- "learning_rate": 1.2165321092526382e-05,
300
- "num_cycles": 9,
301
- "warmup_ratio": 0.02
302
- }
303
  }
 
1
  {
2
+ "best_metric": 0.45963172804532576,
3
+ "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_cosine_restarts-opt25/checkpoint-5000",
4
+ "epoch": 0.49319392385085814,
5
  "eval_steps": 2500,
6
+ "global_step": 5000,
7
+ "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.049319392385085814,
13
+ "grad_norm": 0.7575409412384033,
14
+ "learning_rate": 4.465132736856968e-05,
15
+ "loss": 1.4495,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.09863878477017163,
20
+ "grad_norm": 0.6125224232673645,
21
+ "learning_rate": 8.628481651367859e-06,
22
+ "loss": 0.3014,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.14795817715525744,
27
+ "grad_norm": 0.5499436259269714,
28
+ "learning_rate": 4.3093350952626764e-05,
29
+ "loss": 0.1515,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.19727756954034326,
34
+ "grad_norm": 0.28163060545921326,
35
+ "learning_rate": 6.906649047373284e-06,
36
+ "loss": 0.0885,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.24659696192542907,
41
+ "grad_norm": 0.26792627573013306,
42
+ "learning_rate": 4.137151834863209e-05,
43
+ "loss": 0.0576,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.2959163543105149,
48
+ "grad_norm": 0.23422876000404358,
49
+ "learning_rate": 5.348672631430346e-06,
50
+ "loss": 0.0408,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.3452357466956007,
55
+ "grad_norm": 0.25026798248291016,
56
+ "learning_rate": 3.9501422739279976e-05,
57
+ "loss": 0.0302,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 0.3945551390806865,
62
+ "grad_norm": 0.18633298575878143,
63
+ "learning_rate": 3.968661679220468e-06,
64
+ "loss": 0.0237,
65
  "step": 4000
66
  },
67
  {
68
  "epoch": 0.4438745314657723,
69
+ "grad_norm": 0.21757744252681732,
70
+ "learning_rate": 3.750000000000008e-05,
71
+ "loss": 0.0193,
72
  "step": 4500
73
  },
74
  {
75
  "epoch": 0.49319392385085814,
76
+ "grad_norm": 0.14472977817058563,
77
+ "learning_rate": 2.77911378362688e-06,
78
+ "loss": 0.0156,
79
  "step": 5000
80
  },
81
  {
82
  "epoch": 0.49319392385085814,
83
+ "eval_all_ligands_equal": 0.45963172804532576,
84
+ "eval_e3_equal": 0.7815155807365439,
85
+ "eval_e3_graph_edit_distance": Infinity,
86
+ "eval_e3_graph_edit_distance_norm": Infinity,
87
+ "eval_e3_has_attachment_point(s)": 0.9915899433427762,
88
+ "eval_e3_heavy_atoms_difference": 0.39128895184135976,
89
+ "eval_e3_heavy_atoms_difference_norm": 0.006079141519917903,
90
  "eval_e3_tanimoto_similarity": 0.0,
91
+ "eval_e3_valid": 0.9915899433427762,
92
+ "eval_has_all_attachment_points": 0.986278328611898,
93
+ "eval_has_three_substructures": 0.9988491501416431,
94
+ "eval_heavy_atoms_difference": 7.0030099150141645,
95
+ "eval_heavy_atoms_difference_norm": 0.09184213866701363,
96
+ "eval_linker_equal": 0.6622698300283286,
97
+ "eval_linker_graph_edit_distance": 3.5410764872521247e+61,
98
+ "eval_linker_graph_edit_distance_norm": Infinity,
99
+ "eval_linker_has_attachment_point(s)": 0.9964589235127479,
100
+ "eval_linker_heavy_atoms_difference": 0.38048866855524077,
101
+ "eval_linker_heavy_atoms_difference_norm": 0.0004655148396369131,
102
  "eval_linker_tanimoto_similarity": 0.0,
103
+ "eval_linker_valid": 0.9964589235127479,
104
+ "eval_loss": 0.28911474347114563,
105
+ "eval_num_fragments": 3.000619688385269,
106
+ "eval_poi_equal": 0.7265403682719547,
107
+ "eval_poi_graph_edit_distance": Infinity,
108
+ "eval_poi_graph_edit_distance_norm": Infinity,
109
+ "eval_poi_has_attachment_point(s)": 0.9251947592067988,
110
+ "eval_poi_heavy_atoms_difference": 2.3129426345609065,
111
+ "eval_poi_heavy_atoms_difference_norm": 0.07392839153429423,
112
  "eval_poi_tanimoto_similarity": 0.0,
113
+ "eval_poi_valid": 0.9251947592067988,
114
+ "eval_reassembly": 0.4665368271954674,
115
+ "eval_reassembly_nostereo": 0.4910587818696884,
116
+ "eval_runtime": 2426.7651,
117
+ "eval_samples_per_second": 4.655,
118
+ "eval_steps_per_second": 0.073,
119
  "eval_tanimoto_similarity": 0.0,
120
+ "eval_valid": 0.9168732294617564,
121
  "step": 5000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
122
  }
123
  ],
124
  "logging_steps": 500,
 
133
  "should_evaluate": false,
134
  "should_log": false,
135
  "should_save": true,
136
+ "should_training_stop": false
137
  },
138
  "attributes": {}
139
  }
140
  },
141
+ "total_flos": 4.33139477262336e+16,
142
  "train_batch_size": 128,
143
+ "trial_name": null,
144
+ "trial_params": null
 
 
 
 
145
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18d8632640bbe126885af10bd60f2424fb195aa4218c094577172b919da3113f
3
  size 7480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64c5622356e7cd4fe22546f63bc083b851b2422c7b250f26dca95392b1010ffa
3
  size 7480