ribesstefano commited on
Commit
b0f1cd0
·
verified ·
1 Parent(s): f814c62

Training in progress, step 100000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ed51e1ba85f76a635d5a4b2a2391f7569c86dcbec7e8462be43c05a028f2b92
3
  size 409608164
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98759b2d7ebc1d279e01894e895488231ca886295ea5febbef75377b3c17846e
3
  size 409608164
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ff468b57d7d38029e80e932afebd1303c6c991cc99b4531d000cb90d3c844ac
3
  size 814647162
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cfe49edb2c5cdd32ea816756e7d42933808a9b4a91e32bcea425f1ff6d3320f
3
  size 814647162
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35f5729f689be2bbffa9964aeb321f5783ac9d47f55dce0a0ce5ba77dbc5b474
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23cc08fa295f1f61f14d032299f4a12f1ac03252919134b2e30f6532808f7457
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa6c62e484d18fd65a9b7d67344c5142e2d88165c2f53674e02273b93133c9c8
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18ea3abbc14ac3d713f060ff2fd846183e96ea3ca75c3d268b653d81e7259f7c
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.5980878186968839,
3
  "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_cosine/checkpoint-95000",
4
- "epoch": 9.370684553166305,
5
  "eval_steps": 2500,
6
- "global_step": 95000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1925,6 +1925,160 @@
1925
  "eval_tanimoto_similarity": 0.0,
1926
  "eval_valid": 0.9279390934844193,
1927
  "step": 95000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1928
  }
1929
  ],
1930
  "logging_steps": 500,
@@ -1939,12 +2093,12 @@
1939
  "should_evaluate": false,
1940
  "should_log": false,
1941
  "should_save": true,
1942
- "should_training_stop": false
1943
  },
1944
  "attributes": {}
1945
  }
1946
  },
1947
- "total_flos": 8.229984794717169e+17,
1948
  "train_batch_size": 128,
1949
  "trial_name": null,
1950
  "trial_params": null
 
1
  {
2
  "best_metric": 0.5980878186968839,
3
  "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_cosine/checkpoint-95000",
4
+ "epoch": 9.863878477017163,
5
  "eval_steps": 2500,
6
+ "global_step": 100000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1925
  "eval_tanimoto_similarity": 0.0,
1926
  "eval_valid": 0.9279390934844193,
1927
  "step": 95000
1928
+ },
1929
+ {
1930
+ "epoch": 9.420003945551391,
1931
+ "grad_norm": 0.0018721942324191332,
1932
+ "learning_rate": 2.526870501993378e-07,
1933
+ "loss": 0.0002,
1934
+ "step": 95500
1935
+ },
1936
+ {
1937
+ "epoch": 9.469323337936476,
1938
+ "grad_norm": 0.0017144909361377358,
1939
+ "learning_rate": 2.0009955530982117e-07,
1940
+ "loss": 0.0002,
1941
+ "step": 96000
1942
+ },
1943
+ {
1944
+ "epoch": 9.518642730321563,
1945
+ "grad_norm": 0.0021374619100242853,
1946
+ "learning_rate": 1.535318123066204e-07,
1947
+ "loss": 0.0002,
1948
+ "step": 96500
1949
+ },
1950
+ {
1951
+ "epoch": 9.567962122706648,
1952
+ "grad_norm": 0.005559207871556282,
1953
+ "learning_rate": 1.1310684269457139e-07,
1954
+ "loss": 0.0002,
1955
+ "step": 97000
1956
+ },
1957
+ {
1958
+ "epoch": 9.617281515091735,
1959
+ "grad_norm": 0.0035916175693273544,
1960
+ "learning_rate": 7.883464070810032e-08,
1961
+ "loss": 0.0002,
1962
+ "step": 97500
1963
+ },
1964
+ {
1965
+ "epoch": 9.617281515091735,
1966
+ "eval_all_ligands_equal": 0.5979992917847026,
1967
+ "eval_e3_equal": 0.8281692634560907,
1968
+ "eval_e3_graph_edit_distance": Infinity,
1969
+ "eval_e3_graph_edit_distance_norm": Infinity,
1970
+ "eval_e3_has_attachment_point(s)": 0.9868980169971672,
1971
+ "eval_e3_heavy_atoms_difference": 0.40625,
1972
+ "eval_e3_heavy_atoms_difference_norm": 0.008543233459256977,
1973
+ "eval_e3_tanimoto_similarity": 0.0,
1974
+ "eval_e3_valid": 0.9868980169971672,
1975
+ "eval_has_all_attachment_points": 0.9848618980169972,
1976
+ "eval_has_three_substructures": 0.9992917847025495,
1977
+ "eval_heavy_atoms_difference": 6.117032577903683,
1978
+ "eval_heavy_atoms_difference_norm": 0.08171100798099956,
1979
+ "eval_linker_equal": 0.8498583569405099,
1980
+ "eval_linker_graph_edit_distance": 2.2131728045325776e+61,
1981
+ "eval_linker_graph_edit_distance_norm": Infinity,
1982
+ "eval_linker_has_attachment_point(s)": 0.9977868271954674,
1983
+ "eval_linker_heavy_atoms_difference": 0.15430240793201133,
1984
+ "eval_linker_heavy_atoms_difference_norm": -0.0017717876495697477,
1985
+ "eval_linker_tanimoto_similarity": 0.0,
1986
+ "eval_linker_valid": 0.9977868271954674,
1987
+ "eval_loss": 0.38293081521987915,
1988
+ "eval_num_fragments": 3.0001770538243626,
1989
+ "eval_poi_equal": 0.7955028328611898,
1990
+ "eval_poi_graph_edit_distance": Infinity,
1991
+ "eval_poi_graph_edit_distance_norm": Infinity,
1992
+ "eval_poi_has_attachment_point(s)": 0.9394475920679887,
1993
+ "eval_poi_heavy_atoms_difference": 1.805771954674221,
1994
+ "eval_poi_heavy_atoms_difference_norm": 0.057646246942032714,
1995
+ "eval_poi_tanimoto_similarity": 0.0,
1996
+ "eval_poi_valid": 0.9394475920679887,
1997
+ "eval_reassembly": 0.605435552407932,
1998
+ "eval_reassembly_nostereo": 0.6317280453257791,
1999
+ "eval_runtime": 2300.5871,
2000
+ "eval_samples_per_second": 4.91,
2001
+ "eval_steps_per_second": 0.077,
2002
+ "eval_tanimoto_similarity": 0.0,
2003
+ "eval_valid": 0.9265226628895185,
2004
+ "step": 97500
2005
+ },
2006
+ {
2007
+ "epoch": 9.66660090747682,
2008
+ "grad_norm": 0.0018907383782789111,
2009
+ "learning_rate": 5.0723679437578165e-08,
2010
+ "loss": 0.0002,
2011
+ "step": 98000
2012
+ },
2013
+ {
2014
+ "epoch": 9.715920299861907,
2015
+ "grad_norm": 0.00224716286174953,
2016
+ "learning_rate": 2.8818634561947334e-08,
2017
+ "loss": 0.0002,
2018
+ "step": 98500
2019
+ },
2020
+ {
2021
+ "epoch": 9.765239692246992,
2022
+ "grad_norm": 0.0026547384914010763,
2023
+ "learning_rate": 1.3037127690179729e-08,
2024
+ "loss": 0.0002,
2025
+ "step": 99000
2026
+ },
2027
+ {
2028
+ "epoch": 9.814559084632076,
2029
+ "grad_norm": 0.005669564940035343,
2030
+ "learning_rate": 3.4331286033528754e-09,
2031
+ "loss": 0.0002,
2032
+ "step": 99500
2033
+ },
2034
+ {
2035
+ "epoch": 9.863878477017163,
2036
+ "grad_norm": 0.003081223228946328,
2037
+ "learning_rate": 9.011690840776687e-12,
2038
+ "loss": 0.0002,
2039
+ "step": 100000
2040
+ },
2041
+ {
2042
+ "epoch": 9.863878477017163,
2043
+ "eval_all_ligands_equal": 0.5980878186968839,
2044
+ "eval_e3_equal": 0.828257790368272,
2045
+ "eval_e3_graph_edit_distance": Infinity,
2046
+ "eval_e3_graph_edit_distance_norm": Infinity,
2047
+ "eval_e3_has_attachment_point(s)": 0.9870750708215298,
2048
+ "eval_e3_heavy_atoms_difference": 0.40421388101983,
2049
+ "eval_e3_heavy_atoms_difference_norm": 0.008500938679118707,
2050
+ "eval_e3_tanimoto_similarity": 0.0,
2051
+ "eval_e3_valid": 0.9870750708215298,
2052
+ "eval_has_all_attachment_points": 0.9846848441926346,
2053
+ "eval_has_three_substructures": 0.9992032577903682,
2054
+ "eval_heavy_atoms_difference": 6.106409348441926,
2055
+ "eval_heavy_atoms_difference_norm": 0.0815233025391124,
2056
+ "eval_linker_equal": 0.849592776203966,
2057
+ "eval_linker_graph_edit_distance": Infinity,
2058
+ "eval_linker_graph_edit_distance_norm": Infinity,
2059
+ "eval_linker_has_attachment_point(s)": 0.9977868271954674,
2060
+ "eval_linker_heavy_atoms_difference": 0.15465651558073654,
2061
+ "eval_linker_heavy_atoms_difference_norm": -0.0017519301091180534,
2062
+ "eval_linker_tanimoto_similarity": 0.0,
2063
+ "eval_linker_valid": 0.9977868271954674,
2064
+ "eval_loss": 0.38294461369514465,
2065
+ "eval_num_fragments": 3.0000885269121813,
2066
+ "eval_poi_equal": 0.7955028328611898,
2067
+ "eval_poi_graph_edit_distance": Infinity,
2068
+ "eval_poi_graph_edit_distance_norm": Infinity,
2069
+ "eval_poi_has_attachment_point(s)": 0.9393590651558074,
2070
+ "eval_poi_heavy_atoms_difference": 1.8055949008498584,
2071
+ "eval_poi_heavy_atoms_difference_norm": 0.05770569057556065,
2072
+ "eval_poi_tanimoto_similarity": 0.0,
2073
+ "eval_poi_valid": 0.9393590651558074,
2074
+ "eval_reassembly": 0.6055240793201133,
2075
+ "eval_reassembly_nostereo": 0.6318165722379604,
2076
+ "eval_runtime": 2300.3904,
2077
+ "eval_samples_per_second": 4.91,
2078
+ "eval_steps_per_second": 0.077,
2079
+ "eval_tanimoto_similarity": 0.0,
2080
+ "eval_valid": 0.9266997167138811,
2081
+ "step": 100000
2082
  }
2083
  ],
2084
  "logging_steps": 500,
 
2093
  "should_evaluate": false,
2094
  "should_log": false,
2095
  "should_save": true,
2096
+ "should_training_stop": true
2097
  },
2098
  "attributes": {}
2099
  }
2100
  },
2101
+ "total_flos": 8.663173632603694e+17,
2102
  "train_batch_size": 128,
2103
  "trial_name": null,
2104
  "trial_params": null