Training in progress, step 1000
Browse files
config.json
CHANGED
|
@@ -11,9 +11,9 @@
|
|
| 11 |
"initializer_range": 0.02,
|
| 12 |
"layer_norm_epsilon": 1e-05,
|
| 13 |
"model_type": "gpt2",
|
| 14 |
-
"n_ctx":
|
| 15 |
-
"n_embd":
|
| 16 |
-
"n_head":
|
| 17 |
"n_inner": null,
|
| 18 |
"n_layer": 12,
|
| 19 |
"n_positions": 1024,
|
|
|
|
| 11 |
"initializer_range": 0.02,
|
| 12 |
"layer_norm_epsilon": 1e-05,
|
| 13 |
"model_type": "gpt2",
|
| 14 |
+
"n_ctx": 512,
|
| 15 |
+
"n_embd": 1024,
|
| 16 |
+
"n_head": 16,
|
| 17 |
"n_inner": null,
|
| 18 |
"n_layer": 12,
|
| 19 |
"n_positions": 1024,
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b2de214e8f1502e86bc9b61c8992505f98d77a5eedb4cfa1d1be2f33014ea1c
|
| 3 |
+
size 731716424
|
runs/Apr10_22-26-23_gpu-pod/events.out.tfevents.1712787988.gpu-pod.1209.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a947d0eeba31181aa5c45bb90a184efcb5ffdd46eb02b8a1146ce2c4f4eda351
|
| 3 |
+
size 4829
|
runs/Apr10_22-28-16_gpu-pod/events.out.tfevents.1712788101.gpu-pod.1718.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5f7d9cac196fb4d025037ddada8c79424da90c8e0f6fcd7c122cbd38d122eb1
|
| 3 |
+
size 5038
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4475
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c0358968f457a6b9893184cffc2a04fbb2483bc3c78b69ffbb670d89f6c31ef8
|
| 3 |
size 4475
|