Update README.md
Browse files
README.md
CHANGED
|
@@ -75,16 +75,17 @@ The following hyperparameters were used during training:
|
|
| 75 |
- lr_scheduler_type: cosine
|
| 76 |
- num_steps: 0
|
| 77 |
- quantization_type: bitsandbytes
|
| 78 |
-
- LoRA:
|
| 79 |
-
-
|
| 80 |
-
-
|
| 81 |
-
-
|
| 82 |
-
-
|
| 83 |
-
-
|
| 84 |
-
-
|
| 85 |
-
-
|
| 86 |
-
-
|
| 87 |
-
-
|
|
|
|
| 88 |
|
| 89 |
### Training results
|
| 90 |
|
|
|
|
| 75 |
- lr_scheduler_type: cosine
|
| 76 |
- num_steps: 0
|
| 77 |
- quantization_type: bitsandbytes
|
| 78 |
+
- LoRA:
|
| 79 |
+
- bits: 4
|
| 80 |
+
- use_exllama: True
|
| 81 |
+
- device_map: auto
|
| 82 |
+
- use_cache: False
|
| 83 |
+
- lora_r: 8
|
| 84 |
+
- lora_alpha: 16
|
| 85 |
+
- lora_dropout: 0.1
|
| 86 |
+
- bias: none
|
| 87 |
+
- target_modules: ['q_proj', 'k_proj', 'v_proj', 'o_proj']
|
| 88 |
+
- task_type: CAUSAL_LM
|
| 89 |
|
| 90 |
### Training results
|
| 91 |
|