nblinh committed on
Commit
30aa0b9
·
verified ·
1 Parent(s): b011168

End of training

Browse files
README.md CHANGED
@@ -78,7 +78,7 @@ resume_from_checkpoint: null
78
  s2_attention: null
79
  sample_packing: false
80
  saves_per_epoch: 1
81
- sequence_len: 2048
82
  special_tokens:
83
  pad_token: </s>
84
  strict: false
@@ -105,7 +105,7 @@ xformers_attention: true
105
 
106
  This model is a fine-tuned version of [openlm-research/open_llama_3b](https://huggingface.co/openlm-research/open_llama_3b) on the None dataset.
107
  It achieves the following results on the evaluation set:
108
- - Loss: 3.7840
109
 
110
  ## Model description
111
 
@@ -137,7 +137,7 @@ The following hyperparameters were used during training:
137
 
138
  | Training Loss | Epoch | Step | Validation Loss |
139
  |:-------------:|:------:|:----:|:---------------:|
140
- | 4.5323 | 0.0002 | 10 | 3.7840 |
141
 
142
 
143
  ### Framework versions
 
78
  s2_attention: null
79
  sample_packing: false
80
  saves_per_epoch: 1
81
+ sequence_len: 1024
82
  special_tokens:
83
  pad_token: </s>
84
  strict: false
 
105
 
106
  This model is a fine-tuned version of [openlm-research/open_llama_3b](https://huggingface.co/openlm-research/open_llama_3b) on the None dataset.
107
  It achieves the following results on the evaluation set:
108
+ - Loss: 3.7643
109
 
110
  ## Model description
111
 
 
137
 
138
  | Training Loss | Epoch | Step | Validation Loss |
139
  |:-------------:|:------:|:----:|:---------------:|
140
+ | 4.5149 | 0.0002 | 10 | 3.7643 |
141
 
142
 
143
  ### Framework versions
adapter_config.json CHANGED
@@ -21,11 +21,11 @@
21
  "revision": null,
22
  "target_modules": [
23
  "gate_proj",
24
- "v_proj",
25
  "k_proj",
 
 
26
  "q_proj",
27
  "up_proj",
28
- "o_proj",
29
  "down_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
 
21
  "revision": null,
22
  "target_modules": [
23
  "gate_proj",
 
24
  "k_proj",
25
+ "o_proj",
26
+ "v_proj",
27
  "q_proj",
28
  "up_proj",
 
29
  "down_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a23971735c6c7201e7a2b2f9a991fd1dd59ec44520a51d2bec7bfc1eaafb584e
3
  size 101834682
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21b5774c11c87956c6614a03adec5912db7b24ce635954cf394ecb851ef66bfe
3
  size 101834682
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:31b0d205f90ef61231421a91f7d99271ed8a6888b23c86b07e12e680847aa3ec
3
  size 101752088
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a817fca8448c618ca0399ae6500d0d06078b8dcbd1642b6de601d31a99c1314
3
  size 101752088
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1ca2c9cfcb209a44e2a3d71ecca31b66b857e19f413bd59a3c56c046fc7ee16
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c875cc28983fec1f79d714107d3f7799493d920a5d75aa40a4d88d5568dc4bcf
3
  size 6776