MuRIL_for_TeluguQC

Browse files

Files changed (7) hide show

README.md +17 -16
config.json +1 -1
model.safetensors +1 -1
runs/Apr09_09-25-00_d477a7e83fd3/events.out.tfevents.1712654711.d477a7e83fd3.893.0 +3 -0
runs/Apr09_09-32-10_d477a7e83fd3/events.out.tfevents.1712655194.d477a7e83fd3.893.1 +3 -0
special_tokens_map.json +5 -35
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -1,6 +1,6 @@
 ---
-license: cc-by-4.0
-base_model: l3cube-pune/telugu-bert
 tags:
 - generated_from_trainer
 metrics:
@@ -17,13 +17,13 @@ should probably proofread and complete it, then remove this comment. -->
 # output
-This model is a fine-tuned version of [l3cube-pune/telugu-bert](https://huggingface.co/l3cube-pune/telugu-bert) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 1.6017
-- Precision: 0.7825
-- Recall: 0.7870
-- Accuracy: 0.7870
-- F1-score: 0.7809
 ## Model description
@@ -48,19 +48,20 @@ The following hyperparameters were used during training:
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
-- num_epochs: 7
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | Accuracy | F1-score |
 |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:--------:|:--------:|
-| 1.7849        | 1.0   | 32   | 1.7769          | 0.0454    | 0.2130 | 0.2130   | 0.0748   |
-| 1.7491        | 2.0   | 64   | 1.7436          | 0.1414    | 0.3306 | 0.3306   | 0.1933   |
-| 1.7032        | 3.0   | 96   | 1.7059          | 0.2918    | 0.3043 | 0.3043   | 0.2076   |
-| 1.6498        | 4.0   | 128  | 1.6571          | 0.7274    | 0.6572 | 0.6572   | 0.6571   |
-| 1.6029        | 5.0   | 160  | 1.6236          | 0.7687    | 0.7627 | 0.7627   | 0.7576   |
-| 1.5724        | 6.0   | 192  | 1.6049          | 0.7894    | 0.7951 | 0.7951   | 0.7893   |
-| 1.556         | 7.0   | 224  | 1.6017          | 0.7825    | 0.7870 | 0.7870   | 0.7809   |
 ### Framework versions

 ---
+license: apache-2.0
+base_model: google/muril-base-cased
 tags:
 - generated_from_trainer
 metrics:
 # output
+This model is a fine-tuned version of [google/muril-base-cased](https://huggingface.co/google/muril-base-cased) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 1.6250
+- Precision: 0.7716
+- Recall: 0.7647
+- Accuracy: 0.7647
+- F1-score: 0.7587
 ## Model description
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
+- num_epochs: 8
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | Accuracy | F1-score |
 |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:--------:|:--------:|
+| 1.7858        | 1.0   | 32   | 1.7821          | 0.0454    | 0.2130 | 0.2130   | 0.0748   |
+| 1.7526        | 2.0   | 64   | 1.7539          | 0.1754    | 0.2860 | 0.2860   | 0.1866   |
+| 1.7112        | 3.0   | 96   | 1.7232          | 0.3352    | 0.3043 | 0.3043   | 0.2168   |
+| 1.6655        | 4.0   | 128  | 1.6832          | 0.7122    | 0.6166 | 0.6166   | 0.6194   |
+| 1.6217        | 5.0   | 160  | 1.6496          | 0.7708    | 0.7688 | 0.7688   | 0.7629   |
+| 1.5898        | 6.0   | 192  | 1.6431          | 0.7618    | 0.7424 | 0.7424   | 0.7379   |
+| 1.5678        | 7.0   | 224  | 1.6285          | 0.7697    | 0.7627 | 0.7627   | 0.7565   |
+| 1.5572        | 8.0   | 256  | 1.6250          | 0.7716    | 0.7647 | 0.7647   | 0.7587   |
 ### Framework versions

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "l3cube-pune/telugu-bert",
   "architectures": [
     "BertForSequenceClassification"
   ],

 {
+  "_name_or_path": "google/muril-base-cased",
   "architectures": [
     "BertForSequenceClassification"
   ],

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aab7a751f02eea3422dd153d9de73285a746a4c7df81a6f7f561c7dd835eeb38
 size 950266896

 version https://git-lfs.github.com/spec/v1
+oid sha256:9b85ca71ae55461247b0c3c451f9fbcd3af094e027628ec1b6c8397e8880713a
 size 950266896

runs/Apr09_09-25-00_d477a7e83fd3/events.out.tfevents.1712654711.d477a7e83fd3.893.0 ADDED Viewed

@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8c0a15a358e8c0080017692792a2c3ad02edab0013f3719c5fc15534b0057191
+size 9944

runs/Apr09_09-32-10_d477a7e83fd3/events.out.tfevents.1712655194.d477a7e83fd3.893.1 ADDED Viewed

@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b0dae25e691bcb7f7c08eb347fcb2e35cf4a2b33c0466174a7a0454411e77f1e
+size 10630

special_tokens_map.json CHANGED Viewed

@@ -1,37 +1,7 @@
 {
-  "cls_token": {
-    "content": "[CLS]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "mask_token": {
-    "content": "[MASK]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "pad_token": {
-    "content": "[PAD]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "sep_token": {
-    "content": "[SEP]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "unk_token": {
-    "content": "[UNK]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  }
 }

 {
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bca09a3f3f95451faf3e17d022867f8113ccd6ab0ca2e5d2d6e73464c3890360
 size 4856

 version https://git-lfs.github.com/spec/v1
+oid sha256:cec6a56dc671964ef5b5a1c936de270b653e2169a37e8282e74d5fb914107522
 size 4856