Ransaka
/

sinhala-roman-transformer

Text2Text Generation

encoder-decoder

Generated from Trainer

Inference Endpoints

Model card | Files and versions | Training metrics | Community

Ransaka committed 10 days ago

Commit

2f551a5

•

1 Parent(s): 766759a

Training in progress, step 500

Files changed (3) hide show

config.json +6 -6
model.safetensors +2 -2
training_args.bin +1 -1

config.json CHANGED Viewed

@@ -25,7 +25,7 @@
     "forced_eos_token_id": null,
     "hidden_act": "gelu",
     "hidden_dropout_prob": 0.1,
-    "hidden_size": 384,
     "id2label": {
       "0": "LABEL_0",
       "1": "LABEL_1"
@@ -45,10 +45,10 @@
     "min_length": 0,
     "model_type": "bert",
     "no_repeat_ngram_size": 0,
-    "num_attention_heads": 6,
     "num_beam_groups": 1,
     "num_beams": 1,
-    "num_hidden_layers": 6,
     "num_return_sequences": 1,
     "output_attentions": false,
     "output_hidden_states": false,
@@ -105,7 +105,7 @@
     "forced_eos_token_id": null,
     "hidden_act": "gelu",
     "hidden_dropout_prob": 0.1,
-    "hidden_size": 384,
     "id2label": {
       "0": "LABEL_0",
       "1": "LABEL_1"
@@ -125,10 +125,10 @@
     "min_length": 0,
     "model_type": "bert",
     "no_repeat_ngram_size": 0,
-    "num_attention_heads": 6,
     "num_beam_groups": 1,
     "num_beams": 1,
-    "num_hidden_layers": 6,
     "num_return_sequences": 1,
     "output_attentions": false,
     "output_hidden_states": false,

     "forced_eos_token_id": null,
     "hidden_act": "gelu",
     "hidden_dropout_prob": 0.1,
+    "hidden_size": 768,
     "id2label": {
       "0": "LABEL_0",
       "1": "LABEL_1"
     "min_length": 0,
     "model_type": "bert",
     "no_repeat_ngram_size": 0,
+    "num_attention_heads": 3,
     "num_beam_groups": 1,
     "num_beams": 1,
+    "num_hidden_layers": 3,
     "num_return_sequences": 1,
     "output_attentions": false,
     "output_hidden_states": false,
     "forced_eos_token_id": null,
     "hidden_act": "gelu",
     "hidden_dropout_prob": 0.1,
+    "hidden_size": 768,
     "id2label": {
       "0": "LABEL_0",
       "1": "LABEL_1"
     "min_length": 0,
     "model_type": "bert",
     "no_repeat_ngram_size": 0,
+    "num_attention_heads": 3,
     "num_beam_groups": 1,
     "num_beams": 1,
+    "num_hidden_layers": 3,
     "num_return_sequences": 1,
     "output_attentions": false,
     "output_hidden_states": false,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:df2c45619e3c92ed45a03412cc3752b22de82f3d08c696d56dbb92768827db23
-size 132506536

 version https://git-lfs.github.com/spec/v1
+oid sha256:0f146193e4e10b0dea08825a6a086b0806a45cdefc7c53dc62d79dd81a1534d0
+size 229215968

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:42f1aaf7698ac609f95385131af9e2b33b5954f26ec5e11d6e9aaa5526ee8df4
 size 5240

 version https://git-lfs.github.com/spec/v1
+oid sha256:2384c99249dd25b6927dbc0e7d215bf8bb8277aa315bc1488f05f54cd28da30b
 size 5240