sorayutmild
committed on
Commit
•
dc8fa44
1
Parent(s):
05bd9cd
Training in progress, step 2000
Browse files
- .gitattributes +1 -0
- .gitignore +1 -0
- config.json +32 -0
- pytorch_model.bin +3 -0
- runs/Dec22_13-19-54_3efc8d045e2f/1671715404.0960257/events.out.tfevents.1671715404.3efc8d045e2f.23.2 +3 -0
- runs/Dec22_13-19-54_3efc8d045e2f/1671715417.2763708/events.out.tfevents.1671715417.3efc8d045e2f.23.3 +3 -0
- runs/Dec22_13-19-54_3efc8d045e2f/1671715428.5540988/events.out.tfevents.1671715428.3efc8d045e2f.23.4 +3 -0
- runs/Dec22_13-19-54_3efc8d045e2f/1671715441.1662471/events.out.tfevents.1671715441.3efc8d045e2f.23.5 +3 -0
- runs/Dec22_13-19-54_3efc8d045e2f/1671715451.616452/events.out.tfevents.1671715451.3efc8d045e2f.23.6 +3 -0
- runs/Dec22_13-19-54_3efc8d045e2f/1671715492.9185338/events.out.tfevents.1671715492.3efc8d045e2f.23.7 +3 -0
- runs/Dec22_13-19-54_3efc8d045e2f/events.out.tfevents.1671715403.3efc8d045e2f.23.1 +3 -0
- runs/Dec22_13-25-09_3efc8d045e2f/1671715524.4630265/events.out.tfevents.1671715524.3efc8d045e2f.23.9 +3 -0
- runs/Dec22_13-25-09_3efc8d045e2f/1671715531.49861/events.out.tfevents.1671715531.3efc8d045e2f.23.10 +3 -0
- runs/Dec22_13-25-09_3efc8d045e2f/events.out.tfevents.1671715524.3efc8d045e2f.23.8 +3 -0
- runs/Dec22_13-26-27_3efc8d045e2f/1671715591.830819/events.out.tfevents.1671715591.3efc8d045e2f.23.12 +3 -0
- runs/Dec22_13-26-27_3efc8d045e2f/1671715666.0171692/events.out.tfevents.1671715666.3efc8d045e2f.23.13 +3 -0
- runs/Dec22_13-26-27_3efc8d045e2f/events.out.tfevents.1671715591.3efc8d045e2f.23.11 +3 -0
- runs/Dec22_13-27-58_3efc8d045e2f/1671715687.5748084/events.out.tfevents.1671715687.3efc8d045e2f.23.15 +3 -0
- runs/Dec22_13-27-58_3efc8d045e2f/1671715692.787198/events.out.tfevents.1671715692.3efc8d045e2f.23.16 +3 -0
- runs/Dec22_13-27-58_3efc8d045e2f/events.out.tfevents.1671715687.3efc8d045e2f.23.14 +3 -0
- special_tokens_map.json +5 -0
- spiece.model +3 -0
- tokenizer.json +3 -0
- tokenizer_config.json +12 -0
- training_args.bin +3 -0
.gitattributes
CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
32 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
33 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
32 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
33 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
35 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
checkpoint-*/
|
config.json
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "thanathorn/mt5-cpe-kmutt-thai-sentence-sum",
|
3 |
+
"architectures": [
|
4 |
+
"MT5ForConditionalGeneration"
|
5 |
+
],
|
6 |
+
"d_ff": 2048,
|
7 |
+
"d_kv": 64,
|
8 |
+
"d_model": 768,
|
9 |
+
"decoder_start_token_id": 0,
|
10 |
+
"dense_act_fn": "gelu_new",
|
11 |
+
"dropout_rate": 0.1,
|
12 |
+
"eos_token_id": 1,
|
13 |
+
"feed_forward_proj": "gated-gelu",
|
14 |
+
"initializer_factor": 1.0,
|
15 |
+
"is_encoder_decoder": true,
|
16 |
+
"is_gated_act": true,
|
17 |
+
"layer_norm_epsilon": 1e-06,
|
18 |
+
"model_type": "mt5",
|
19 |
+
"num_decoder_layers": 12,
|
20 |
+
"num_heads": 12,
|
21 |
+
"num_layers": 12,
|
22 |
+
"output_past": true,
|
23 |
+
"pad_token_id": 0,
|
24 |
+
"relative_attention_max_distance": 128,
|
25 |
+
"relative_attention_num_buckets": 32,
|
26 |
+
"tie_word_embeddings": false,
|
27 |
+
"tokenizer_class": "T5Tokenizer",
|
28 |
+
"torch_dtype": "float32",
|
29 |
+
"transformers_version": "4.20.1",
|
30 |
+
"use_cache": true,
|
31 |
+
"vocab_size": 250112
|
32 |
+
}
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55d69b4085f93b4ff49bdc1d5c842cd55c55463006f2e9d5ad97b36ba717e287
|
3 |
+
size 2329700173
|
runs/Dec22_13-19-54_3efc8d045e2f/1671715404.0960257/events.out.tfevents.1671715404.3efc8d045e2f.23.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7ff07576274d3c7283f58c2fe06b75ec97d3d0d84142c80440a795940c76c20
|
3 |
+
size 5702
|
runs/Dec22_13-19-54_3efc8d045e2f/1671715417.2763708/events.out.tfevents.1671715417.3efc8d045e2f.23.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce1260bda67ecf2418d2c108d0976c12c23e41676b7c1748d58d752c32b42ce6
|
3 |
+
size 5702
|
runs/Dec22_13-19-54_3efc8d045e2f/1671715428.5540988/events.out.tfevents.1671715428.3efc8d045e2f.23.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:607b3e55ccffc0f823f21e02b173815e83b1a8e752db82cae2644922da3d612c
|
3 |
+
size 5702
|
runs/Dec22_13-19-54_3efc8d045e2f/1671715441.1662471/events.out.tfevents.1671715441.3efc8d045e2f.23.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db1a4a0c30ebd52ad67b103302a19c09ab0baa8046331502b7618b11abf9d28d
|
3 |
+
size 5702
|
runs/Dec22_13-19-54_3efc8d045e2f/1671715451.616452/events.out.tfevents.1671715451.3efc8d045e2f.23.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f89180f6461efb659cd4ff130568e2b5d061f86b0b9690a14ea7985b621e53e
|
3 |
+
size 5702
|
runs/Dec22_13-19-54_3efc8d045e2f/1671715492.9185338/events.out.tfevents.1671715492.3efc8d045e2f.23.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:396524122392f355e2b7c1e0766f20bede15c995b21c76948ca3efd1f145f94e
|
3 |
+
size 5702
|
runs/Dec22_13-19-54_3efc8d045e2f/events.out.tfevents.1671715403.3efc8d045e2f.23.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e36c930942299a90c3be9f01c92782eb91bb657972579904f66ddf3a2692b5ed
|
3 |
+
size 24584
|
runs/Dec22_13-25-09_3efc8d045e2f/1671715524.4630265/events.out.tfevents.1671715524.3efc8d045e2f.23.9
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a08ea118741d707f53fbca8989cb0a7becbcf4ff9b20ed776bc8c8d23f6981ec
|
3 |
+
size 5702
|
runs/Dec22_13-25-09_3efc8d045e2f/1671715531.49861/events.out.tfevents.1671715531.3efc8d045e2f.23.10
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:215d5387b8396d116a2d5e1d3be7d5e9090ff945221fb7cc0237452a55e02a28
|
3 |
+
size 5702
|
runs/Dec22_13-25-09_3efc8d045e2f/events.out.tfevents.1671715524.3efc8d045e2f.23.8
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eee41196f6e571128b0ebc97959d8dee01d93dacaeb18e27dfc0f15c778a4ccb
|
3 |
+
size 8088
|
runs/Dec22_13-26-27_3efc8d045e2f/1671715591.830819/events.out.tfevents.1671715591.3efc8d045e2f.23.12
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:418e00a4f9e7ace6e25b48d7069ffedf2f909664a249fa389508d64dab6be3a9
|
3 |
+
size 5702
|
runs/Dec22_13-26-27_3efc8d045e2f/1671715666.0171692/events.out.tfevents.1671715666.3efc8d045e2f.23.13
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bce33056c1b4d971024e822dadaa97e31bd9602eb5f40d8f52dea9b2dc544c22
|
3 |
+
size 5702
|
runs/Dec22_13-26-27_3efc8d045e2f/events.out.tfevents.1671715591.3efc8d045e2f.23.11
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b6daf730b807967a9ad800485b75a176717f346dc2b39e5bfde13417861646f
|
3 |
+
size 8088
|
runs/Dec22_13-27-58_3efc8d045e2f/1671715687.5748084/events.out.tfevents.1671715687.3efc8d045e2f.23.15
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e324b80818693f86879058985853fb4aae8efbdbfa743d8825ce486893b6e154
|
3 |
+
size 5702
|
runs/Dec22_13-27-58_3efc8d045e2f/1671715692.787198/events.out.tfevents.1671715692.3efc8d045e2f.23.16
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2419d53a1e0642925605e3e5575ae527b51dfa56bfc3ddc913dc22cf6eeb6310
|
3 |
+
size 5702
|
runs/Dec22_13-27-58_3efc8d045e2f/events.out.tfevents.1671715687.3efc8d045e2f.23.14
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:072cbdea0cfbf241453e30c882115adf6d456932359ae67f9d39789001ad2187
|
3 |
+
size 8716
|
special_tokens_map.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"eos_token": "</s>",
|
3 |
+
"pad_token": "<pad>",
|
4 |
+
"unk_token": "<unk>"
|
5 |
+
}
|
spiece.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef78f86560d809067d12bac6c09f19a462cb3af3f54d2b8acbba26e1433125d6
|
3 |
+
size 4309802
|
tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93c3578052e1605d8332eb961bc08d72e246071974e4cc54aa6991826b802aa5
|
3 |
+
size 16330369
|
tokenizer_config.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"additional_special_tokens": null,
|
3 |
+
"eos_token": "</s>",
|
4 |
+
"extra_ids": 0,
|
5 |
+
"name_or_path": "thanathorn/mt5-cpe-kmutt-thai-sentence-sum",
|
6 |
+
"pad_token": "<pad>",
|
7 |
+
"sp_model_kwargs": {},
|
8 |
+
"special_tokens_map_file": "/home/patrick/.cache/torch/transformers/685ac0ca8568ec593a48b61b0a3c272beee9bc194a3c7241d15dcadb5f875e53.f76030f3ec1b96a8199b2593390c610e76ca8028ef3d24680000619ffb646276",
|
9 |
+
"tokenizer_class": "T5Tokenizer",
|
10 |
+
"truncate": true,
|
11 |
+
"unk_token": "<unk>"
|
12 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b18463aa97d9f229af1f4234149444ea4ce5edd2060b1732bf8f26a6a382ee2e
|
3 |
+
size 3567
|