ahmedheakl committed on
Commit
9ce3741
1 Parent(s): a9356cf

Training in progress, step 131000

Browse files
Files changed (4) hide show
  1. config.json +1 -2
  2. model.safetensors +1 -1
  3. tokenizer.json +0 -0
  4. training_args.bin +1 -1
config.json CHANGED
@@ -7,7 +7,6 @@
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 32013,
9
  "eos_token_id": 32021,
10
- "head_dim": 128,
11
  "hidden_act": "silu",
12
  "hidden_size": 2048,
13
  "initializer_range": 0.02,
@@ -28,7 +27,7 @@
28
  "rope_theta": 100000,
29
  "tie_word_embeddings": false,
30
  "torch_dtype": "bfloat16",
31
- "transformers_version": "4.45.2",
32
  "use_cache": false,
33
  "vocab_size": 32256
34
  }
 
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 32013,
9
  "eos_token_id": 32021,
 
10
  "hidden_act": "silu",
11
  "hidden_size": 2048,
12
  "initializer_range": 0.02,
 
27
  "rope_theta": 100000,
28
  "tie_word_embeddings": false,
29
  "torch_dtype": "bfloat16",
30
+ "transformers_version": "4.44.2",
31
  "use_cache": false,
32
  "vocab_size": 32256
33
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2fad2386719a163af2f035e3add9cd8a24396e4337f4fcf3d616be8a16f67eb
3
  size 2692969128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93cc5222cc26606c6337586c2760731e9b70f42beba7736efbef25c4929f4677
3
  size 2692969128
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:869bce22a0489edacec40c8cd9439ce2d965c89b6299eab749b480464055a034
3
  size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e28cf8e36ba27b9823cfb1f50af213f8361bb2179a8a5491e4f0b852a90a6d7a
3
  size 5496