Upload folder using huggingface_hub
Browse files- config.json +32 -0
- generation_config.json +8 -0
- model-00001-of-00024.safetensors +3 -0
- model-00002-of-00024.safetensors +3 -0
- model-00003-of-00024.safetensors +3 -0
- model-00004-of-00024.safetensors +3 -0
- model-00005-of-00024.safetensors +3 -0
- model-00006-of-00024.safetensors +3 -0
- model-00007-of-00024.safetensors +3 -0
- model-00008-of-00024.safetensors +3 -0
- model-00009-of-00024.safetensors +3 -0
- model-00010-of-00024.safetensors +3 -0
- model-00011-of-00024.safetensors +3 -0
- model-00012-of-00024.safetensors +3 -0
- model-00013-of-00024.safetensors +3 -0
- model-00014-of-00024.safetensors +3 -0
- model-00015-of-00024.safetensors +3 -0
- model-00016-of-00024.safetensors +3 -0
- model-00017-of-00024.safetensors +3 -0
- model-00018-of-00024.safetensors +3 -0
- model-00019-of-00024.safetensors +3 -0
- model-00020-of-00024.safetensors +3 -0
- model-00021-of-00024.safetensors +3 -0
- model-00022-of-00024.safetensors +3 -0
- model-00023-of-00024.safetensors +3 -0
- model-00024-of-00024.safetensors +3 -0
- model.safetensors.index.json +0 -0
config.json
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "X-ALMA",
|
3 |
+
"architectures": [
|
4 |
+
"XALMAForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"head_dim": 128,
|
11 |
+
"hidden_act": "silu",
|
12 |
+
"hidden_size": 5120,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 13824,
|
15 |
+
"max_length": null,
|
16 |
+
"max_position_embeddings": 4096,
|
17 |
+
"mlp_bias": false,
|
18 |
+
"model_type": "llama",
|
19 |
+
"num_attention_heads": 40,
|
20 |
+
"num_hidden_layers": 40,
|
21 |
+
"num_key_value_heads": 40,
|
22 |
+
"pad_token_id": 0,
|
23 |
+
"pretraining_tp": 1,
|
24 |
+
"rms_norm_eps": 1e-05,
|
25 |
+
"rope_scaling": null,
|
26 |
+
"rope_theta": 10000.0,
|
27 |
+
"tie_word_embeddings": false,
|
28 |
+
"torch_dtype": "float32",
|
29 |
+
"transformers_version": "4.45.1",
|
30 |
+
"use_cache": true,
|
31 |
+
"vocab_size": 32000
|
32 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"max_length": 512,
|
6 |
+
"pad_token_id": 0,
|
7 |
+
"transformers_version": "4.45.1"
|
8 |
+
}
|
model-00001-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe9462bf7af838fa5927803ccb7c91048c91f64940346991de5ff9a07711dbe6
|
3 |
+
size 4900059112
|
model-00002-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bf417426a6de545a20d03a5ae33054cc9ebc9c6788daefab8adda009d2acc05
|
3 |
+
size 4997618144
|
model-00003-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f024dd35d1a734e4cc2fd1c4296f179e2e9977b090958892e63d354ddb3c62a
|
3 |
+
size 4972412488
|
model-00004-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e474de0e734d60075da919c9806e388e034a25550d0a1ac373af87272315966
|
3 |
+
size 4993425240
|
model-00005-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f0e410f0761149ec421ec48bcff92c9f091fa2adf74d5757c622d7b2ef15106
|
3 |
+
size 4850822032
|
model-00006-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0806bac01b08365bafd14d35460806fed3c7f6b2d8fe136f9b4defb4c90d23f
|
3 |
+
size 4966158520
|
model-00007-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b2a08fdc3e22fb556dc5c6a9c11f84be750aa2ba3232e6768353cf591ead099
|
3 |
+
size 4975559648
|
model-00008-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:727d1daf2aa80f2cfb01290fcd08f8e5b14fbf4b44473cdb4c618168863e5dd2
|
3 |
+
size 4979794680
|
model-00009-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0bf6af7e00334b972741dba02386f4315128d0374c5cb00975488e4263f10085
|
3 |
+
size 4997621464
|
model-00010-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:367ec5b405521d124e081b79aa3ca7eff0664bf75af54dfb917be578e55dbecc
|
3 |
+
size 4934703200
|
model-00011-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f03150f6a9ad3001ac98d0cc4fc44ed530d6bafd908b02dbb1e141e5a10b6d1e
|
3 |
+
size 4988141408
|
model-00012-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8bfdeec5bc2d6cff70e850ef4b8495f4ddf8402061251dd5a883b2555c7d6e4
|
3 |
+
size 4893812696
|
model-00013-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45d1f3577e67322a89f5049455074a63dfeedd129ff176c25938e0add54c208b
|
3 |
+
size 4997618336
|
model-00014-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2606a4bdcca537830aa857f5f00b2ba9206cc1d316720abd1f695cc10ec3ea1f
|
3 |
+
size 4972412696
|
model-00015-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f41a82233824728f7ea682650b1b190c1dbf33b0134a0304bb322c997f7799d0
|
3 |
+
size 4993425448
|
model-00016-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f353e5a62651c42178d49d5361e2bfdbc01a4c6bb5c65d29fceafaf033fc24d6
|
3 |
+
size 4850822264
|
model-00017-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50b693d450fc42c6992f6efd34511f97142cad13cb948d0992713467a10f48ad
|
3 |
+
size 4966158672
|
model-00018-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f76f53c89011a6842041854a84c39f32ab7ff17417da17790cacee1306e998a
|
3 |
+
size 4975559648
|
model-00019-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:583faf545d4c5873e009df486fb91b262dfd37aa7d6321d6c8e550a24ebf91a9
|
3 |
+
size 4979794680
|
model-00020-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c614d68b32c532bb7271f6a9a1fa9aceffff05d546db00859349e7c38d11efa2
|
3 |
+
size 4997621464
|
model-00021-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6992d59925ed6604d8610ace159fce78bfb8d7b3babe1c51d2201d7eccd917d4
|
3 |
+
size 4934703200
|
model-00022-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99bc875b42d5384b77b7de151ea4aa3125068df84b129a03d9ccffe40088ac2c
|
3 |
+
size 4988141408
|
model-00023-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a8ee3cd9d9593f8651dd0edc9a7e0dc3c453cdb62c74613e250160c57afee1c
|
3 |
+
size 4893812696
|
model-00024-of-00024.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4533cee65d7e7d4b2c8e2ce31cdd147215d9f77d9c49066bbfe6a0a64dfe68c5
|
3 |
+
size 2152794216
|
model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|