Hack90 committed on
Commit
c0f27b1
·
verified ·
1 Parent(s): 8f23794

DNA-LLM/virus_pythia_14_1024_cross_entropy

Browse files
Files changed (5) hide show
  1. README.md +3 -3
  2. config.json +1 -1
  3. generation_config.json +1 -1
  4. model.safetensors +1 -1
  5. training_args.bin +1 -1
README.md CHANGED
@@ -32,8 +32,8 @@ More information needed
32
 
33
  The following hyperparameters were used during training:
34
  - learning_rate: 5e-05
35
- - train_batch_size: 40
36
- - eval_batch_size: 40
37
  - seed: 42
38
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
39
  - lr_scheduler_type: linear
@@ -46,7 +46,7 @@ The following hyperparameters were used during training:
46
 
47
  ### Framework versions
48
 
49
- - Transformers 4.40.0
50
  - Pytorch 2.2.1+cu121
51
  - Datasets 2.19.0
52
  - Tokenizers 0.19.1
 
32
 
33
  The following hyperparameters were used during training:
34
  - learning_rate: 5e-05
35
+ - train_batch_size: 80
36
+ - eval_batch_size: 80
37
  - seed: 42
38
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
39
  - lr_scheduler_type: linear
 
46
 
47
  ### Framework versions
48
 
49
+ - Transformers 4.40.1
50
  - Pytorch 2.2.1+cu121
51
  - Datasets 2.19.0
52
  - Tokenizers 0.19.1
config.json CHANGED
@@ -23,7 +23,7 @@
23
  "rotary_pct": 0.25,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "float32",
26
- "transformers_version": "4.40.0",
27
  "use_cache": true,
28
  "use_parallel_residual": true,
29
  "vocab_size": 9
 
23
  "rotary_pct": 0.25,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "float32",
26
+ "transformers_version": "4.40.1",
27
  "use_cache": true,
28
  "use_parallel_residual": true,
29
  "vocab_size": 9
generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
4
  "eos_token_id": 0,
5
- "transformers_version": "4.40.0"
6
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
4
  "eos_token_id": 0,
5
+ "transformers_version": "4.40.1"
6
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7198f04c137198d2bcfa67ede584dc8c96153d88304bc53355cb603c34d29666
3
  size 4777048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e06adf92fe753dc442723db3d871fa396947156cca82c3799c7de511737a02b
3
  size 4777048
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68f63195edd8ab732fe7d4f1db65872537bae4e94e35c4eaabf8c8034cf8b7fc
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30599c12bfd41d82381809d03b7c0350b5f494e08d13f33d6b14050decb9696b
3
  size 4984