graphcore-rahult committed on
Commit
092db50
1 Parent(s): 78263b2

Training in progress, step 500

Browse files
Files changed (4) hide show
  1. config.json +1 -1
  2. ipu_config.json +4 -4
  3. pytorch_model.bin +1 -1
  4. training_args.bin +1 -1
config.json CHANGED
@@ -2,7 +2,7 @@
2
  "_name_or_path": "gpt2",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
- "PipelinedGPT2LMHeadModel"
6
  ],
7
  "attn_pdrop": 0.1,
8
  "bos_token_id": 50256,
 
2
  "_name_or_path": "gpt2",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
+ "PoptorchPipelinedGPT2LMHeadModel"
6
  ],
7
  "attn_pdrop": 0.1,
8
  "bos_token_id": 50256,
ipu_config.json CHANGED
@@ -3,11 +3,11 @@
3
  "device_iterations": 2,
4
  "embedding_serialization_factor": 4,
5
  "enable_half_partials": true,
6
- "executable_cache_dir": "/tmp/lmcache/",
7
  "execute_encoder_on_cpu_for_generation": false,
8
  "gradient_accumulation_steps": 16,
9
  "inference_device_iterations": 5,
10
- "inference_replication_factor": 4,
11
  "ipus_per_replica": 4,
12
  "layers_per_ipu": [
13
  0,
@@ -20,8 +20,8 @@
20
  "optimum_version": "1.5.1",
21
  "output_mode": "final",
22
  "recompute_checkpoint_every_layer": true,
23
- "replicated_tensor_sharding": true,
24
- "replication_factor": 4,
25
  "seed": 42,
26
  "sharded_execution_for_inference": false,
27
  "transformers_version": "4.20.1"
 
3
  "device_iterations": 2,
4
  "embedding_serialization_factor": 4,
5
  "enable_half_partials": true,
6
+ "executable_cache_dir": "/tmp/lmcache4/",
7
  "execute_encoder_on_cpu_for_generation": false,
8
  "gradient_accumulation_steps": 16,
9
  "inference_device_iterations": 5,
10
+ "inference_replication_factor": 1,
11
  "ipus_per_replica": 4,
12
  "layers_per_ipu": [
13
  0,
 
20
  "optimum_version": "1.5.1",
21
  "output_mode": "final",
22
  "recompute_checkpoint_every_layer": true,
23
+ "replicated_tensor_sharding": false,
24
+ "replication_factor": 1,
25
  "seed": 42,
26
  "sharded_execution_for_inference": false,
27
  "transformers_version": "4.20.1"
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c198b53f4c8c7a6525d3e27ecb5c7126b9c0916c930ad6cc8b357ec5a5cedb2
3
  size 261514473
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98be7a37645b50ad99a01b1d44d9ab4abd27738bff597b76c13b02edde1f3ed6
3
  size 261514473
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a773e48dabdb3e3091dec5107367123865bd42e1bcb30cc18ab8017a3fdb8f1d
3
  size 2735
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd0e8adb4537e66ff3c6649d9c805d0ef48c7c4c1b248b1512326c7a21ab9ed2
3
  size 2735