graphcore-rahult committed on
Commit
be9523a
1 Parent(s): 2277132

Training in progress, step 500

Browse files
Files changed (3) hide show
  1. ipu_config.json +3 -3
  2. pytorch_model.bin +1 -1
  3. training_args.bin +1 -1
ipu_config.json CHANGED
@@ -7,7 +7,7 @@
7
  "execute_encoder_on_cpu_for_generation": false,
8
  "gradient_accumulation_steps": 32,
9
  "inference_device_iterations": 5,
10
- "inference_replication_factor": 1,
11
  "ipus_per_replica": 4,
12
  "layers_per_ipu": [
13
  0,
@@ -22,8 +22,8 @@
22
  "optimum_version": "1.5.1",
23
  "output_mode": "final",
24
  "recompute_checkpoint_every_layer": true,
25
- "replicated_tensor_sharding": false,
26
- "replication_factor": 1,
27
  "seed": 42,
28
  "sharded_execution_for_inference": false,
29
  "transformers_version": "4.20.1"
 
7
  "execute_encoder_on_cpu_for_generation": false,
8
  "gradient_accumulation_steps": 32,
9
  "inference_device_iterations": 5,
10
+ "inference_replication_factor": 4,
11
  "ipus_per_replica": 4,
12
  "layers_per_ipu": [
13
  0,
 
22
  "optimum_version": "1.5.1",
23
  "output_mode": "final",
24
  "recompute_checkpoint_every_layer": true,
25
+ "replicated_tensor_sharding": true,
26
+ "replication_factor": 4,
27
  "seed": 42,
28
  "sharded_execution_for_inference": false,
29
  "transformers_version": "4.20.1"
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1fc61a0b2e8677824d0f412b1a2b34ec64a41e76efad409b23a77eb2c9b941b0
3
  size 248181489
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37c8b1f11b6923d313b083ef49fb3126dece2213ab93b6fb6cb56b59220d5fdb
3
  size 248181489
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0fed49aff71d16a99fb12b3fa788766a5b8d9f715f2619e190ab8fe986b64ca
3
  size 2735
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:354a000e7b498833b02566e145ff807e39ae9f25840debc587c798c2f43ba390
3
  size 2735