Create ipu_config.json
Browse files- ipu_config.json +18 -0
ipu_config.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"recompute_checkpoint_every_layer": true,
|
| 3 |
+
"optimizer_state_offchip": true,
|
| 4 |
+
"replicated_tensor_sharding": true,
|
| 5 |
+
"enable_half_first_order_momentum": true,
|
| 6 |
+
"enable_half_partials": true,
|
| 7 |
+
|
| 8 |
+
"replication_factor": {"pod4": 1, "pod8": 2, "pod16": 4, "pod32": 8, "pod64": 16, "pod128": 32, "pod256": 64, "default": 1},
|
| 9 |
+
"gradient_accumulation_steps": 512,
|
| 10 |
+
"device_iterations": 1,
|
| 11 |
+
"executable_cache_dir": "./exe_cache",
|
| 12 |
+
|
| 13 |
+
"inference_device_iterations": 4,
|
| 14 |
+
"inference_replication_factor": {"pod4": 1, "pod8": 2, "pod16": 4, "pod32": 8, "pod64": 16, "pod128": 32, "pod256": 64, "default": 1},
|
| 15 |
+
"ipus_per_replica": 4,
|
| 16 |
+
"layers_per_ipu": [0, 4, 4, 4],
|
| 17 |
+
"matmul_proportion": [0.25, 0.25, 0.25, 0.25]
|
| 18 |
+
}
|