Create ipu_config.json
Browse files- ipu_config.json +18 -0
ipu_config.json
ADDED
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"recompute_checkpoint_every_layer": true,
|
3 |
+
"optimizer_state_offchip": true,
|
4 |
+
"replicated_tensor_sharding": true,
|
5 |
+
"enable_half_first_order_momentum": true,
|
6 |
+
"enable_half_partials": true,
|
7 |
+
|
8 |
+
"replication_factor": {"pod4": 1, "pod8": 2, "pod16": 4, "pod32": 8, "pod64": 16, "pod128": 32, "pod256": 64, "default": 1},
|
9 |
+
"gradient_accumulation_steps": 512,
|
10 |
+
"device_iterations": 1,
|
11 |
+
"executable_cache_dir": "./exe_cache",
|
12 |
+
|
13 |
+
"inference_device_iterations": 4,
|
14 |
+
"inference_replication_factor": {"pod4": 1, "pod8": 2, "pod16": 4, "pod32": 8, "pod64": 16, "pod128": 32, "pod256": 64, "default": 1},
|
15 |
+
"ipus_per_replica": 4,
|
16 |
+
"layers_per_ipu": [0, 4, 4, 4],
|
17 |
+
"matmul_proportion": [0.25, 0.25, 0.25, 0.25]
|
18 |
+
}
|