File size: 484 Bytes
265a281
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
{
    "optimizer_state_offchip": true,
    "replicated_tensor_sharding": true,
    "enable_half_partials": true,

    "gradient_accumulation_steps": 16,
    "executable_cache_dir": "./exe_cache",

    "layers_per_ipu": [4, 4],
    "matmul_proportion": 0.6,
    "projection_serialization_factor": 4
}