Graphcore
/

mt5-small-ipu

Model card Files Files and versions Community

mt5-small-ipu / ipu_config.json

mwizakunda's picture

Syntax fix

4c21729 over 1 year ago

history blame contribute delete

895 Bytes

	{
	"layers_per_ipu": [0, 8, 8, 0],
	"inference_layers_per_ipu": [0, 8, 8, 0],
	"embedding_serialization_factor": null,
	"serialized_embedding_splits_per_ipu": [4, 4, 0, 0],
	"projection_serialization_factor": 4,
	"matmul_proportion": 0.25,
	"inference_matmul_proportion": 0.6,
	"recompute_checkpoint_every_layer": true,
	"optimizer_state_offchip": true,
	"replicated_tensor_sharding": true,
	"device_iterations": 10,
	"gradient_accumulation_steps": 128,
	"executable_cache_dir": "./exe_cache"
	}