aws-neuron
/

optimum-neuron-cache

Model card Files Files and versions Community

optimum-neuron-cache / neuronxcc-2.14.227.0+2d4f85be /MODULE_09efc8a8af0f17d5b6d1 /controlnet_0 /config.json

Jingya's picture

Jingya HF staff

Synchronizing local compiler cache.

89d090e verified 3 months ago

2.53 kB

	{
	"_class_name": "ControlNetModel",
	"_commit_hash": null,
	"_diffusers_version": "0.28.2",
	"_name_or_path": "lllyasviel/control_v11p_sd15_openpose",
	"_use_default_values": [
	"num_attention_heads",
	"transformer_layers_per_block",
	"mid_block_type",
	"addition_embed_type",
	"encoder_hid_dim",
	"encoder_hid_dim_type",
	"conditioning_channels",
	"addition_embed_type_num_heads",
	"global_pool_conditions",
	"addition_time_embed_dim"
	],
	"act_fn": "silu",
	"addition_embed_type": null,
	"addition_embed_type_num_heads": 64,
	"addition_time_embed_dim": null,
	"attention_head_dim": 8,
	"block_out_channels": [
	320,
	640,
	1280,
	1280
	],
	"class_embed_type": null,
	"conditioning_channels": 3,
	"conditioning_embedding_out_channels": [
	16,
	32,
	96,
	256
	],
	"controlnet_conditioning_channel_order": "rgb",
	"cross_attention_dim": 768,
	"down_block_types": [
	"CrossAttnDownBlock2D",
	"CrossAttnDownBlock2D",
	"CrossAttnDownBlock2D",
	"DownBlock2D"
	],
	"downsample_padding": 1,
	"encoder_hid_dim": null,
	"encoder_hid_dim_type": null,
	"flip_sin_to_cos": true,
	"freq_shift": 0,
	"global_pool_conditions": false,
	"in_channels": 4,
	"layers_per_block": 2,
	"mid_block_scale_factor": 1,
	"mid_block_type": "UNetMidBlock2DCrossAttn",
	"neuron": {
	"auto_cast": "matmul",
	"auto_cast_type": "bf16",
	"compiler_type": "neuronx-cc",
	"compiler_version": "2.14.227.0+2d4f85be",
	"dynamic_batch_size": false,
	"inline_weights_to_neff": true,
	"input_names": [
	"sample",
	"timestep",
	"encoder_hidden_states",
	"controlnet_cond",
	"conditioning_scale"
	],
	"model_type": "controlnet",
	"optlevel": "2",
	"output_attentions": false,
	"output_hidden_states": false,
	"output_names": [
	"down_block_res_samples",
	"mid_block_res_sample"
	],
	"static_batch_size": 1,
	"static_encoder_hidden_size": 768,
	"static_height": 64,
	"static_num_channels": 4,
	"static_sequence_length": 77,
	"static_vae_scale_factor": 8,
	"static_width": 64
	},
	"norm_eps": 1e-05,
	"norm_num_groups": 32,
	"num_attention_heads": null,
	"num_class_embeds": null,
	"only_cross_attention": false,
	"projection_class_embeddings_input_dim": null,
	"resnet_time_scale_shift": "default",
	"task": "semantic-segmentation",
	"transformer_layers_per_block": 1,
	"transformers_version": null,
	"upcast_attention": false,
	"use_linear_projection": false
	}