Skywork
/

UniPic2-Metaquery-9B

image-understanding

vision-language

Model card | Files and versions

UniPic2-Metaquery-9B / transformer / config.json

OrlandoHugBot's picture

Upload folder using huggingface_hub

31b4eeb verified 3 months ago

history blame contribute delete

593 Bytes

	{
	"_class_name": "SD3Transformer2DKontextModel",
	"_diffusers_version": "0.35.0.dev0",
	"_name_or_path": "stabilityai/stable-diffusion-3.5-medium",
	"attention_head_dim": 64,
	"caption_projection_dim": 1536,
	"dual_attention_layers": [
	0,
	1,
	2,
	3,
	4,
	5,
	6,
	7,
	8,
	9,
	10,
	11,
	12
	],
	"in_channels": 16,
	"joint_attention_dim": 4096,
	"num_attention_heads": 24,
	"num_layers": 24,
	"out_channels": 16,
	"patch_size": 2,
	"pooled_projection_dim": 2048,
	"pos_embed_max_size": 384,
	"qk_norm": "rms_norm",
	"sample_size": 128
	}