{ "architectures": [ "Emu3VisionVQModel" ], "attn_resolutions": [ 3 ], "auto_map": { "AutoConfig": "configuration_emu3visionvq.Emu3VisionVQConfig", "AutoModel": "modeling_emu3visionvq.Emu3VisionVQModel" }, "ch": 256, "ch_mult": [ 1, 2, 2, 4 ], "codebook_size": 32768, "double_z": false, "dropout": 0.0, "embed_dim": 4, "in_channels": 3, "model_type": "Emu3VisionVQ", "num_res_blocks": 2, "out_channels": 3, "temporal_downsample_factor": 4, "torch_dtype": "float32", "transformers_version": "4.44.0", "z_channels": 4 }