{
  "architectures": [
    "Emu3VisionVQModel"
  ],
  "attn_resolutions": [
    3
  ],
  "auto_map": {
    "AutoConfig": "configuration_emu3visionvq.Emu3VisionVQConfig",
    "AutoModel": "modeling_emu3visionvq.Emu3VisionVQModel"
  },
  "ch": 256,
  "ch_mult": [
    1,
    2,
    2,
    4
  ],
  "codebook_size": 32768,
  "double_z": false,
  "dropout": 0.0,
  "embed_dim": 4,
  "in_channels": 3,
  "model_type": "Emu3VisionVQ",
  "num_res_blocks": 2,
  "out_channels": 3,
  "temporal_downsample_factor": 4,
  "torch_dtype": "float32",
  "transformers_version": "4.44.0",
  "z_channels": 4
}