-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathconfig_imagenet.yaml
64 lines (64 loc) · 2.09 KB
/
config_imagenet.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
# Class-conditional ImageNet model configuration.
#
# Each component is described by a `target` (dotted path to a class) and a
# `params` mapping. Presumably the consumer imports `target` and passes
# `params` to it -- confirm against the config loader.
#
# NOTE(review): `content_emb_config.params.spatial_size` carries the
# PyYAML-specific `!!python/tuple` tag, which safe loaders reject; the file
# must be read with a loader that accepts that tag.
model:
  params:
    # Batch keys for the conditioning signal and the content
    # (assumed to be dataset field names -- TODO confirm).
    condition_info:
      key: label
    content_codec_config:
      params:
        ckpt_path: OUTPUT/pretrained_model/taming_dvae/vqgan_imagenet_f16_16384.pth
        config_path: OUTPUT/pretrained_model/taming_dvae/vqgan_imagenet_f16_16384.yaml
        mapping_path: ./help_folder/statistics/taming_vqvae_974.pt
        num_tokens: 16384
        # Same value as content_emb_config.params.num_embed and the "974"
        # in mapping_path; keep the three in sync.
        quantize_number: 974
        token_shape: [16, 16]
        trainable: false
      target: image_synthesis.modeling.codecs.image_codec.taming_gumbel_vqvae.TamingVQVAE
    content_info:
      key: image
    diffusion_config:
      params:
        adaptive_auxiliary_loss: true
        alpha_init_type: alpha1
        auxiliary_loss_weight: 0.001
        condition_emb_config:
          params:
            embed_dim: 512  # same value as transformer_config.params.n_embd
            identity: true
            num_embed: 1000  # same value as transformer_config.params.class_number
          target: image_synthesis.modeling.embeddings.class_embedding.ClassEmbedding
        content_emb_config:
          params:
            embed_dim: 512  # same value as transformer_config.params.n_embd
            num_embed: 974  # same value as content_codec_config.params.quantize_number
            pos_emb_type: embedding
            # NOTE(review): 32 x 32 here, while token_shape and
            # content_spatial_size are 16 x 16 -- confirm this is intended.
            spatial_size: !!python/tuple [32, 32]
            trainable: true
          target: image_synthesis.modeling.embeddings.dalle_mask_image_embedding.DalleMaskImageEmbedding
        diffusion_step: 100
        mask_weight: [1, 1]
        transformer_config:
          params:
            attn_pdrop: 0.0
            attn_type: selfcondition
            block_activate: GELU2
            class_number: 1000
            class_type: adalayernorm
            content_seq_len: 256  # 16 x 16, the product of content_spatial_size
            content_spatial_size: [16, 16]
            mlp_hidden_times: 4
            mlp_type: conv_mlp
            n_embd: 512
            n_head: 16
            n_layer: 24
            resid_pdrop: 0.0
            timestep_type: adalayernorm
          target: image_synthesis.modeling.transformers.transformer_utils.Condition2ImageTransformer
      target: image_synthesis.modeling.transformers.diffusion_transformer.DiffusionTransformer
  target: image_synthesis.modeling.models.conditional_dalle.C_DALLE