carlex3321 committed on
Commit
c3e13b4
·
verified ·
1 Parent(s): 814f463

Delete configs/generate_distributed.yaml

Browse files
Files changed (1) hide show
  1. configs/generate_distributed.yaml +0 -126
configs/generate_distributed.yaml DELETED
@@ -1,126 +0,0 @@
1
- __object__:
2
- path: generate_distributed
3
- name: VINCIEGenerator
4
-
5
- dit:
6
- model:
7
- __object__:
8
- path: models.dit.nadit
9
- name: NaDiT
10
- args: as_params
11
- vid_in_channels: 33
12
- vid_out_channels: 16
13
- vid_dim: 2560
14
- vid_out_norm: fusedrms
15
- txt_in_dim: 5120
16
- txt_in_norm: fusedln
17
- txt_dim: ${.vid_dim}
18
- emb_dim: ${eval:'6 * ${.vid_dim}'}
19
- heads: 20
20
- head_dim: 128
21
- expand_ratio: 4
22
- norm: fusedrms
23
- norm_eps: 1e-5
24
- ada: single
25
- qk_bias: False
26
- qk_rope: True
27
- qk_norm: fusedrms
28
- patch_size: [ 1,2,2 ]
29
- num_layers: 32 # llm-like
30
- mm_layers: 10
31
- mlp_type: swiglu
32
- block_type: mmdit
33
- msa_type: mm_full
34
- rope_type: mmrope3d
35
- rope_dim: 128
36
- compile: False
37
- gradient_checkpoint: True
38
- checkpoint: /app/ckpt/VINCIE-3B/dit.pth
39
- fsdp:
40
- sharding_strategy: _HYBRID_SHARD_ZERO2
41
- ema:
42
- decay: 0.9998
43
-
44
-
45
- vae:
46
- model:
47
- __inherit__: /app/models/vae/s8_c16_t4_inflation_sd3.yaml
48
- slicing:
49
- split_size:
50
- memory_device: same
51
- checkpoint: /app/ckpt/VINCIE-3B/vae.pth
52
- scaling_factor: 0.9152
53
- compile: False
54
- # grouping: True
55
- grouping: False
56
- dtype: bfloat16
57
-
58
-
59
- text:
60
- models:
61
- - type: llm14b
62
- path: /app/ckpt/VINCIE-3B/llm14b
63
- # path: llm14b
64
- max_length: 150
65
- layer: last
66
- mask: True
67
- dropout: 0.1
68
- compile: False
69
- dtype: bfloat16
70
- fsdp:
71
- enabled: True
72
- sharding_strategy: HYBRID_SHARD
73
-
74
- prompt_id_embedding:
75
- model:
76
- __object__:
77
- path: models.embedding.prompt_emb
78
- name: PromptEmbedding
79
- args: as_params
80
- max_num_prompts: 64 # max number of turns or prompts in a session
81
- embedding_dim: 5120
82
- fusion_strategy: seq_concat
83
- # fusion_strategy: dim_add
84
-
85
- diffusion:
86
- schedule:
87
- type: lerp
88
- T: 1000.0
89
- sampler:
90
- type: euler
91
- prediction_type: v_lerp
92
- timesteps:
93
- training:
94
- type: logitnormal
95
- loc: 0.0
96
- scale: 1.0
97
- sampling:
98
- type: uniform_trailing
99
- steps: 50
100
- shift: 12
101
- loss:
102
- type: v_lerp
103
- cfg:
104
- scale: 7.5
105
- rescale: 0
106
- partial: 1.0
107
-
108
- data:
109
- video:
110
- type: session_image
111
-
112
- generation:
113
- seed: 0
114
- aspect_ratio: keep_ratio
115
- resolution: 256
116
- fps: 2
117
- batch_size: 1
118
- sequence_parallel: 1
119
- repeat: 1
120
- use_img_placehoder: True
121
- output:
122
- dir: output/mse_bench
123
- filename: "{index}_turn{turn_index}_rep{repeat_index}_seed{seed}"
124
- positive_prompt:
125
- path: benchmark/mse_bench
126
- negative_prompt: "Worst quality, Normal quality, Low quality, Low res, Blurry, Jpeg artifacts, Grainy, text, logo, watermark, banner, extra digits, signature, subtitling, Bad anatomy, Bad proportions, Deformed, Disconnected limbs, Disfigured, Extra arms, Extra limbs, Extra hands, Fused fingers, Gross proportions, Long neck, Malformed limbs, Mutated, Mutated hands, Mutated limbs, Missing arms, Missing fingers, Poorly drawn hands, Poorly drawn face, Nsfw, Uncensored, Cleavage, Nude, Nipples, Overexposed, Plain background, Grainy, Underexposed, Deformed structures"