37 lines
834 B
Python
37 lines
834 B
Python
# Module-level switch read by whatever consumes this config.
# NOTE(review): the name suggests a text -> image -> video pipeline in which
# the image stage uses the FLUX settings in this file; confirm with the caller.
use_t2i2v = True
|
|
|
|
# flux configurations
# Keyword settings for the image model. "type" selects the implementation and
# "from_pretrained" is the checkpoint path, relative to the working directory.
# NOTE(review): how the remaining keys are consumed (presumably forwarded to
# the model constructor) is not visible here; confirm against the builder.
img_flux = dict(
    type="flux",
    from_pretrained="./ckpts/flux1-dev.safetensors",
    guidance_embed=True,
    # model architecture
    in_channels=64,
    vec_in_dim=768,
    context_in_dim=4096,
    hidden_size=3072,
    mlp_ratio=4.0,
    num_heads=24,
    depth=19,
    depth_single_blocks=38,
    # 16 + 56 + 56 = 128 = hidden_size / num_heads (3072 / 24); presumably
    # the per-head dimension split across positional axes - verify.
    axes_dim=[16, 56, 56],
    theta=10_000,
    qkv_bias=True,
    # cond_embed passes i2v & v2v info; for t2v this layer is needed too, but
    # with x_cond and mask all set to 0.
    cond_embed=False,
)
|
|
|
|
# Keyword settings for the 2D autoencoder whose checkpoint is
# flux1-dev-ae.safetensors. "type" selects the implementation and
# "from_pretrained" is the checkpoint path, relative to the working directory.
# NOTE(review): the exact role of scale_factor / shift_factor (presumably
# latent normalisation constants) is not visible here; confirm in the model.
img_flux_ae = dict(
    type="autoencoder_2d",
    from_pretrained="./ckpts/flux1-dev-ae.safetensors",
    resolution=256,
    in_channels=3,
    ch=128,
    out_ch=3,
    ch_mult=[1, 2, 4, 4],
    num_res_blocks=2,
    z_channels=16,
    scale_factor=0.3611,
    shift_factor=0.1159,
)
|
|
# Resolution label, stored as a string preset rather than a pixel tuple.
# NOTE(review): presumably the resolution used for the image stage; how the
# "768px" label maps to concrete height/width is defined elsewhere - confirm.
img_resolution = "768px"
|