lifm
Browse files- lifm/FMiT-B2-16f8/config.json +28 -0
- lifm/FMiT-B2-16f8/diffusion_pytorch_model.safetensors +3 -0
- lifm/FMiT-B2-4f4/config.json +28 -0
- lifm/FMiT-B2-4f4/diffusion_pytorch_model.safetensors +3 -0
- lifm/FMiT-B4-4f4/config.json +28 -0
- lifm/FMiT-B4-4f4/diffusion_pytorch_model.safetensors +3 -0
- lifm/FMiT-L2-16f8/config.json +28 -0
- lifm/FMiT-L2-16f8/diffusion_pytorch_model.safetensors +3 -0
- lifm/FMiT-L2-4f4/config.json +28 -0
- lifm/FMiT-L2-4f4/diffusion_pytorch_model.safetensors +3 -0
- lifm/FMiT-L4-4f4/config.json +28 -0
- lifm/FMiT-L4-4f4/diffusion_pytorch_model.safetensors +3 -0
- lifm/FMiT-S2-16f8/config.json +28 -0
- lifm/FMiT-S2-16f8/diffusion_pytorch_model.safetensors +3 -0
- lifm/FMiT-S2-4f4/config.json +28 -0
- lifm/FMiT-S2-4f4/diffusion_pytorch_model.safetensors +3 -0
- lifm/FMiT-S4-4f4/config.json +28 -0
- lifm/FMiT-S4-4f4/diffusion_pytorch_model.safetensors +3 -0
- lifm/UNet-B-16f8/config.json +53 -0
- lifm/UNet-B-16f8/diffusion_pytorch_model.safetensors +3 -0
- lifm/UNet-B-4f4/config.json +53 -0
- lifm/UNet-B-4f4/diffusion_pytorch_model.safetensors +3 -0
- lifm/UNet-L-16f8/config.json +53 -0
- lifm/UNet-L-16f8/diffusion_pytorch_model.safetensors +3 -0
- lifm/UNet-L-4f4/config.json +53 -0
- lifm/UNet-L-4f4/diffusion_pytorch_model.safetensors +3 -0
- lifm/UNet-S-16f8/config.json +53 -0
- lifm/UNet-S-16f8/diffusion_pytorch_model.safetensors +3 -0
- lifm/UNet-S-4f4/config.json +53 -0
- lifm/UNet-S-4f4/diffusion_pytorch_model.safetensors +3 -0
lifm/FMiT-B2-16f8/config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegDiTTransformer2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_DiT-B_16f8_all_sv/checkpoint-940000/denoiser_ema",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"decay": 0.9999,
|
9 |
+
"dropout": 0.0,
|
10 |
+
"in_channels": 17,
|
11 |
+
"inv_gamma": 1.0,
|
12 |
+
"min_decay": 0.0,
|
13 |
+
"norm_elementwise_affine": false,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"norm_num_groups": 32,
|
16 |
+
"norm_type": "ada_norm_zero",
|
17 |
+
"num_attention_heads": 12,
|
18 |
+
"num_embeds_ada_norm": 1000,
|
19 |
+
"num_layers": 12,
|
20 |
+
"optimization_step": 60001,
|
21 |
+
"out_channels": 16,
|
22 |
+
"patch_size": 2,
|
23 |
+
"power": 0.6666666666666666,
|
24 |
+
"sample_size": 14,
|
25 |
+
"upcast_attention": false,
|
26 |
+
"update_after_step": 0,
|
27 |
+
"use_ema_warmup": false
|
28 |
+
}
|
lifm/FMiT-B2-16f8/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0aa62b399ab2f01a678f097edfbc4d758e8ed56c9f4f91f811c9ddafcfc77f5d
|
3 |
+
size 590045024
|
lifm/FMiT-B2-4f4/config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegDiTTransformer2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_DiT-B2_4f4_all_sv/checkpoint-980000/denoiser_ema",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"decay": 0.9999,
|
9 |
+
"dropout": 0.0,
|
10 |
+
"in_channels": 5,
|
11 |
+
"inv_gamma": 1.0,
|
12 |
+
"min_decay": 0.0,
|
13 |
+
"norm_elementwise_affine": false,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"norm_num_groups": 32,
|
16 |
+
"norm_type": "ada_norm_zero",
|
17 |
+
"num_attention_heads": 12,
|
18 |
+
"num_embeds_ada_norm": 1000,
|
19 |
+
"num_layers": 12,
|
20 |
+
"optimization_step": 20001,
|
21 |
+
"out_channels": 4,
|
22 |
+
"patch_size": 2,
|
23 |
+
"power": 0.6666666666666666,
|
24 |
+
"sample_size": 28,
|
25 |
+
"upcast_attention": false,
|
26 |
+
"update_after_step": 0,
|
27 |
+
"use_ema_warmup": false
|
28 |
+
}
|
lifm/FMiT-B2-4f4/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a90e1e62a1eac4602f989b98ed084bb7a201e17e5059e0f0b034ddb1e76633c
|
3 |
+
size 589749912
|
lifm/FMiT-B4-4f4/config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegDiTTransformer2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_DiT-B_4f4_all_sv/checkpoint-770000/denoiser_ema",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"decay": 0.9999,
|
9 |
+
"dropout": 0.0,
|
10 |
+
"in_channels": 5,
|
11 |
+
"inv_gamma": 1.0,
|
12 |
+
"min_decay": 0.0,
|
13 |
+
"norm_elementwise_affine": false,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"norm_num_groups": 32,
|
16 |
+
"norm_type": "ada_norm_zero",
|
17 |
+
"num_attention_heads": 12,
|
18 |
+
"num_embeds_ada_norm": 1000,
|
19 |
+
"num_layers": 12,
|
20 |
+
"optimization_step": 230001,
|
21 |
+
"out_channels": 4,
|
22 |
+
"patch_size": 4,
|
23 |
+
"power": 0.6666666666666666,
|
24 |
+
"sample_size": 28,
|
25 |
+
"upcast_attention": false,
|
26 |
+
"update_after_step": 0,
|
27 |
+
"use_ema_warmup": false
|
28 |
+
}
|
lifm/FMiT-B4-4f4/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d5cd4aef5f3cdaef91c2f101297fbd8b8ebc6de07b4d70d88cb41f143e6a302
|
3 |
+
size 590081888
|
lifm/FMiT-L2-16f8/config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegDiTTransformer2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_DiT-L_16f8_all_sv/checkpoint-900000/denoiser_ema",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"decay": 0.9999,
|
9 |
+
"dropout": 0.0,
|
10 |
+
"in_channels": 17,
|
11 |
+
"inv_gamma": 1.0,
|
12 |
+
"min_decay": 0.0,
|
13 |
+
"norm_elementwise_affine": false,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"norm_num_groups": 32,
|
16 |
+
"norm_type": "ada_norm_zero",
|
17 |
+
"num_attention_heads": 16,
|
18 |
+
"num_embeds_ada_norm": 1000,
|
19 |
+
"num_layers": 24,
|
20 |
+
"optimization_step": 100001,
|
21 |
+
"out_channels": 16,
|
22 |
+
"patch_size": 2,
|
23 |
+
"power": 0.6666666666666666,
|
24 |
+
"sample_size": 14,
|
25 |
+
"upcast_attention": false,
|
26 |
+
"update_after_step": 0,
|
27 |
+
"use_ema_warmup": false
|
28 |
+
}
|
lifm/FMiT-L2-16f8/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08e3d422eeb42b45dcb237983942d28c94012235760c2828de571c3c0ee44dfa
|
3 |
+
size 2046838968
|
lifm/FMiT-L2-4f4/config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegDiTTransformer2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_DiT-L2_4f4_all_sv/checkpoint-960000/denoiser_ema",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"decay": 0.9999,
|
9 |
+
"dropout": 0.0,
|
10 |
+
"in_channels": 5,
|
11 |
+
"inv_gamma": 1.0,
|
12 |
+
"min_decay": 0.0,
|
13 |
+
"norm_elementwise_affine": false,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"norm_num_groups": 32,
|
16 |
+
"norm_type": "ada_norm_zero",
|
17 |
+
"num_attention_heads": 16,
|
18 |
+
"num_embeds_ada_norm": 1000,
|
19 |
+
"num_layers": 24,
|
20 |
+
"optimization_step": 40001,
|
21 |
+
"out_channels": 4,
|
22 |
+
"patch_size": 2,
|
23 |
+
"power": 0.6666666666666666,
|
24 |
+
"sample_size": 14,
|
25 |
+
"upcast_attention": false,
|
26 |
+
"update_after_step": 0,
|
27 |
+
"use_ema_warmup": false
|
28 |
+
}
|
lifm/FMiT-L2-4f4/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc0fadec1c5a03108d06940d5e1d9f9b5adee9cddbb2200bc4691ade9c5dd88d
|
3 |
+
size 2046445560
|
lifm/FMiT-L4-4f4/config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegDiTTransformer2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_DiT-L_4f4_all_sv/checkpoint-900000/denoiser_ema",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"decay": 0.9999,
|
9 |
+
"dropout": 0.0,
|
10 |
+
"in_channels": 5,
|
11 |
+
"inv_gamma": 1.0,
|
12 |
+
"min_decay": 0.0,
|
13 |
+
"norm_elementwise_affine": false,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"norm_num_groups": 32,
|
16 |
+
"norm_type": "ada_norm_zero",
|
17 |
+
"num_attention_heads": 16,
|
18 |
+
"num_embeds_ada_norm": 1000,
|
19 |
+
"num_layers": 24,
|
20 |
+
"optimization_step": 100001,
|
21 |
+
"out_channels": 4,
|
22 |
+
"patch_size": 4,
|
23 |
+
"power": 0.6666666666666666,
|
24 |
+
"sample_size": 14,
|
25 |
+
"upcast_attention": false,
|
26 |
+
"update_after_step": 0,
|
27 |
+
"use_ema_warmup": false
|
28 |
+
}
|
lifm/FMiT-L4-4f4/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88275ef78c4697e40b355fd87e8eee015df8ad009e6f78404fcebc644f0dda5a
|
3 |
+
size 2046888120
|
lifm/FMiT-S2-16f8/config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegDiTTransformer2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_DiT-S_16f8_all_sv/checkpoint-550000/denoiser_ema",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"decay": 0.9999,
|
9 |
+
"dropout": 0.0,
|
10 |
+
"in_channels": 17,
|
11 |
+
"inv_gamma": 1.0,
|
12 |
+
"min_decay": 0.0,
|
13 |
+
"norm_elementwise_affine": false,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"norm_num_groups": 32,
|
16 |
+
"norm_type": "ada_norm_zero",
|
17 |
+
"num_attention_heads": 6,
|
18 |
+
"num_embeds_ada_norm": 1000,
|
19 |
+
"num_layers": 12,
|
20 |
+
"optimization_step": 450001,
|
21 |
+
"out_channels": 16,
|
22 |
+
"patch_size": 2,
|
23 |
+
"power": 0.6666666666666666,
|
24 |
+
"sample_size": 14,
|
25 |
+
"upcast_attention": false,
|
26 |
+
"update_after_step": 0,
|
27 |
+
"use_ema_warmup": false
|
28 |
+
}
|
lifm/FMiT-S2-16f8/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d163609e13854f091d8d6ad0052d86be0932e8a72cec19cfcdc394a171ebe3d
|
3 |
+
size 159376504
|
lifm/FMiT-S2-4f4/config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegDiTTransformer2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_DiT-S2_4f4_all_sv/checkpoint-720000/denoiser_ema",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"decay": 0.9999,
|
9 |
+
"dropout": 0.0,
|
10 |
+
"in_channels": 5,
|
11 |
+
"inv_gamma": 1.0,
|
12 |
+
"min_decay": 0.0,
|
13 |
+
"norm_elementwise_affine": false,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"norm_num_groups": 32,
|
16 |
+
"norm_type": "ada_norm_zero",
|
17 |
+
"num_attention_heads": 6,
|
18 |
+
"num_embeds_ada_norm": 1000,
|
19 |
+
"num_layers": 12,
|
20 |
+
"optimization_step": 280001,
|
21 |
+
"out_channels": 4,
|
22 |
+
"patch_size": 2,
|
23 |
+
"power": 0.6666666666666666,
|
24 |
+
"sample_size": 28,
|
25 |
+
"upcast_attention": false,
|
26 |
+
"update_after_step": 0,
|
27 |
+
"use_ema_warmup": false
|
28 |
+
}
|
lifm/FMiT-S2-4f4/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19bbc36db1b9de7732b0629056aa689a0d6df329222a3bdb953d5e5d9469316c
|
3 |
+
size 159228848
|
lifm/FMiT-S4-4f4/config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegDiTTransformer2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_DiT-S_4f4_all_sv/checkpoint-540000/denoiser_ema",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"decay": 0.9999,
|
9 |
+
"dropout": 0.0,
|
10 |
+
"in_channels": 5,
|
11 |
+
"inv_gamma": 1.0,
|
12 |
+
"min_decay": 0.0,
|
13 |
+
"norm_elementwise_affine": false,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"norm_num_groups": 32,
|
16 |
+
"norm_type": "ada_norm_zero",
|
17 |
+
"num_attention_heads": 6,
|
18 |
+
"num_embeds_ada_norm": 1000,
|
19 |
+
"num_layers": 12,
|
20 |
+
"optimization_step": 460001,
|
21 |
+
"out_channels": 4,
|
22 |
+
"patch_size": 4,
|
23 |
+
"power": 0.6666666666666666,
|
24 |
+
"sample_size": 28,
|
25 |
+
"upcast_attention": false,
|
26 |
+
"update_after_step": 0,
|
27 |
+
"use_ema_warmup": false
|
28 |
+
}
|
lifm/FMiT-S4-4f4/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59aacefc34342777f73a29e5b10537f070bbc2418cbd9907e00063771ccb6946
|
3 |
+
size 159394936
|
lifm/UNet-B-16f8/config.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegUnet2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_UNet-B_16f8_all_sv/checkpoint-780000/denoiser_ema",
|
5 |
+
"act_fn": "silu",
|
6 |
+
"add_attention": true,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"attn_norm_num_groups": null,
|
9 |
+
"block_out_channels": [
|
10 |
+
160,
|
11 |
+
320,
|
12 |
+
480,
|
13 |
+
640
|
14 |
+
],
|
15 |
+
"center_input_sample": false,
|
16 |
+
"class_embed_type": "timestep",
|
17 |
+
"decay": 0.9999,
|
18 |
+
"down_block_types": [
|
19 |
+
"AttnDownBlock2D",
|
20 |
+
"AttnDownBlock2D",
|
21 |
+
"AttnDownBlock2D",
|
22 |
+
"DownBlock2D"
|
23 |
+
],
|
24 |
+
"downsample_padding": 1,
|
25 |
+
"downsample_type": "resnet",
|
26 |
+
"dropout": 0.0,
|
27 |
+
"flip_sin_to_cos": true,
|
28 |
+
"freq_shift": 0,
|
29 |
+
"in_channels": 17,
|
30 |
+
"inv_gamma": 1.0,
|
31 |
+
"layers_per_block": 2,
|
32 |
+
"mid_block_scale_factor": 1,
|
33 |
+
"min_decay": 0.0,
|
34 |
+
"norm_eps": 1e-05,
|
35 |
+
"norm_num_groups": 32,
|
36 |
+
"num_class_embeds": null,
|
37 |
+
"num_train_timesteps": null,
|
38 |
+
"optimization_step": 220001,
|
39 |
+
"out_channels": 16,
|
40 |
+
"power": 0.6666666666666666,
|
41 |
+
"resnet_time_scale_shift": "default",
|
42 |
+
"sample_size": 28,
|
43 |
+
"time_embedding_type": "positional",
|
44 |
+
"up_block_types": [
|
45 |
+
"UpBlock2D",
|
46 |
+
"AttnUpBlock2D",
|
47 |
+
"AttnUpBlock2D",
|
48 |
+
"AttnUpBlock2D"
|
49 |
+
],
|
50 |
+
"update_after_step": 0,
|
51 |
+
"upsample_type": "resnet",
|
52 |
+
"use_ema_warmup": false
|
53 |
+
}
|
lifm/UNet-B-16f8/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b283951444625491a147db32818675f2b72fbcc3efe2977308a85f66b3e7674
|
3 |
+
size 560371312
|
lifm/UNet-B-4f4/config.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegUnet2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_UNet-B_4f4_all_sv/checkpoint-900000/denoiser_ema",
|
5 |
+
"act_fn": "silu",
|
6 |
+
"add_attention": true,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"attn_norm_num_groups": null,
|
9 |
+
"block_out_channels": [
|
10 |
+
160,
|
11 |
+
320,
|
12 |
+
480,
|
13 |
+
640
|
14 |
+
],
|
15 |
+
"center_input_sample": false,
|
16 |
+
"class_embed_type": "timestep",
|
17 |
+
"decay": 0.9999,
|
18 |
+
"down_block_types": [
|
19 |
+
"AttnDownBlock2D",
|
20 |
+
"AttnDownBlock2D",
|
21 |
+
"AttnDownBlock2D",
|
22 |
+
"DownBlock2D"
|
23 |
+
],
|
24 |
+
"downsample_padding": 1,
|
25 |
+
"downsample_type": "resnet",
|
26 |
+
"dropout": 0.0,
|
27 |
+
"flip_sin_to_cos": true,
|
28 |
+
"freq_shift": 0,
|
29 |
+
"in_channels": 5,
|
30 |
+
"inv_gamma": 1.0,
|
31 |
+
"layers_per_block": 2,
|
32 |
+
"mid_block_scale_factor": 1,
|
33 |
+
"min_decay": 0.0,
|
34 |
+
"norm_eps": 1e-05,
|
35 |
+
"norm_num_groups": 32,
|
36 |
+
"num_class_embeds": null,
|
37 |
+
"num_train_timesteps": null,
|
38 |
+
"optimization_step": 100001,
|
39 |
+
"out_channels": 4,
|
40 |
+
"power": 0.6666666666666666,
|
41 |
+
"resnet_time_scale_shift": "default",
|
42 |
+
"sample_size": 28,
|
43 |
+
"time_embedding_type": "positional",
|
44 |
+
"up_block_types": [
|
45 |
+
"UpBlock2D",
|
46 |
+
"AttnUpBlock2D",
|
47 |
+
"AttnUpBlock2D",
|
48 |
+
"AttnUpBlock2D"
|
49 |
+
],
|
50 |
+
"update_after_step": 0,
|
51 |
+
"upsample_type": "resnet",
|
52 |
+
"use_ema_warmup": false
|
53 |
+
}
|
lifm/UNet-B-4f4/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20bba15f4e2a446ea961eb0d1f797edd329bc55ab2589530b826d5c6ce531e19
|
3 |
+
size 560233024
|
lifm/UNet-L-16f8/config.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegUnet2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_UNet-L_16f8_all_sv/checkpoint-940000/denoiser_ema",
|
5 |
+
"act_fn": "silu",
|
6 |
+
"add_attention": true,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"attn_norm_num_groups": null,
|
9 |
+
"block_out_channels": [
|
10 |
+
320,
|
11 |
+
640,
|
12 |
+
960,
|
13 |
+
1280
|
14 |
+
],
|
15 |
+
"center_input_sample": false,
|
16 |
+
"class_embed_type": "timestep",
|
17 |
+
"decay": 0.9999,
|
18 |
+
"down_block_types": [
|
19 |
+
"AttnDownBlock2D",
|
20 |
+
"AttnDownBlock2D",
|
21 |
+
"AttnDownBlock2D",
|
22 |
+
"DownBlock2D"
|
23 |
+
],
|
24 |
+
"downsample_padding": 1,
|
25 |
+
"downsample_type": "resnet",
|
26 |
+
"dropout": 0.0,
|
27 |
+
"flip_sin_to_cos": true,
|
28 |
+
"freq_shift": 0,
|
29 |
+
"in_channels": 17,
|
30 |
+
"inv_gamma": 1.0,
|
31 |
+
"layers_per_block": 2,
|
32 |
+
"mid_block_scale_factor": 1,
|
33 |
+
"min_decay": 0.0,
|
34 |
+
"norm_eps": 1e-05,
|
35 |
+
"norm_num_groups": 32,
|
36 |
+
"num_class_embeds": null,
|
37 |
+
"num_train_timesteps": null,
|
38 |
+
"optimization_step": 60001,
|
39 |
+
"out_channels": 16,
|
40 |
+
"power": 0.6666666666666666,
|
41 |
+
"resnet_time_scale_shift": "default",
|
42 |
+
"sample_size": 28,
|
43 |
+
"time_embedding_type": "positional",
|
44 |
+
"up_block_types": [
|
45 |
+
"UpBlock2D",
|
46 |
+
"AttnUpBlock2D",
|
47 |
+
"AttnUpBlock2D",
|
48 |
+
"AttnUpBlock2D"
|
49 |
+
],
|
50 |
+
"update_after_step": 0,
|
51 |
+
"upsample_type": "resnet",
|
52 |
+
"use_ema_warmup": false
|
53 |
+
}
|
lifm/UNet-L-16f8/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:609b1d75c10ce40fb9487bdf9e1fa1c8bbfec17fc0c13534c876ad8199a2f2ac
|
3 |
+
size 2239924208
|
lifm/UNet-L-4f4/config.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegUnet2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_UNet-L_4f4_all_sv/checkpoint-960000/denoiser_ema",
|
5 |
+
"act_fn": "silu",
|
6 |
+
"add_attention": true,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"attn_norm_num_groups": null,
|
9 |
+
"block_out_channels": [
|
10 |
+
320,
|
11 |
+
640,
|
12 |
+
960,
|
13 |
+
1280
|
14 |
+
],
|
15 |
+
"center_input_sample": false,
|
16 |
+
"class_embed_type": "timestep",
|
17 |
+
"decay": 0.9999,
|
18 |
+
"down_block_types": [
|
19 |
+
"AttnDownBlock2D",
|
20 |
+
"AttnDownBlock2D",
|
21 |
+
"AttnDownBlock2D",
|
22 |
+
"DownBlock2D"
|
23 |
+
],
|
24 |
+
"downsample_padding": 1,
|
25 |
+
"downsample_type": "resnet",
|
26 |
+
"dropout": 0.0,
|
27 |
+
"flip_sin_to_cos": true,
|
28 |
+
"freq_shift": 0,
|
29 |
+
"in_channels": 5,
|
30 |
+
"inv_gamma": 1.0,
|
31 |
+
"layers_per_block": 2,
|
32 |
+
"mid_block_scale_factor": 1,
|
33 |
+
"min_decay": 0.0,
|
34 |
+
"norm_eps": 1e-05,
|
35 |
+
"norm_num_groups": 32,
|
36 |
+
"num_class_embeds": null,
|
37 |
+
"num_train_timesteps": null,
|
38 |
+
"optimization_step": 40001,
|
39 |
+
"out_channels": 4,
|
40 |
+
"power": 0.6666666666666666,
|
41 |
+
"resnet_time_scale_shift": "default",
|
42 |
+
"sample_size": 28,
|
43 |
+
"time_embedding_type": "positional",
|
44 |
+
"up_block_types": [
|
45 |
+
"UpBlock2D",
|
46 |
+
"AttnUpBlock2D",
|
47 |
+
"AttnUpBlock2D",
|
48 |
+
"AttnUpBlock2D"
|
49 |
+
],
|
50 |
+
"update_after_step": 0,
|
51 |
+
"upsample_type": "resnet",
|
52 |
+
"use_ema_warmup": false
|
53 |
+
}
|
lifm/UNet-L-4f4/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a184c77f1d8acb459966c953b9876e95179196753bc99ca7eff6aeb37b285157
|
3 |
+
size 2239647672
|
lifm/UNet-S-16f8/config.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegUnet2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_UNet-S_16f8_all_sv/checkpoint-810000/denoiser_ema",
|
5 |
+
"act_fn": "silu",
|
6 |
+
"add_attention": true,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"attn_norm_num_groups": null,
|
9 |
+
"block_out_channels": [
|
10 |
+
96,
|
11 |
+
192,
|
12 |
+
288,
|
13 |
+
384
|
14 |
+
],
|
15 |
+
"center_input_sample": false,
|
16 |
+
"class_embed_type": "timestep",
|
17 |
+
"decay": 0.9999,
|
18 |
+
"down_block_types": [
|
19 |
+
"AttnDownBlock2D",
|
20 |
+
"AttnDownBlock2D",
|
21 |
+
"AttnDownBlock2D",
|
22 |
+
"DownBlock2D"
|
23 |
+
],
|
24 |
+
"downsample_padding": 1,
|
25 |
+
"downsample_type": "resnet",
|
26 |
+
"dropout": 0.0,
|
27 |
+
"flip_sin_to_cos": true,
|
28 |
+
"freq_shift": 0,
|
29 |
+
"in_channels": 17,
|
30 |
+
"inv_gamma": 1.0,
|
31 |
+
"layers_per_block": 2,
|
32 |
+
"mid_block_scale_factor": 1,
|
33 |
+
"min_decay": 0.0,
|
34 |
+
"norm_eps": 1e-05,
|
35 |
+
"norm_num_groups": 32,
|
36 |
+
"num_class_embeds": null,
|
37 |
+
"num_train_timesteps": null,
|
38 |
+
"optimization_step": 190001,
|
39 |
+
"out_channels": 16,
|
40 |
+
"power": 0.6666666666666666,
|
41 |
+
"resnet_time_scale_shift": "default",
|
42 |
+
"sample_size": 28,
|
43 |
+
"time_embedding_type": "positional",
|
44 |
+
"up_block_types": [
|
45 |
+
"UpBlock2D",
|
46 |
+
"AttnUpBlock2D",
|
47 |
+
"AttnUpBlock2D",
|
48 |
+
"AttnUpBlock2D"
|
49 |
+
],
|
50 |
+
"update_after_step": 0,
|
51 |
+
"upsample_type": "resnet",
|
52 |
+
"use_ema_warmup": false
|
53 |
+
}
|
lifm/UNet-S-16f8/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:664eebd04bb2519bc2d9010390d2042e41ad3050ba3d03daf2911509fb1942b2
|
3 |
+
size 201935064
|
lifm/UNet-S-4f4/config.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "SegUnet2DModel",
|
3 |
+
"_diffusers_version": "0.30.3",
|
4 |
+
"_name_or_path": "experiments/lifm_UNet-S_4f4_all_sv/checkpoint-910000/denoiser_ema",
|
5 |
+
"act_fn": "silu",
|
6 |
+
"add_attention": true,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"attn_norm_num_groups": null,
|
9 |
+
"block_out_channels": [
|
10 |
+
96,
|
11 |
+
192,
|
12 |
+
288,
|
13 |
+
384
|
14 |
+
],
|
15 |
+
"center_input_sample": false,
|
16 |
+
"class_embed_type": "timestep",
|
17 |
+
"decay": 0.9999,
|
18 |
+
"down_block_types": [
|
19 |
+
"AttnDownBlock2D",
|
20 |
+
"AttnDownBlock2D",
|
21 |
+
"AttnDownBlock2D",
|
22 |
+
"DownBlock2D"
|
23 |
+
],
|
24 |
+
"downsample_padding": 1,
|
25 |
+
"downsample_type": "resnet",
|
26 |
+
"dropout": 0.0,
|
27 |
+
"flip_sin_to_cos": true,
|
28 |
+
"freq_shift": 0,
|
29 |
+
"in_channels": 5,
|
30 |
+
"inv_gamma": 1.0,
|
31 |
+
"layers_per_block": 2,
|
32 |
+
"mid_block_scale_factor": 1,
|
33 |
+
"min_decay": 0.0,
|
34 |
+
"norm_eps": 1e-05,
|
35 |
+
"norm_num_groups": 32,
|
36 |
+
"num_class_embeds": null,
|
37 |
+
"num_train_timesteps": null,
|
38 |
+
"optimization_step": 90001,
|
39 |
+
"out_channels": 4,
|
40 |
+
"power": 0.6666666666666666,
|
41 |
+
"resnet_time_scale_shift": "default",
|
42 |
+
"sample_size": 28,
|
43 |
+
"time_embedding_type": "positional",
|
44 |
+
"up_block_types": [
|
45 |
+
"UpBlock2D",
|
46 |
+
"AttnUpBlock2D",
|
47 |
+
"AttnUpBlock2D",
|
48 |
+
"AttnUpBlock2D"
|
49 |
+
],
|
50 |
+
"update_after_step": 0,
|
51 |
+
"upsample_type": "resnet",
|
52 |
+
"use_ema_warmup": false
|
53 |
+
}
|
lifm/UNet-S-4f4/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da1ec23a62a00b86a146f78b736566a129f2c6e97656c2d33975f79fb76ae768
|
3 |
+
size 201852056
|