add use_full_z_range flag, fix vae missing key warnings
Browse files- README.md +2 -2
- model_index.json +1 -0
- vae/config.json +4 -0
README.md
CHANGED
@@ -14,8 +14,8 @@ tags:
|
|
14 |
# Marigold Normals (LCM) Model Card
|
15 |
|
16 |
This model belongs to the family of diffusion-based Marigold models for solving various computer vision tasks.
|
17 |
-
The Marigold Normals model focuses on the surface normals task.
|
18 |
-
It takes an input image and computes surface normals in each pixel.
|
19 |
The LCM stands for Latent Consistency Models, which is a technique for making the diffusion model fast.
|
20 |
The Marigold Normals model is trained from Stable Diffusion with synthetic data, and the LCM model is further fine-tuned from it.
|
21 |
Thanks to the rich visual knowledge stored in Stable Diffusion, Marigold models possess deep scene understanding and excel at solving computer vision tasks.
|
|
|
14 |
# Marigold Normals (LCM) Model Card
|
15 |
|
16 |
This model belongs to the family of diffusion-based Marigold models for solving various computer vision tasks.
|
17 |
+
The Marigold Normals model focuses on the surface normals task.
|
18 |
+
It takes an input image and computes surface normals in each pixel.
|
19 |
The LCM stands for Latent Consistency Models, which is a technique for making the diffusion model fast.
|
20 |
The Marigold Normals model is trained from Stable Diffusion with synthetic data, and the LCM model is further fine-tuned from it.
|
21 |
Thanks to the rich visual knowledge stored in Stable Diffusion, Marigold models possess deep scene understanding and excel at solving computer vision tasks.
|
model_index.json
CHANGED
@@ -1,6 +1,7 @@
|
|
1 |
{
|
2 |
"_class_name":"MarigoldPipeline",
|
3 |
"_diffusers_version":"0.24.0",
|
|
|
4 |
"unet":[
|
5 |
"diffusers",
|
6 |
"UNet2DConditionModel"
|
|
|
1 |
{
|
2 |
"_class_name":"MarigoldPipeline",
|
3 |
"_diffusers_version":"0.24.0",
|
4 |
+
"use_full_z_range": true,
|
5 |
"unet":[
|
6 |
"diffusers",
|
7 |
"UNet2DConditionModel"
|
vae/config.json
CHANGED
@@ -15,12 +15,16 @@
|
|
15 |
"DownEncoderBlock2D",
|
16 |
"DownEncoderBlock2D"
|
17 |
],
|
|
|
18 |
"in_channels": 3,
|
19 |
"latent_channels": 4,
|
|
|
|
|
20 |
"layers_per_block": 2,
|
21 |
"norm_num_groups": 32,
|
22 |
"out_channels": 3,
|
23 |
"sample_size": 768,
|
|
|
24 |
"up_block_types": [
|
25 |
"UpDecoderBlock2D",
|
26 |
"UpDecoderBlock2D",
|
|
|
15 |
"DownEncoderBlock2D",
|
16 |
"DownEncoderBlock2D"
|
17 |
],
|
18 |
+
"force_upcast": true,
|
19 |
"in_channels": 3,
|
20 |
"latent_channels": 4,
|
21 |
+
"latents_mean": null,
|
22 |
+
"latents_std": null,
|
23 |
"layers_per_block": 2,
|
24 |
"norm_num_groups": 32,
|
25 |
"out_channels": 3,
|
26 |
"sample_size": 768,
|
27 |
+
"scaling_factor": 0.18215,
|
28 |
"up_block_types": [
|
29 |
"UpDecoderBlock2D",
|
30 |
"UpDecoderBlock2D",
|