Push trained VAE model
Browse files
- README.md +3 -0
- pytorch_model.bin +3 -0
- vae_config.json +29 -0
README.md
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
# Transfusion VAE
|
2 |
+
|
3 |
+
A UNet-style VAE trained on CC3M with adversarial and perceptual losses.
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bccf2a2abec6b609f2a3afe0024dd852e48d6d0dcf82c9677b15062f64bed9c3
|
3 |
+
size 322243354
|
vae_config.json
ADDED
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"image_size": 256,
|
3 |
+
"in_channels": 3,
|
4 |
+
"out_channels": 3,
|
5 |
+
"hidden_channels": 128,
|
6 |
+
"num_res_blocks": 3,
|
7 |
+
"channel_multipliers": [
|
8 |
+
1,
|
9 |
+
2,
|
10 |
+
2,
|
11 |
+
4,
|
12 |
+
4
|
13 |
+
],
|
14 |
+
"attention_resolutions": [
|
15 |
+
32
|
16 |
+
],
|
17 |
+
"dropout": 0.0,
|
18 |
+
"use_checkpoint": false,
|
19 |
+
"use_fp16": false,
|
20 |
+
"resblock_updown": true,
|
21 |
+
"z_channels": 8,
|
22 |
+
"double_z": true,
|
23 |
+
"λ_recon": 1.0,
|
24 |
+
"λ_kl": 1e-6,
|
25 |
+
"λ_lpips": 1.0,
|
26 |
+
"λ_id": 0.1,
|
27 |
+
"λ_gan": 0.5,
|
28 |
+
"gan_start_step": 50000
|
29 |
+
}
|