Upload folder using huggingface_hub
Browse files
- .gitattributes +1 -33
- .gitignore +4 -4
- LICENSE.md +5 -0
- README.md +21 -3
- models/baseline_unet/afhq/ckpt_epoch_200.pt +3 -0
- models/baseline_unet/afhq/config.yaml +37 -0
- models/baseline_unet/celeba_hq/ckpt_epoch_200.pt +3 -0
- models/baseline_unet/celeba_hq/config.yaml +37 -0
- models/baseline_unet/cifar10/ckpt_epoch_200.pt +3 -0
- models/baseline_unet/cifar10/config.yaml +33 -0
- models/baseline_unet/fashion_mnist/ckpt_epoch_200.pt +3 -0
- models/baseline_unet/fashion_mnist/config.yaml +36 -0
- models/baseline_unet/mnist/ckpt_epoch_200.pt +3 -0
- models/baseline_unet/mnist/config.yaml +36 -0
.gitattributes
CHANGED
|
@@ -1,35 +1,3 @@
|
|
| 1 |
-
*.7z filter=lfs diff=lfs merge=lfs -text
|
| 2 |
-
*.arrow filter=lfs diff=lfs merge=lfs -text
|
| 3 |
-
*.bin filter=lfs diff=lfs merge=lfs -text
|
| 4 |
-
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
| 5 |
-
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
-
*.ftz filter=lfs diff=lfs merge=lfs -text
|
| 7 |
-
*.gz filter=lfs diff=lfs merge=lfs -text
|
| 8 |
-
*.h5 filter=lfs diff=lfs merge=lfs -text
|
| 9 |
-
*.joblib filter=lfs diff=lfs merge=lfs -text
|
| 10 |
-
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
| 11 |
-
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
| 12 |
-
*.model filter=lfs diff=lfs merge=lfs -text
|
| 13 |
-
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
| 14 |
-
*.npy filter=lfs diff=lfs merge=lfs -text
|
| 15 |
-
*.npz filter=lfs diff=lfs merge=lfs -text
|
| 16 |
-
*.onnx filter=lfs diff=lfs merge=lfs -text
|
| 17 |
-
*.ot filter=lfs diff=lfs merge=lfs -text
|
| 18 |
-
*.parquet filter=lfs diff=lfs merge=lfs -text
|
| 19 |
-
*.pb filter=lfs diff=lfs merge=lfs -text
|
| 20 |
-
*.pickle filter=lfs diff=lfs merge=lfs -text
|
| 21 |
-
*.pkl filter=lfs diff=lfs merge=lfs -text
|
| 22 |
*.pt filter=lfs diff=lfs merge=lfs -text
|
| 23 |
-
*.pth filter=lfs diff=lfs merge=lfs -text
|
| 24 |
-
*.rar filter=lfs diff=lfs merge=lfs -text
|
| 25 |
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 26 |
-
|
| 27 |
-
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
-
*.tar filter=lfs diff=lfs merge=lfs -text
|
| 29 |
-
*.tflite filter=lfs diff=lfs merge=lfs -text
|
| 30 |
-
*.tgz filter=lfs diff=lfs merge=lfs -text
|
| 31 |
-
*.wasm filter=lfs diff=lfs merge=lfs -text
|
| 32 |
-
*.xz filter=lfs diff=lfs merge=lfs -text
|
| 33 |
-
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
-
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
-
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
*.pt filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
| 2 |
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
.gitignore
CHANGED
|
@@ -1,4 +1,4 @@
|
|
| 1 |
-
#
|
| 2 |
-
|
| 3 |
-
|
| 4 |
-
|
|
|
|
| 1 |
+
# Allow model weights
|
| 2 |
+
!*.pt
|
| 3 |
+
!*.ckpt
|
| 4 |
+
!*.safetensors
|
LICENSE.md
ADDED
|
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
**LICENSE**
|
| 2 |
+
Add whichever license you intend (MIT is common for baseline weights).
|
| 3 |
+
|
| 4 |
+
```bash
|
| 5 |
+
git add README.md LICENSE.md
```
|
README.md
CHANGED
|
@@ -1,3 +1,21 @@
|
|
| 1 |
-
|
| 2 |
-
|
| 3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Locality Diffusion Baselines
|
| 2 |
+
|
| 3 |
+
This repository contains pretrained **baseline model weights** used in:
|
| 4 |
+
|
| 5 |
+
*Locality in Image Diffusion Models Emerges from Data Statistics*
|
| 6 |
+
Artem Lukoianov et al., NeurIPS 2025.
|
| 7 |
+
|
| 8 |
+
## Structure
|
| 9 |
+
|
| 10 |
+
- `models/baseline_unet/` – baseline UNet models on multiple datasets
|
| 11 |
+
- `models/wiener/` – Wiener models
|
| 12 |
+
|
| 13 |
+
## Usage
|
| 14 |
+
|
| 15 |
+
```python
|
| 16 |
+
from huggingface_hub import hf_hub_download
|
| 17 |
+
|
| 18 |
+
path = hf_hub_download(
|
| 19 |
+
    repo_id="ottogin/locality-diffusion-baselines",
|
| 20 |
+
    filename="models/baseline_unet/cifar10/ckpt_epoch_200.pt"
|
| 21 |
+
)
```
|
models/baseline_unet/afhq/ckpt_epoch_200.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c228ee2946b689151ec091e784c2246d81243580c9b1176610ecd1a2f66f2bba
|
| 3 |
+
size 320613872
|
models/baseline_unet/afhq/config.yaml
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
T: 1000
|
| 2 |
+
attn: []
|
| 3 |
+
batch_size: 80
|
| 4 |
+
beta_1: 0.0001
|
| 5 |
+
beta_T: 0.02
|
| 6 |
+
channel: 128
|
| 7 |
+
channel_mult:
|
| 8 |
+
- 1
|
| 9 |
+
- 2
|
| 10 |
+
- 3
|
| 11 |
+
- 4
|
| 12 |
+
checkpoint_freq: 20
|
| 13 |
+
dataset_name: afhq
|
| 14 |
+
dataset_root: data/
|
| 15 |
+
device: cuda:0
|
| 16 |
+
dropout: 0.15
|
| 17 |
+
epoch: 200
|
| 18 |
+
eval_random_seed: 42
|
| 19 |
+
grad_clip: 1.0
|
| 20 |
+
img_size: 64
|
| 21 |
+
in_channels: 3
|
| 22 |
+
lr: 0.0001
|
| 23 |
+
model_type: unet
|
| 24 |
+
multiplier: 2.0
|
| 25 |
+
nrow: 8
|
| 26 |
+
num_res_blocks: 2
|
| 27 |
+
out_channels: 3
|
| 28 |
+
random_seed: 42
|
| 29 |
+
sample_freq: 20
|
| 30 |
+
sampledImgName: SampledNoGuidenceImgs.png
|
| 31 |
+
sampledNoisyImgName: NoisyNoGuidenceImgs.png
|
| 32 |
+
sampled_dir: ./SampledImgs/
|
| 33 |
+
save_weight_dir: ./Checkpoints/
|
| 34 |
+
subset_size: -1
|
| 35 |
+
test_load_weight: ckpt_199_.pt
|
| 36 |
+
training_load_weight: null
|
| 37 |
+
use_wandb: true
|
models/baseline_unet/celeba_hq/ckpt_epoch_200.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9fd5c82a46586bf32df578cf3d5856fb089dcb246fef756a77475b8980989362
|
| 3 |
+
size 320613872
|
models/baseline_unet/celeba_hq/config.yaml
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
T: 1000
|
| 2 |
+
attn: []
|
| 3 |
+
batch_size: 80
|
| 4 |
+
beta_1: 0.0001
|
| 5 |
+
beta_T: 0.02
|
| 6 |
+
channel: 128
|
| 7 |
+
channel_mult:
|
| 8 |
+
- 1
|
| 9 |
+
- 2
|
| 10 |
+
- 3
|
| 11 |
+
- 4
|
| 12 |
+
checkpoint_freq: 20
|
| 13 |
+
dataset_name: celeba_hq
|
| 14 |
+
dataset_root: data/
|
| 15 |
+
device: cuda:0
|
| 16 |
+
dropout: 0.15
|
| 17 |
+
epoch: 200
|
| 18 |
+
eval_random_seed: 42
|
| 19 |
+
grad_clip: 1.0
|
| 20 |
+
img_size: 64
|
| 21 |
+
in_channels: 3
|
| 22 |
+
lr: 0.0001
|
| 23 |
+
model_type: unet
|
| 24 |
+
multiplier: 2.0
|
| 25 |
+
nrow: 8
|
| 26 |
+
num_res_blocks: 2
|
| 27 |
+
out_channels: 3
|
| 28 |
+
random_seed: 42
|
| 29 |
+
sample_freq: 20
|
| 30 |
+
sampledImgName: SampledNoGuidenceImgs.png
|
| 31 |
+
sampledNoisyImgName: NoisyNoGuidenceImgs.png
|
| 32 |
+
sampled_dir: ./SampledImgs/
|
| 33 |
+
save_weight_dir: ./Checkpoints/
|
| 34 |
+
subset_size: -1
|
| 35 |
+
test_load_weight: ckpt_199_.pt
|
| 36 |
+
training_load_weight: null
|
| 37 |
+
use_wandb: true
|
models/baseline_unet/cifar10/ckpt_epoch_200.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a000f27dfe5b2cbdb12706b6aa7f0a5f72b8d873e3cf346864c528e017b4a19
|
| 3 |
+
size 320613461
|
models/baseline_unet/cifar10/config.yaml
ADDED
|
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
T: 1000
|
| 2 |
+
attn: []
|
| 3 |
+
batch_size: 80
|
| 4 |
+
beta_1: 0.0001
|
| 5 |
+
beta_T: 0.02
|
| 6 |
+
channel: 128
|
| 7 |
+
channel_mult:
|
| 8 |
+
- 1
|
| 9 |
+
- 2
|
| 10 |
+
- 3
|
| 11 |
+
- 4
|
| 12 |
+
checkpoint_freq: 20
|
| 13 |
+
dataset_root: data/
|
| 14 |
+
device: cuda:6
|
| 15 |
+
dropout: 0.15
|
| 16 |
+
epoch: 200
|
| 17 |
+
eval_random_seed: 42
|
| 18 |
+
grad_clip: 1.0
|
| 19 |
+
img_size: 32
|
| 20 |
+
lr: 0.0001
|
| 21 |
+
multiplier: 2.0
|
| 22 |
+
nrow: 8
|
| 23 |
+
num_res_blocks: 2
|
| 24 |
+
random_seed: 42
|
| 25 |
+
sample_freq: 20
|
| 26 |
+
sampledImgName: SampledNoGuidenceImgs.png
|
| 27 |
+
sampledNoisyImgName: NoisyNoGuidenceImgs.png
|
| 28 |
+
sampled_dir: ./SampledImgs/
|
| 29 |
+
save_weight_dir: ./Checkpoints/
|
| 30 |
+
subset_size: -1
|
| 31 |
+
test_load_weight: ckpt_199_.pt
|
| 32 |
+
training_load_weight: null
|
| 33 |
+
use_wandb: true
|
models/baseline_unet/fashion_mnist/ckpt_epoch_200.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:28b73c711a2721c8a965f652b9f81618ef83a12bda4fc42d6ec1ed10dab5b2f6
|
| 3 |
+
size 24893232
|
models/baseline_unet/fashion_mnist/config.yaml
ADDED
|
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
T: 1000
|
| 2 |
+
attn: []
|
| 3 |
+
batch_size: 80
|
| 4 |
+
beta_1: 0.0001
|
| 5 |
+
beta_T: 0.02
|
| 6 |
+
channel: 64
|
| 7 |
+
channel_mult:
|
| 8 |
+
- 1
|
| 9 |
+
- 2
|
| 10 |
+
- 2
|
| 11 |
+
checkpoint_freq: 20
|
| 12 |
+
dataset_name: fashion_mnist
|
| 13 |
+
dataset_root: data/
|
| 14 |
+
device: cuda:0
|
| 15 |
+
dropout: 0.15
|
| 16 |
+
epoch: 200
|
| 17 |
+
eval_random_seed: 42
|
| 18 |
+
grad_clip: 1.0
|
| 19 |
+
img_size: 28
|
| 20 |
+
in_channels: 1
|
| 21 |
+
lr: 0.0001
|
| 22 |
+
model_type: unet
|
| 23 |
+
multiplier: 2.0
|
| 24 |
+
nrow: 8
|
| 25 |
+
num_res_blocks: 2
|
| 26 |
+
out_channels: 1
|
| 27 |
+
random_seed: 42
|
| 28 |
+
sample_freq: 20
|
| 29 |
+
sampledImgName: SampledNoGuidenceImgs.png
|
| 30 |
+
sampledNoisyImgName: NoisyNoGuidenceImgs.png
|
| 31 |
+
sampled_dir: ./SampledImgs/
|
| 32 |
+
save_weight_dir: ./Checkpoints/
|
| 33 |
+
subset_size: -1
|
| 34 |
+
test_load_weight: ckpt_199_.pt
|
| 35 |
+
training_load_weight: null
|
| 36 |
+
use_wandb: true
|
models/baseline_unet/mnist/ckpt_epoch_200.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59dab64112364b9b051716577fa17fa36b00639d399e7bb0b756c179fc0c395e
|
| 3 |
+
size 24893232
|
models/baseline_unet/mnist/config.yaml
ADDED
|
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
T: 1000
|
| 2 |
+
attn: []
|
| 3 |
+
batch_size: 80
|
| 4 |
+
beta_1: 0.0001
|
| 5 |
+
beta_T: 0.02
|
| 6 |
+
channel: 64
|
| 7 |
+
channel_mult:
|
| 8 |
+
- 1
|
| 9 |
+
- 2
|
| 10 |
+
- 2
|
| 11 |
+
checkpoint_freq: 20
|
| 12 |
+
dataset_name: mnist
|
| 13 |
+
dataset_root: data/
|
| 14 |
+
device: cuda:0
|
| 15 |
+
dropout: 0.15
|
| 16 |
+
epoch: 200
|
| 17 |
+
eval_random_seed: 42
|
| 18 |
+
grad_clip: 1.0
|
| 19 |
+
img_size: 28
|
| 20 |
+
in_channels: 1
|
| 21 |
+
lr: 0.0001
|
| 22 |
+
model_type: unet
|
| 23 |
+
multiplier: 2.0
|
| 24 |
+
nrow: 8
|
| 25 |
+
num_res_blocks: 2
|
| 26 |
+
out_channels: 1
|
| 27 |
+
random_seed: 42
|
| 28 |
+
sample_freq: 20
|
| 29 |
+
sampledImgName: SampledNoGuidenceImgs.png
|
| 30 |
+
sampledNoisyImgName: NoisyNoGuidenceImgs.png
|
| 31 |
+
sampled_dir: ./SampledImgs/
|
| 32 |
+
save_weight_dir: ./Checkpoints/
|
| 33 |
+
subset_size: -1
|
| 34 |
+
test_load_weight: ckpt_199_.pt
|
| 35 |
+
training_load_weight: null
|
| 36 |
+
use_wandb: true
|