| |
| |
| |
|
|
| |
| |
| |
| experiment_2d: |
| |
| dataset: "8gaussians" |
| source: "gaussian" |
|
|
| |
| model: |
| input_dim: 2 |
| hidden_dim: 256 |
| num_hidden_layers: 3 |
| time_emb_dim: 64 |
| activation: "silu" |
|
|
| |
| sinkhorn: |
| epsilon: 0.1 |
| blur: 0.5 |
| scaling: 0.80 |
| eta: 1.0 |
| num_steps: 10 |
| batch_size: 256 |
|
|
| |
| pool: |
| num_batches: 200 |
| experience_replay: true |
|
|
| |
| training: |
| num_iterations: 20000 |
| batch_size: 256 |
| learning_rate: 0.001 |
| optimizer: "adam" |
| beta1: 0.9 |
| beta2: 0.999 |
| weight_decay: 0.0 |
|
|
| |
| inference: |
| num_euler_steps: 10 |
| num_samples: 1024 |
|
|
| |
| evaluation: |
| num_test_samples: 1024 |
| metric: "w2" |
|
|
| |
| |
| |
| experiment_mnist: |
| dataset: "mnist" |
| image_size: 28 |
| in_channels: 1 |
|
|
| |
| unet: |
| model_channels: 32 |
| num_res_blocks: 1 |
| channel_mult: [1, 2, 2] |
| num_heads: 1 |
| num_head_channels: -1 |
| attention_resolutions: [16] |
| dropout: 0.0 |
| use_scale_shift_norm: true |
|
|
| |
| sinkhorn: |
| blur: 0.5 |
| scaling: 0.80 |
| eta: 1.0 |
| num_steps: 5 |
| batch_size: 256 |
|
|
| |
| pool: |
| num_batches: 1500 |
| storage_limit_gb: 20 |
|
|
| |
| nsgf_training: |
| num_iterations: 100000 |
| batch_size: 128 |
| learning_rate: 0.0001 |
| optimizer: "adam" |
| beta1: 0.9 |
| beta2: 0.999 |
| weight_decay: 0.0 |
|
|
| |
| nsf_training: |
| num_iterations: 100000 |
| batch_size: 128 |
| learning_rate: 0.0001 |
| optimizer: "adam" |
| beta1: 0.9 |
| beta2: 0.999 |
| weight_decay: 0.0 |
|
|
| |
| time_predictor: |
| conv_channels: [32, 64, 128, 256] |
| kernel_size: 3 |
| stride: 1 |
| padding: 1 |
| pool_size: 2 |
| num_iterations: 40000 |
| learning_rate: 0.0001 |
| batch_size: 128 |
|
|
| |
| inference: |
| nsgf_steps: 5 |
| nsf_steps: 55 |
| total_nfe: 60 |
|
|
| |
| evaluation: |
| num_generated: 10000 |
| metrics: ["fid"] |
|
|
| experiment_cifar10: |
| dataset: "cifar10" |
| image_size: 32 |
| in_channels: 3 |
|
|
| |
| unet: |
| model_channels: 128 |
| num_res_blocks: 2 |
| channel_mult: [1, 2, 2, 2] |
| num_heads: 4 |
| num_head_channels: 64 |
| attention_resolutions: [16] |
| dropout: 0.0 |
| use_scale_shift_norm: true |
|
|
| |
| sinkhorn: |
| blur: 1.0 |
| scaling: 0.85 |
| eta: 1.0 |
| num_steps: 5 |
| batch_size: 128 |
|
|
| |
| pool: |
| num_batches: 2500 |
| storage_limit_gb: 45 |
|
|
| |
| nsgf_training: |
| num_iterations: 200000 |
| batch_size: 128 |
| learning_rate: 0.0001 |
| optimizer: "adam" |
| beta1: 0.9 |
| beta2: 0.999 |
| weight_decay: 0.0 |
|
|
| |
| nsf_training: |
| num_iterations: 200000 |
| batch_size: 128 |
| learning_rate: 0.0001 |
| optimizer: "adam" |
| beta1: 0.9 |
| beta2: 0.999 |
| weight_decay: 0.0 |
|
|
| |
| time_predictor: |
| conv_channels: [32, 64, 128, 256] |
| kernel_size: 3 |
| stride: 1 |
| padding: 1 |
| pool_size: 2 |
| num_iterations: 40000 |
| learning_rate: 0.0001 |
| batch_size: 128 |
|
|
| |
| inference: |
| nsgf_steps: 5 |
| nsf_steps: 54 |
| total_nfe: 59 |
|
|
| |
| evaluation: |
| num_generated: 10000 |
| metrics: ["fid", "is"] |
| |
|
|