stabilityai / SAME-L

Model card | Files and versions

SAME-L / model_config.json

mattricesound's picture

Upload folder using huggingface_hub

9499ba2 verified 5 days ago

history blame contribute delete

1.93 kB

{
  "model_type": "autoencoder",
  "sample_size": 196608,
  "sample_rate": 44100,
  "audio_channels": 2,
  "model": {
    "pretransform": {
      "type": "patched",
      "config": {
        "patch_size": 256,
        "channels": 2
      }
    },
    "encoder": {
      "type": "same",
      "requires_grad": false,
      "config": {
        "in_channels": 512,
        "channels": 256,
        "c_mults": [6],
        "strides": [16],
        "latent_dim": 256,
        "transformer_depths": [12],
        "checkpointing": true,
        "differential": true,
        "dyt": true,
        "dim_heads": 64,
        "sliding_window": [1,1],
        "variable_stride": true,
        "mask_noise": 0.001
      }
    },
    "decoder": {
      "type": "same",
      "requires_grad": false,
      "config": {
        "out_channels": 512,
        "channels": 256,
        "c_mults": [6],
        "strides": [16],
        "latent_dim": 256,
        "transformer_depths": [12],
        "sinusoidal_blocks": [8],
        "checkpointing": false,
        "differential": true,
        "dyt": true,
        "dim_heads": 64,
        "sliding_window": [1,1],
        "variable_stride": true,
        "mask_noise": 0.1
      }
    },
    "bottleneck": {
      "type": "softnorm",
      "config": {
        "dim": 256,
        "noise_augment_dim": 0,
        "noise_regularize": true,
        "auto_scale": true,
        "freeze": true
      }
    },
    "latent_dim": 256,
    "downsampling_ratio": 4096,
    "io_channels": 2
  }
}