asdf98 committed on
Commit
f7a7863
·
verified ·
1 Parent(s): c6e7340

Upload luminars/config.py

Browse files
Files changed (1) hide show
  1. luminars/config.py +18 -19
luminars/config.py CHANGED
@@ -3,27 +3,26 @@ from dataclasses import dataclass
3
 
4
  @dataclass
5
  class LuminaRSConfig:
6
- # Core dims
7
- latent_dim: int = 16 # SD-compatible VAE latent dim
8
  latent_h: int = 32 # 32x32 latent = 1024x1024 px
9
  latent_w: int = 32
10
- # SSM Core
11
- d_model: int = 256 # main hidden dim
12
- d_state: int = 64 # mamba S4D hidden state
13
- d_conv: int = 4 # local convolution width
14
- expand: int = 2 # expansion factor in SSM
15
- n_layers: int = 8 # SSM-repeat stack
16
- drop_path: float = 0.0 # stochastic depth
17
- # Semantic (text) encoder
18
- text_embed_dim: int = 768 # CLIP-T hidden dim
 
19
  max_text_len: int = 77
20
- prompt_embed_dim: int = 256 # compressed prompt plan
21
- # Style/Mood/Philosophy modules
22
- style_dim: int = 128
23
- mood_dim: int = 64
24
- philosophy_dim: int = 64
25
- # Flow head
26
- n_flow_steps: int = 10 # ODE solver steps at inference
27
  # Training
28
- vae_pretrained: str = "madebyollin/sdxl-vae-fp16-fix" # 31M param VAE
 
 
 
29
  clip_pretrained: str = "openai/clip-vit-large-patch14"
 
 
 
3
 
4
  @dataclass
5
  class LuminaRSConfig:
6
+ # Latent dims
7
+ latent_dim: int = 16 # VAE latent channels
8
  latent_h: int = 32 # 32x32 latent = 1024x1024 px
9
  latent_w: int = 32
10
+ # UNet channels at each scale
11
+ channels: tuple = (64, 128, 256, 256, 384)
12
+ # Bottleneck depth
13
+ n_bottleneck: int = 4
14
+ # Iterative refinement depth (TRM-style shared-weight recursion)
15
+ n_recurse: int = 2
16
+ # Time embedding
17
+ t_embed_dim: int = 256
18
+ # Text conditioning
19
+ text_embed_dim: int = 768
20
  max_text_len: int = 77
 
 
 
 
 
 
 
21
  # Training
22
+ drop_path: float = 0.05
23
+ # VAE (frozen)
24
+ vae_pretrained: str = "madebyollin/sdxl-vae-fp16-fix"
25
+ # Text encoder (frozen)
26
  clip_pretrained: str = "openai/clip-vit-large-patch14"
27
+ # Flow matching inference steps
28
+ n_flow_steps: int = 12