ARBS / arbitor /config.py
CLIWorks's picture
Upload folder using huggingface_hub
d8bc908 verified
# Token vocabulary sizes; the text and audio vocabularies use the same value.
VOCAB = 288
AUDIO_VOCAB = 288

# Audio front-end settings.
# NOTE(review): units are not stated in this file -- presumably samples per
# second and frames per second; confirm against the audio encoder.
AUDIO_SR = 16_000
AUDIO_FRAME_RATE = 50

# NOTE(review): generic threshold; its consumer is not visible from here.
THRESHOLD = 0.05
# -- 3B Target Dimensions --
EMBEDDING_DIM = 1536
CODEBOOK_DIM = 1024
CODEBOOK_SIZE = 512 * 1024  # 524,288 entries; base unit

# Shared multimodal VQ: 256K entries, each 1024-dim.
SHARED_VQ_SIZE = 256 * 1024  # 262,144

HIDDEN_DIM = 8192  # main hidden dimension
FFN_HIDDEN = 2 * HIDDEN_DIM  # 16,384
CTX = 256
# MoEGraph: 256 experts, centroid routing, unified ACT.
# Expert count and routing fan-out.
# NOTE(review): MG_TOP_K is presumably the number of experts selected per
# routing decision -- confirm against the router implementation.
MG_N_EXPERTS = 256
MG_TOP_K = 2

# Internal widths used by the MoEGraph module.
MG_CORE_RANK = 384
MG_SHARED_INTER = 1536
MG_WORKSPACE_DIM = 768

# Iteration count for the MoEGraph ACT loop.
MG_ACT_ITERS = 4
# MemGram: 32 heads x ~65K slots each, roughly 2M associative slots in total.
# The list holds 32 distinct values between 64901 and 65269
# (presumably one table size per head -- confirm against the MemGram module).
MEMGRAM_STRUCT_PRIMES = [
    64901, 64919, 64921, 64927, 64937, 64951, 64969, 64997,
    65003, 65011, 65027, 65029, 65033, 65053, 65063, 65071,
    65101, 65119, 65123, 65129, 65141, 65147, 65167, 65171,
    65173, 65179, 65183, 65203, 65213, 65239, 65257, 65269,
]

# Eight smaller values (8009..8093) for the "conv" variant.
MEMGRAM_CONV_PRIMES = [
    8009, 8011, 8017, 8039, 8081, 8087, 8089, 8093,
]

MEMGRAM_EMBED_DIM = 64
MEMGRAM_KEY_DIM = 32
# KV Ledger: capacities written as multiples of 1024.
KV_LEDGER_SIZE = 256 * 1024  # 262,144
SLIDING_WINDOW_SIZE = 32 * 1024  # 32,768
KQ_CACHE_SIZE = 8 * 1024  # 8,192
# MLA attention: head count, per-head dimensions, and layer count.
MLA_N_HEADS = 32
MLA_QK_NOPE_HEAD_DIM = 96
MLA_QK_ROPE_HEAD_DIM = 32
MLA_V_HEAD_DIM = 96
MLA_SLIDE_DIM = 64
MLA_FULL_DIM = 32
MLA_N_LAYERS = 24

# RoPE base (theta).
MLA_ROPE_THETA = 10_000.0

# Attention stride and the maximum KV context length.
ATTENTION_STRIDE = 8
KV_CONTEXT_LENGTH = 32 * 1024 * 1024  # 33,554,432

# CSA / HCA compression (DeepSeek V4 hybrid attention).
MLA_CSA_DIM = 16
MLA_HCA_DIM = 16
MLA_HCA_STRIDE = 32
# KG EMA (Phase 17): EMA coefficient, re-quantisation interval, and the
# ternary threshold.
# NOTE(review): the unit of KG_REQUANT_EVERY (steps? batches?) is not stated
# in this file -- confirm with the training loop.
KG_EMA_ALPHA = 0.99
KG_REQUANT_EVERY = 50
KG_TERNARY_THRESHOLD = 0.3

# Composite Motif VQ (Phase 17): 64K entries, each 1024-dim.
KGVQ_CODEBOOK_SIZE = 64 * 1024  # 65,536
KGVQ_CODEBOOK_DIM = 1024
KGVQ_DECAY = 0.99
KGVQ_COMMITMENT_WEIGHT = 1.0
KGVQ_DEAD_CODE_THRESHOLD = 2
K_MAX_COMPOSITES = 20
# VideoHead: operates on Open-Sora VAE latents
# (4 latent channels, 8x spatial and 4x temporal compression).
VIDEO_LATENT_CHANNELS = 4
VIDEO_MAX_STEPS = 8
VIDEO_HEIGHT = 64
VIDEO_WIDTH = 64

# -- Open-Sora 3D VAE (Phase 19) --
# Local checkpoint directory and the Hugging Face repo id it comes from.
OPEN_SORA_VAE_PATH = "arbitor/encoders/models/opensora-vae"
OPEN_SORA_VAE_REPO = "hpcai-tech/OpenSora-VAE-v1.2"
# Latent layout of the VAE; these match the VideoHead figures above.
OPEN_SORA_LATENT_CHANNELS = 4
OPEN_SORA_SCALE_FACTOR_SPATIAL = 8
OPEN_SORA_SCALE_FACTOR_TEMPORAL = 4
# -- ACT Loop Parameters (Phase 19) --
# ByteHead: iteration cap, consecutive-halt count, and ponder penalty weight.
BYTEHEAD_ACT_MAX_ITERS = 3
BYTEHEAD_ACT_HALT_CONSECUTIVE = 2
BYTEHEAD_ACT_PONDER_LAMBDA = 0.01

# VideoHead: allowed FPS range and frames handled per chunk.
VIDEOHEAD_ACT_MIN_FPS = 1
VIDEOHEAD_ACT_MAX_FPS = 60
VIDEOHEAD_ACT_FRAME_CHUNK = 8

# TalkerHead: frames per chunk.
TALKERHEAD_ACT_CHUNK_FRAMES = 500

# -- Timestamp Encoding (Phase 19) --
TIMESTAMP_MAX_PERIOD = 10_000.0

# -- Temporal Frame Buffer (Phase 19) --
FRAME_BUFFER_LOCAL_SIZE = 3
FRAME_BUFFER_CACHE_STRIDE = 4
# Special-token name -> token id. The 32 ids are contiguous, 256 through 287.
# NOTE(review): ids 0-255 are presumably raw byte values, which would make
# 288 the total vocabulary size -- confirm against the tokenizer.
SPECIAL_VOCAB = {
    # Control
    "PAD": 256,
    "BOS": 257,
    "EOS": 258,
    "STOP": 259,
    # Roles
    "SYSTEM": 260,
    "USER": 261,
    "ASSISTANT": 262,
    # Reasoning
    "SCRATCHPAD": 263,
    "PLAN": 264,
    "REFLECTION": 265,
    "SUMMARY": 266,
    # Tool use
    "ACTION": 267,
    "TOOL": 268,
    "TOOL_RESULT": 269,
    # Code
    "CODE": 270,
    "CODE_BLOCK": 271,
    "EXECUTION": 272,
    # RAG
    "SEARCH": 273,
    "CONTEXT": 274,
    "CITATION": 275,
    # Quality / format
    "ERROR": 276,
    "FORMAT": 277,
    # Multimodal
    "IMAGE": 278,
    "TEXT": 279,
    "AUDIO": 280,
    "VIDEO": 281,
    "SPEAK": 282,
    "IMG_GEN": 283,
    # Reserved for future use
    "RES1": 284,
    "RES2": 285,
    "RES3": 286,
    "RESERVED": 287,
}