# VLyb's picture
# Upload folder using huggingface_hub
# dd23092 verified
# Dataset configuration.
# NOTE(review): this section arrived with all indentation stripped; the
# nesting below is reconstructed from the alphabetical key order of the
# flattened text. Confirm against the original file.
datasets:
  vla_data:
    data_mix: bridge
    data_root_dir: /mnt/project_ai4edu/lyl/worlkplace/starVLA/playground/Datasets/OXE_LEROBOT_DATASET
    image_size:
    - 224
    - 224
    per_device_batch_size: 16
    video_backend: pyav
# Frame-skip configuration: cache location, frame-importance scoring,
# the compression ratios to prune with, and the ratio schedule used in
# training.
# NOTE(review): this section arrived with all indentation stripped; the
# nesting below is reconstructed from the alphabetical key order of the
# flattened text. Confirm against the original file.
frameskip:
  cache_dir: playground/frameskip/frameskip_cache_vac_cr10-100
  default_compression_ratio: 1.0
  enabled: true
  importance:
    allow_backend_fallback: false
    alpha: 0.6
    beta: 0.2
    device: cuda
    enable_vac: true
    gamma: 0.2
    max_vac_frames: 16
    type: gripper_aware
    vac_beta: 0.2
    video_backend: ffmpeg
    visual_encoder_checkpoint: /mnt/project_ai4edu/share/models/timm/vit_large_patch14_dinov2.lvd142m/pytorch_model.bin
    visual_encoder_name: vit_large_patch14_dinov2
  pruning:
    compression_ratios:
    - 0.1
    - 0.2
    - 0.3
    - 0.4
    - 0.5
    - 0.6
    - 0.7
    - 0.8
    - 0.9
    - 1.0
    # 0.2 is listed five times and 1.0 once.
    # NOTE(review): presumably an intentional weighting of the ratios
    # drawn during training -- confirm with the consumer of this list.
    used_compression_ratios:
    - 0.2
    - 0.2
    - 0.2
    - 0.2
    - 0.2
    - 1.0
  training:
    dynamic_ratio: true
    ratio_schedule: uniform
    warmup_steps: 5000
# Model framework configuration: the action model (with its diffusion
# model sub-config), the framework name, and the Qwen-VL backbone.
# NOTE(review): this section arrived with all indentation stripped; the
# nesting below is reconstructed from the alphabetical key order of the
# flattened text. Confirm against the original file.
framework:
  action_model:
    action_dim: 7
    action_horizon: 16
    action_model_type: DiT-B
    add_pos_embed: true
    diffusion_model_cfg:
      cross_attention_dim: 2560
      dropout: 0.2
      final_dropout: true
      interleave_self_attention: true
      norm_type: ada_norm
      num_layers: 16
      output_dim: 2560
      positional_embeddings: null
    future_action_window_size: 15
    hidden_size: 1024
    max_seq_len: 1024
    noise_beta_alpha: 1.5
    noise_beta_beta: 1.0
    noise_s: 0.999
    num_inference_timesteps: 4
    num_target_vision_tokens: 32
    num_timestep_buckets: 1000
    past_action_window_size: 0
    state_dim: 7
  name: QwenGR00T
  qwenvl:
    base_vlm: FrameSkip_GR00T_bridge_qwen3/Qwen3-VL-4B-Instruct
    # NOTE(review): key order alone cannot tell whether `template` belongs
    # here or one level up, directly under `framework` -- confirm.
    template: qwen3_vl
# Run-level settings: root directory for this run's outputs (presumably
# checkpoints, judging by the path -- confirm with the trainer) and the
# random seed.
run_root_dir: ./results/Checkpoints/FrameSkip/SimplerEnv
seed: 42
# Trainer configuration: step counts and intervals, per-component
# learning rates, LR scheduler, and optimizer hyperparameters.
# NOTE(review): this section arrived with all indentation stripped; the
# nesting below is reconstructed from the alphabetical key order of the
# flattened text. Confirm against the original file.
trainer:
  eval_interval: 1000
  freeze_modules: true
  gradient_accumulation_steps: 1
  gradient_clipping: 1.0
  is_resume: true
  learning_rate:
    action_model: 0.0001
    base: 1.0e-05
    qwen_vl_interface: 1.0e-05
  logging_frequency: 100
  lr_scheduler_type: cosine_with_min_lr
  max_train_steps: 100000
  num_warmup_steps: 2000
  optimizer:
    betas:
    - 0.9
    - 0.95
    eps: 1.0e-08
    weight_decay: 1.0e-08
  repeated_diffusion_steps: 4
  save_interval: 10000
  scheduler_specific_kwargs:
    min_lr: 5.0e-07
# Weights & Biases entity and project names.
# NOTE(review): kept at the top level; the flattened source cannot rule
# out that these were nested under `trainer` -- confirm.
wandb_entity: jinhuiye
wandb_project: starVLA