model reproduction

Files changed (7)

README.md +6 -4
lorweb_model/config.yaml +86 -0
lorweb_model/lorweb_model.safetensors +3 -0
samples/architectural_car.jpg +0 -0
samples/armor_doggy.jpg +0 -0
samples/clay_man.jpg +0 -0
samples/ghibli_cat.jpg +0 -0

README.md CHANGED Viewed

@@ -8,10 +8,10 @@ base_model:
 - black-forest-labs/FLUX.1-Kontext-dev
 ---
-# LoRWeB Model (Coming Soon)
 <div align="center">
-  <a href="https://arxiv.org/">ArXiv</a> | <a href="https://github.com/NVlabs/LoRWeB" style="display:inline;text-decoration:underline;"><img width="20" height="20" style="display:inline;margin:0;" src="https://img.icons8.com/ios-glyphs/30/github.png" alt="github"> GitHub Repository</a> | <a href="https://research.nvidia.com/labs/par/lorweb"> 🌐 Project Website</a> | <a href="https://huggingface.co/datasets/hilamanor/LoRWeB_evalset">🤗 Evaluation Dataset (Comming Soon)</a>
 </div>
 <div align="center">
@@ -31,7 +31,9 @@ base_model:
 ### ℹ️ Additional Information
-Please see our full modelcard and further details in the [GitHub Repo](https://github.com/NVlabs/LoRWeB)
 ## 📚 Citation
@@ -41,7 +43,7 @@ If you use this model in your research, please cite:
 @article{manor2026lorweb,
     title={Spanning the Visual Analogy Space with a Weight Basis of LoRAs},
     author={Manor, Hila and Gal, Rinon and Maron, Haggai and Michaeli, Tomer and Chechik, Gal},
-    journal={arXiv preprint},
     year={2026}
 }
 ```

 - black-forest-labs/FLUX.1-Kontext-dev
 ---
+# LoRWeB Model
 <div align="center">
+  <a href="https://arxiv.org/abs/2602.15727">ArXiv</a> | <a href="https://github.com/NVlabs/LoRWeB" style="display:inline;text-decoration:underline;"><img width="20" height="20" style="display:inline;margin:0;" src="https://img.icons8.com/ios-glyphs/30/github.png" alt="github"> GitHub Repository</a> | <a href="https://research.nvidia.com/labs/par/lorweb"> 🌐 Project Website</a> | <a href="https://huggingface.co/datasets/hilamanor/LoRWeB_evalset">🤗 Evaluation Dataset</a>
 </div>
 <div align="center">
 ### ℹ️ Additional Information
+**This model is a reproduction of the original model from the paper. It was trained from scratch using Technion resources.** This might introduce differences from the results reported in the paper. Please see the `samples` directory for examples of this model's outputs on the {**a**, **a'**, **b**} triplets from the teaser figure.
+Please see our full modelcard and further details in the [GitHub Repo](https://github.com/NVlabs/LoRWeB).
 ## 📚 Citation
 @article{manor2026lorweb,
     title={Spanning the Visual Analogy Space with a Weight Basis of LoRAs},
     author={Manor, Hila and Gal, Rinon and Maron, Haggai and Michaeli, Tomer and Chechik, Gal},
+    journal={arXiv preprint arXiv:2602.15727},
     year={2026}
 }
 ```

lorweb_model/config.yaml ADDED Viewed

	@@ -0,0 +1,86 @@

+job: extension
+config:
+  name: lorweb_model
+  process:
+  - type: sd_trainer
+    training_folder: output
+    device: cuda:0
+    network:
+      type: attlora
+      linear: 4
+      linear_alpha: 4
+      network_kwargs:
+        lora_keys_dim: 128
+        lora_heads: 1
+        mixing_coeffs_type: mean
+        external_query: true
+        pooling_type: avg
+        query_projection_type: linear
+        external_query_model: openai/clip-vit-large-patch14
+        loras_num: 32
+        lora_softmax: true
+        query_mode: cat-aa'b
+    save:
+      dtype: float16
+      save_every: 250
+      max_step_saves_to_keep: 4
+      push_to_hub: false
+    datasets:
+    - folder_path: ./data/relation252k_processed/target
+      control_path: ./data/relation252k_processed/control
+      caption_ext: txt
+      caption_dropout_rate: 0.05
+      shuffle_tokens: false
+      cache_latents_to_disk: false
+      resolution:
+      - 512
+      is_analogy: false
+      is_box_analogy: true
+      full_size_control_images: true
+      enable_relation_captions: true
+      is_bidirectional_analogy: false
+    train:
+      batch_size: 6
+      steps: 10000
+      gradient_accumulation_steps: 1
+      train_unet: true
+      train_text_encoder: false
+      gradient_checkpointing: true
+      noise_scheduler: flowmatch
+      optimizer: adamw8bit
+      optimizer_params:
+        betas:
+        - 0.9
+        - 0.99
+        weight_decay: 0.05
+      lr: 0.001
+      timestep_type: weighted
+      dtype: bf16
+      debug_save_target_images: true
+    model:
+      name_or_path: black-forest-labs/FLUX.1-Kontext-dev
+      arch: flux_kontext
+      quantize: true
+    sample:
+      sampler: flowmatch
+      sample_every: 500
+      width: 1024
+      height: 1024
+      prompts:
+      - Transform the photo into a stylized illustration. --ctrl_img ./data/relation252k_processed/control/analogy_MJ_Style11827_1.png_MJ_Style11827_2.png_0000.jpg
+      neg: ''
+      seed: 42
+      walk_seed: true
+      guidance_scale: 4
+      sample_steps: 20
+      is_analogy: false
+      is_box_analogy: true
+    logging:
+      use_wandb: true
+      log_every: 1
+      project_name: lorweb
+      verbose: false
+      run_name: lorweb_model
+meta:
+  name: LoRWeB_default_PROMPTS
+  version: '1.0'

lorweb_model/lorweb_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d67e997fc45f2535f1947a29079ea87b6af2ac3a18732f26648f94ca91f308c4
+size 1670370808

samples/architectural_car.jpg ADDED Viewed

samples/armor_doggy.jpg ADDED Viewed

samples/clay_man.jpg ADDED Viewed

samples/ghibli_cat.jpg ADDED Viewed