{
  "model_name": "Helion-V2",
  "model_version": "2.0",
  "model_type": "causal-lm",
  "architecture": "helion",
  "organization": "DeepXR",
  "release_date": "2024-11-15",
  "license": "Apache-2.0",
  "homepage": "https://huggingface.co/DeepXR/Helion-V2",
  "repository": "https://github.com/DeepXR/Helion-V2",
  "documentation": "https://docs.deepxr.ai/helion-v2",
  "parameters": {
    "total": 7200000000,
    "trainable": 7200000000,
    "non_trainable": 0
  },
  "model_size": {
    "fp32": "28.8 GB",
    "fp16": "14.4 GB",
    "bfloat16": "14.4 GB",
    "int8": "7.2 GB",
    "int4": "3.6 GB"
  },
  "context_length": 8192,
  "vocabulary_size": 32768,
  "languages": [
    "en",
    "es",
    "fr",
    "de",
    "it",
    "pt",
    "nl",
    "ru",
    "zh",
    "ja",
    "ko",
    "ar",
    "hi"
  ],
  "primary_language": "en",
  "tasks": [
    "text-generation",
    "conversational",
    "code-generation",
    "question-answering",
    "summarization",
    "translation",
    "creative-writing"
  ],
  "framework": {
    "name": "transformers",
    "version": "4.40.0+",
    "backend": "pytorch",
    "backend_version": "2.1.0+"
  },
  "training": {
    "dataset_tokens": 2500000000000,
    "training_steps": 600000,
    "epochs": 3,
    "batch_size": 4194304,
    "learning_rate": 0.0003,
    "optimizer": "AdamW",
    "hardware": "128x NVIDIA H100 80GB",
    "training_time_days": 21,
    "knowledge_cutoff": "2024-10-31"
  },
  "benchmarks": {
    "mmlu": {
      "score": 64.2,
      "metric": "accuracy",
      "shots": 5
    },
    "humaneval": {
      "score": 48.2,
      "metric": "pass@1",
      "shots": 0
    },
    "hellaswag": {
      "score": 80.5,
      "metric": "accuracy",
      "shots": 10
    },
    "truthfulqa": {
      "score": 52.1,
      "metric": "mc2_accuracy",
      "shots": 0
    },
    "gsm8k": {
      "score": 68.7,
      "metric": "accuracy",
      "shots": 8
    },
    "arc_challenge": {
      "score": 58.3,
      "metric": "accuracy",
      "shots": 25
    },
    "mt_bench": {
      "score": 7.85,
      "metric": "rating",
      "shots": 0
    }
  },
  "safety": {
    "toxigen_score": 0.08,
    "crows_pairs_bias": 54.2,
    "content_filtering": true,
    "pii_detection": true,
    "crisis_detection": true,
    "safety_classifiers": [
      "hate_speech",
      "violence",
      "sexual_content",
      "self_harm",
      "illegal_activity",
      "child_safety"
    ]
  },
  "deployment": {
    "recommended_gpu": [
      "NVIDIA A100",
      "NVIDIA H100",
      "NVIDIA RTX 4090",
      "NVIDIA A6000"
    ],
    "minimum_vram_gb": 16,
    "recommended_vram_gb": 24,
    "supports_quantization": true,
    "quantization_formats": [
      "int8",
      "int4",
      "GPTQ",
      "AWQ",
      "GGUF"
    ],
    "inference_frameworks": [
      "transformers",
      "vllm",
      "llama.cpp",
      "text-generation-inference"
    ]
  },
  "contact": {
    "email": "contact@deepxr.ai",
    "github": "https://github.com/DeepXR/Helion-V2",
    "twitter": "@DeepXR_AI",
    "discord": "https://discord.gg/deepxr"
  },
  "tags": [
    "text-generation",
    "conversational",
    "code",
    "instruction-following",
    "pytorch",
    "causal-lm",
    "llm",
    "reasoning",
    "multilingual",
    "apache-2.0",
    "production-ready",
    "safe-ai"
  ],
  "checksum": {
    "algorithm": "SHA256",
    "model_files": "computed_on_upload"
  }
}