Minibase committed on
Commit
3c72e49
·
verified ·
1 Parent(s): 1cec6b3

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +3 -190
config.json CHANGED
@@ -1,190 +1,3 @@
1
- {
2
- "_name_or_path": "Detoxify-Medium",
3
- "architectures": ["LlamaForCausalLM"],
4
- "bos_token_id": 1,
5
- "eos_token_id": 2,
6
- "hidden_act": "silu",
7
- "hidden_size": 1024,
8
- "initializer_range": 0.02,
9
- "intermediate_size": 2816,
10
- "max_position_embeddings": 8192,
11
- "model_type": "llama",
12
- "num_attention_heads": 16,
13
- "num_hidden_layers": 20,
14
- "num_key_value_heads": 16,
15
- "pretraining_tp": 1,
16
- "rms_norm_eps": 1e-05,
17
- "rope_scaling": null,
18
- "rope_theta": 10000.0,
19
- "tie_word_embeddings": false,
20
- "torch_dtype": "float16",
21
- "transformers_version": "4.36.0",
22
- "use_cache": true,
23
- "vocab_size": 49152,
24
-
25
- "quantization_config": {
26
- "quant_method": "gguf",
27
- "quantization_type": "Q8_0",
28
- "quantization_bits": 8,
29
- "quantization_version": "2",
30
- "quantization_fidelity": "high",
31
- "compression_ratio": 0.5,
32
- "quantization_format": "GGUF",
33
- "quantization_description": "8-bit quantization with optimized weights for high fidelity"
34
- },
35
-
36
- "file_size": 387911872,
37
- "file_size_mb": 369,
38
- "context_length": 4096,
39
- "max_seq_length": 4096,
40
- "model_family": "llama",
41
- "model_version": "1.0.0",
42
- "model_size_category": "medium",
43
-
44
- "hardware_requirements": {
45
- "minimum_ram": "12GB",
46
- "recommended_ram": "24GB",
47
- "minimum_vram": "0GB",
48
- "recommended_vram": "0GB",
49
- "cpu_compatibility": "Any modern CPU (Intel i5+, AMD Ryzen 5+)",
50
- "gpu_compatibility": {
51
- "nvidia": "Any CUDA-compatible GPU (GTX 1060+, RTX series)",
52
- "amd": "Any ROCm-compatible GPU (RX 570+, Radeon series)",
53
- "apple_silicon": "M1/M2/M3/M4 chips with Metal (recommended)",
54
- "intel": "Intel Arc GPUs with oneAPI"
55
- },
56
- "os_compatibility": ["linux", "macos", "windows"],
57
- "recommended_hardware": "Apple Silicon M2/M3/M4, Intel i7/i9, or NVIDIA RTX 30-series",
58
- "memory_usage_estimate": "~6-8GB during inference",
59
- "storage_requirements": "400MB free space"
60
- },
61
-
62
- "inference_config": {
63
- "max_tokens": 256,
64
- "temperature": 0.7,
65
- "top_p": 0.9,
66
- "top_k": 40,
67
- "repetition_penalty": 1.1,
68
- "n_threads": 8,
69
- "n_gpu_layers": 99,
70
- "n_batch": 512,
71
- "n_ctx": 4096,
72
- "recommended_batch_size": 1,
73
- "streaming_support": true
74
- },
75
-
76
- "task": "text-detoxification",
77
- "task_description": "Transform toxic or inappropriate text into clean, non-toxic versions while preserving the original meaning and intent",
78
- "task_type": "text2text-generation",
79
- "input_format": "Instruction: {instruction}\\n\\nInput: {input}\\n\\nResponse:",
80
- "output_format": "Clean, non-toxic text that preserves the original meaning",
81
- "primary_use_case": "Content moderation and text detoxification",
82
- "supported_languages": ["en"],
83
-
84
- "performance_metrics": {
85
- "toxicity_reduction": 0.178,
86
- "semantic_preservation": 0.561,
87
- "fluency": 0.929,
88
- "latency_ms": 160.2,
89
- "throughput_requests_per_second": 6.2,
90
- "benchmark_dataset": "ParaDetox",
91
- "benchmark_samples": 1011,
92
- "evaluation_date": "2025-09-18"
93
- },
94
-
95
- "model_capabilities": {
96
- "max_input_length": 4096,
97
- "supports_streaming": true,
98
- "supports_batch_processing": false,
99
- "instruction_following": true,
100
- "few_shot_learning": true,
101
- "multilingual_support": false,
102
- "domain_adaptation": "general_web_content"
103
- },
104
-
105
- "training_details": {
106
- "base_model": "Custom Llama architecture",
107
- "training_objective": "Instruction-following for detoxification",
108
- "fine_tuning_dataset": "Curated toxic-neutral parallel pairs",
109
- "optimization": "Quantized for edge deployment",
110
- "training_framework": "Custom implementation",
111
- "parameter_count": "~150M estimated"
112
- },
113
-
114
- "license": "apache-2.0",
115
- "tags": [
116
- "text-generation",
117
- "text-detoxification",
118
- "toxicity-reduction",
119
- "content-moderation",
120
- "llama",
121
- "gguf",
122
- "quantized",
123
- "cpu-inference",
124
- "apple-silicon",
125
- "minibase",
126
- "medium-model",
127
- "4096-context",
128
- "q8_0"
129
- ],
130
-
131
- "model_creator": "Minibase AI",
132
- "model_url": "https://minibase.ai",
133
- "discord_url": "https://discord.com/invite/BrJn4D2Guh",
134
- "repository_url": "https://github.com/minibase-ai/detoxify-medium",
135
- "paper_url": "https://minibase.ai/research/detoxify-medium",
136
-
137
- "generation_config": {
138
- "_from_model_config": true,
139
- "bos_token_id": 1,
140
- "eos_token_id": 2,
141
- "pad_token_id": null,
142
- "do_sample": true,
143
- "max_new_tokens": 256,
144
- "repetition_penalty": 1.1,
145
- "temperature": 0.7,
146
- "top_k": 40,
147
- "top_p": 0.9,
148
- "transformers_version": "4.36.0"
149
- },
150
-
151
- "tokenizer_config": {
152
- "add_bos_token": true,
153
- "add_eos_token": false,
154
- "bos_token": "<s>",
155
- "eos_token": "</s>",
156
- "unk_token": "<unk>",
157
- "pad_token": null,
158
- "model_max_length": 4096,
159
- "chat_template": "{% for message in messages %}{{ message.content }}{% endfor %}",
160
- "clean_up_tokenization_spaces": false,
161
- "legacy": true
162
- },
163
-
164
- "chat_template": "{% for message in messages %}{{ message.content }}{% endfor %}",
165
- "instruction_template": "Instruction: {instruction}\\n\\nInput: {input}\\n\\nResponse:",
166
-
167
- "safety_and_ethics": {
168
- "intended_use": "Text detoxification and content moderation",
169
- "potential_misuse": "Should not be used for generating toxic content",
170
- "content_policy": "Designed to reduce toxicity in text",
171
- "bias_considerations": "May reflect biases present in training data",
172
- "limitation_awareness": "Not suitable for all languages or contexts"
173
- },
174
-
175
- "technical_support": {
176
- "framework": "llama.cpp",
177
- "runtime_compatibility": ["llama.cpp", "ctransformers", "llama-cpp-python"],
178
- "server_endpoint": "http://127.0.0.1:8000",
179
- "api_format": "OpenAI-compatible",
180
- "streaming_support": true
181
- },
182
-
183
- "version_info": {
184
- "model_version": "1.0.0",
185
- "quantization_version": "Q8_0",
186
- "creation_date": "2025-09-18",
187
- "last_updated": "2025-09-18",
188
- "compatibility_version": "llama.cpp v0.2.0+"
189
- }
190
- }
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d452c14cc5da273518a7957a15bd1db5d44e3d96670f200cf5846a17301676d
3
+ size 5861