{
  "model_name": "Helion-V2",
  "model_version": "2.0",
  "model_type": "causal-lm",
  "architecture": "helion",
  "organization": "DeepXR",
  "release_date": "2024-11-15",
  "license": "Apache-2.0",
  "homepage": "https://huggingface.co/DeepXR/Helion-V2",
  "repository": "https://github.com/DeepXR/Helion-V2",
  "documentation": "https://docs.deepxr.ai/helion-v2",
  "parameters": {
    "total": 7200000000,
    "trainable": 7200000000,
    "non_trainable": 0
  },
  "model_size": {
    "fp32": "28.8 GB",
    "fp16": "14.4 GB",
    "bfloat16": "14.4 GB",
    "int8": "7.2 GB",
    "int4": "3.6 GB"
  },
  "context_length": 8192,
  "vocabulary_size": 32768,
  "languages": [
    "en",
    "es",
    "fr",
    "de",
    "it",
    "pt",
    "nl",
    "ru",
    "zh",
    "ja",
    "ko",
    "ar",
    "hi"
  ],
  "primary_language": "en",
  "tasks": [
    "text-generation",
    "conversational",
    "code-generation",
    "question-answering",
    "summarization",
    "translation",
    "creative-writing"
  ],
  "framework": {
    "name": "transformers",
    "version": "4.40.0+",
    "backend": "pytorch",
    "backend_version": "2.1.0+"
  },
  "training": {
    "dataset_tokens": 2500000000000,
    "training_steps": 600000,
    "epochs": 3,
    "batch_size": 4194304,
    "learning_rate": 0.0003,
    "optimizer": "AdamW",
    "hardware": "128x NVIDIA H100 80GB",
    "training_time_days": 21,
    "knowledge_cutoff": "2024-10-31"
  },
  "benchmarks": {
    "mmlu": {
      "score": 64.2,
      "metric": "accuracy",
      "shots": 5
    },
    "humaneval": {
      "score": 48.2,
      "metric": "pass@1",
      "shots": 0
    },
    "hellaswag": {
      "score": 80.5,
      "metric": "accuracy",
      "shots": 10
    },
    "truthfulqa": {
      "score": 52.1,
      "metric": "mc2_accuracy",
      "shots": 0
    },
    "gsm8k": {
      "score": 68.7,
      "metric": "accuracy",
      "shots": 8
    },
    "arc_challenge": {
      "score": 58.3,
      "metric": "accuracy",
      "shots": 25
    },
    "mt_bench": {
      "score": 7.85,
      "metric": "rating",
      "shots": 0
    }
  },
  "safety": {
    "toxigen_score": 0.08,
    "crows_pairs_bias": 54.2,
    "content_filtering": true,
    "pii_detection": true,
    "crisis_detection": true,
    "safety_classifiers": [
      "hate_speech",
      "violence",
      "sexual_content",
      "self_harm",
      "illegal_activity",
      "child_safety"
    ]
  },
  "deployment": {
    "recommended_gpu": [
      "NVIDIA A100",
      "NVIDIA H100",
      "NVIDIA RTX 4090",
      "NVIDIA A6000"
    ],
    "minimum_vram_gb": 16,
    "recommended_vram_gb": 24,
    "supports_quantization": true,
    "quantization_formats": [
      "int8",
      "int4",
      "GPTQ",
      "AWQ",
      "GGUF"
    ],
    "inference_frameworks": [
      "transformers",
      "vllm",
      "llama.cpp",
      "text-generation-inference"
    ]
  },
  "contact": {
    "email": "contact@deepxr.ai",
    "github": "https://github.com/DeepXR/Helion-V2",
    "twitter": "@DeepXR_AI",
    "discord": "https://discord.gg/deepxr"
  },
  "tags": [
    "text-generation",
    "conversational",
    "code",
    "instruction-following",
    "pytorch",
    "causal-lm",
    "llm",
    "reasoning",
    "multilingual",
    "apache-2.0",
    "production-ready",
    "safe-ai"
  ],
  "checksum": {
    "algorithm": "SHA256",
    "model_files": "computed_on_upload"
  }
}