| { |
| "model_family": "Helion", |
| "version": "2.5", |
| "release_type": "research_and_development", |
| "variants": { |
| "base": { |
| "name": "Helion-2.5-Rnd", |
| "full_name": "DeepXR/Helion-2.5-Rnd", |
| "description": "Base research model with full precision (FP16)", |
| "parameters": "70B", |
| "precision": "float16", |
| "context_length": 131072, |
| "safetensors_shards": 83, |
| "shard_naming": "shard_00 to shard_82", |
| "shard_size_gb": 1.69, |
| "shard_size_gib": 1.57, |
| "total_size_gb": 140.27, |
| "status": "active", |
| "recommended_use": [ |
| "Research", |
| "Development", |
| "High-accuracy inference" |
| ], |
| "hardware_requirements": { |
| "min_vram_gb": 145, |
| "min_gpus": 2, |
| "recommended_gpu": "A100 80GB" |
| } |
| }, |
| "instruct": { |
| "name": "Helion-2.5-Rnd-Instruct", |
| "full_name": "DeepXR/Helion-2.5-Rnd-Instruct", |
| "description": "Instruction-tuned variant optimized for following instructions", |
| "parameters": "70B", |
| "precision": "bfloat16", |
| "context_length": 131072, |
| "status": "planned", |
| "recommended_use": [ |
| "Instruction following", |
| "Task completion", |
| "Structured outputs" |
| ], |
| "fine_tuning": { |
| "type": "supervised", |
| "data_focus": "instruction_pairs" |
| } |
| }, |
| "chat": { |
| "name": "Helion-2.5-Rnd-Chat", |
| "full_name": "DeepXR/Helion-2.5-Rnd-Chat", |
| "description": "Conversational variant optimized for multi-turn dialogue", |
| "parameters": "70B", |
| "precision": "bfloat16", |
| "context_length": 131072, |
| "status": "planned", |
| "recommended_use": [ |
| "Conversational AI", |
| "Customer service", |
| "Interactive applications" |
| ], |
| "fine_tuning": { |
| "type": "rlhf", |
| "data_focus": "conversational_data" |
| } |
| }, |
| "code": { |
| "name": "Helion-2.5-Rnd-Code", |
| "full_name": "DeepXR/Helion-2.5-Rnd-Code", |
| "description": "Code-specialized variant with enhanced programming capabilities", |
| "parameters": "70B", |
| "precision": "bfloat16", |
| "context_length": 131072, |
| "status": "planned", |
| "recommended_use": [ |
| "Code generation", |
| "Code review", |
| "Bug fixing", |
| "Documentation" |
| ], |
| "fine_tuning": { |
| "type": "supervised", |
| "data_focus": "code_repositories" |
| }, |
| "enhanced_languages": [ |
| "Python", |
| "JavaScript", |
| "TypeScript", |
| "Rust", |
| "Go", |
| "Java" |
| ] |
| }, |
| "math": { |
| "name": "Helion-2.5-Rnd-Math", |
| "full_name": "DeepXR/Helion-2.5-Rnd-Math", |
| "description": "Mathematics-specialized variant for advanced problem solving", |
| "parameters": "70B", |
| "precision": "bfloat16", |
| "context_length": 131072, |
| "status": "planned", |
| "recommended_use": [ |
| "Mathematical reasoning", |
| "Proof generation", |
| "Problem solving", |
| "Educational applications" |
| ], |
| "fine_tuning": { |
| "type": "supervised", |
| "data_focus": "mathematical_proofs" |
| } |
| } |
| }, |
| "deployment_configurations": { |
| "production": { |
| "description": "Production-ready configuration with optimizations", |
| "settings": { |
| "tensor_parallel_size": 4, |
| "gpu_memory_utilization": 0.95, |
| "max_batch_size": 32, |
| "enable_prefix_caching": true, |
| "enable_chunked_prefill": true |
| } |
| }, |
| "development": { |
| "description": "Development configuration for testing", |
| "settings": { |
| "tensor_parallel_size": 2, |
| "gpu_memory_utilization": 0.85, |
| "max_batch_size": 8, |
| "enable_prefix_caching": false, |
| "enable_chunked_prefill": false |
| } |
| }, |
| "research": { |
| "description": "Research configuration for experimentation", |
| "settings": { |
| "tensor_parallel_size": 2, |
| "gpu_memory_utilization": 0.90, |
| "max_batch_size": 4, |
| "enable_prefix_caching": false, |
| "enable_chunked_prefill": false, |
| "enable_logging": true |
| } |
| } |
| }, |
| "comparison_matrix": { |
| "base_vs_instruct": { |
| "base_advantages": [ |
| "More flexible for fine-tuning", |
| "Better for creative tasks", |
| "Less constrained outputs" |
| ], |
| "instruct_advantages": [ |
| "Better instruction following", |
| "More structured outputs", |
| "Improved task completion" |
| ] |
| }, |
| "base_vs_chat": { |
| "base_advantages": [ |
| "Better for single-turn tasks", |
| "More diverse outputs", |
| "Flexible formatting" |
| ], |
| "chat_advantages": [ |
| "Better conversation coherence", |
| "Improved context awareness", |
| "Natural dialogue flow" |
| ] |
| } |
| }, |
| "migration_guide": { |
| "from_base_to_instruct": { |
| "steps": [ |
| "Update prompt format to instruction style", |
| "Adjust temperature (typically lower)", |
| "Add explicit task descriptions", |
| "Use structured output formats" |
| ], |
| "example_prompt_change": { |
| "base": "Write a function to sort a list", |
| "instruct": "### Instruction:\nWrite a Python function that sorts a list in ascending order.\n\n### Response:" |
| } |
| }, |
| "from_base_to_chat": { |
| "steps": [ |
| "Convert to chat message format", |
| "Add system prompts", |
| "Maintain conversation history", |
| "Use appropriate message roles" |
| ], |
| "example_format_change": { |
| "base": "Hello, how are you?", |
| "chat": [ |
| { |
| "role": "system", |
| "content": "You are a helpful assistant." |
| }, |
| { |
| "role": "user", |
| "content": "Hello, how are you?" |
| } |
| ] |
| } |
| } |
| }, |
| "version_history": { |
| "2.5.0-rnd": { |
| "release_date": "2025-01-30", |
| "status": "current", |
| "changes": [ |
| "Initial research release", |
| "70B parameter model", |
| "131K context with YARN", |
| "SafeTensors format (96 shards)", |
| "Full precision (BF16)" |
| ] |
| } |
| }, |
| "roadmap": { |
| "upcoming_variants": [ |
| { |
| "name": "Helion-2.5-Rnd-Instruct", |
| "expected": "Q2 2025", |
| "status": "in_development" |
| }, |
| { |
| "name": "Helion-2.5-Rnd-Chat", |
| "expected": "Q2 2025", |
| "status": "planned" |
| }, |
| { |
| "name": "Helion-2.5-Rnd-Code", |
| "expected": "Q3 2025", |
| "status": "planned" |
| } |
| ], |
| "future_features": [ |
| "Multi-modal capabilities", |
| "Extended context to 256K", |
| "Improved multilingual support", |
| "Domain-specific variants" |
| ] |
| } |
| } |