Create metadata.json
Browse files- metadata.json +263 -0
metadata.json
ADDED
|
@@ -0,0 +1,263 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_id": "DeepXR/Helion-2.5-Rnd",
|
| 3 |
+
"model_name": "Helion-2.5-Rnd",
|
| 4 |
+
"full_name": "Helion 2.5 Research and Development",
|
| 5 |
+
"organization": "DeepXR",
|
| 6 |
+
"release_date": "2025-01-30",
|
| 7 |
+
"version": "2.5.0-rnd",
|
| 8 |
+
"status": "research",
|
| 9 |
+
"description": "Advanced research language model with 70B parameters, designed for exceptional performance across reasoning, code generation, mathematics, and multilingual understanding with 131K context window.",
|
| 10 |
+
"architecture": {
|
| 11 |
+
"type": "transformer",
|
| 12 |
+
"variant": "llama",
|
| 13 |
+
"parameters": "70B",
|
| 14 |
+
"layers": 32,
|
| 15 |
+
"hidden_size": 4096,
|
| 16 |
+
"attention_heads": 32,
|
| 17 |
+
"kv_heads": 8,
|
| 18 |
+
"intermediate_size": 14336,
|
| 19 |
+
"vocabulary_size": 128256,
|
| 20 |
+
"context_length": 131072,
|
| 21 |
+
"rope_theta": 500000,
|
| 22 |
+
"positional_encoding": "YARN",
|
| 23 |
+
"activation": "SiLU",
|
| 24 |
+
"normalization": "RMSNorm"
|
| 25 |
+
},
|
| 26 |
+
"capabilities": {
|
| 27 |
+
"text_generation": {
|
| 28 |
+
"enabled": true,
|
| 29 |
+
"quality": "high",
|
| 30 |
+
"max_length": 131072
|
| 31 |
+
},
|
| 32 |
+
"code_generation": {
|
| 33 |
+
"enabled": true,
|
| 34 |
+
"languages": [
|
| 35 |
+
"Python", "JavaScript", "TypeScript", "Java", "C++", "C#", "Go",
|
| 36 |
+
"Rust", "Swift", "Kotlin", "Ruby", "PHP", "Scala", "R"
|
| 37 |
+
],
|
| 38 |
+
"quality": "high"
|
| 39 |
+
},
|
| 40 |
+
"mathematics": {
|
| 41 |
+
"enabled": true,
|
| 42 |
+
"capabilities": [
|
| 43 |
+
"arithmetic", "algebra", "calculus", "statistics", "proof_generation"
|
| 44 |
+
],
|
| 45 |
+
"quality": "high"
|
| 46 |
+
},
|
| 47 |
+
"reasoning": {
|
| 48 |
+
"enabled": true,
|
| 49 |
+
"types": [
|
| 50 |
+
"logical", "analytical", "common_sense", "abstract"
|
| 51 |
+
],
|
| 52 |
+
"quality": "high"
|
| 53 |
+
},
|
| 54 |
+
"multilingual": {
|
| 55 |
+
"enabled": true,
|
| 56 |
+
"languages": 50,
|
| 57 |
+
"primary_languages": [
|
| 58 |
+
"English", "Spanish", "French", "German", "Chinese", "Japanese",
|
| 59 |
+
"Korean", "Russian", "Arabic", "Hindi", "Portuguese", "Italian"
|
| 60 |
+
]
|
| 61 |
+
},
|
| 62 |
+
"long_context": {
|
| 63 |
+
"enabled": true,
|
| 64 |
+
"max_tokens": 131072,
|
| 65 |
+
"performance": "optimized"
|
| 66 |
+
}
|
| 67 |
+
},
|
| 68 |
+
"performance": {
|
| 69 |
+
"benchmarks": {
|
| 70 |
+
"mmlu": {
|
| 71 |
+
"score": 0.847,
|
| 72 |
+
"description": "Massive Multitask Language Understanding"
|
| 73 |
+
},
|
| 74 |
+
"gsm8k": {
|
| 75 |
+
"score": 0.892,
|
| 76 |
+
"description": "Grade School Math 8K"
|
| 77 |
+
},
|
| 78 |
+
"humaneval": {
|
| 79 |
+
"score": 0.756,
|
| 80 |
+
"description": "Code Generation Accuracy"
|
| 81 |
+
},
|
| 82 |
+
"mbpp": {
|
| 83 |
+
"score": 0.723,
|
| 84 |
+
"description": "Python Programming Benchmark"
|
| 85 |
+
},
|
| 86 |
+
"arc_challenge": {
|
| 87 |
+
"score": 0.834,
|
| 88 |
+
"description": "ARC Challenge Reasoning"
|
| 89 |
+
},
|
| 90 |
+
"hellaswag": {
|
| 91 |
+
"score": 0.889,
|
| 92 |
+
"description": "Common Sense Inference"
|
| 93 |
+
},
|
| 94 |
+
"winogrande": {
|
| 95 |
+
"score": 0.823,
|
| 96 |
+
"description": "Commonsense Reasoning"
|
| 97 |
+
},
|
| 98 |
+
"truthfulqa": {
|
| 99 |
+
"score": 0.612,
|
| 100 |
+
"description": "Truthfulness in QA"
|
| 101 |
+
}
|
| 102 |
+
},
|
| 103 |
+
"inference": {
|
| 104 |
+
"throughput_tokens_per_second": "30-50",
|
| 105 |
+
"latency_first_token_ms": "100-300",
|
| 106 |
+
"optimal_batch_size": "1-32",
|
| 107 |
+
"memory_requirement_gb": 140
|
| 108 |
+
}
|
| 109 |
+
},
|
| 110 |
+
"technical_details": {
|
| 111 |
+
"precision": "bfloat16",
|
| 112 |
+
"weight_format": "safetensors",
|
| 113 |
+
"total_shards": 96,
|
| 114 |
+
"shard_size_avg_gb": 1.46,
|
| 115 |
+
"total_size_gb": 140,
|
| 116 |
+
"quantization": "none",
|
| 117 |
+
"optimization": [
|
| 118 |
+
"Flash Attention 2",
|
| 119 |
+
"Grouped Query Attention",
|
| 120 |
+
"Tensor Parallelism",
|
| 121 |
+
"Pipeline Parallelism"
|
| 122 |
+
]
|
| 123 |
+
},
|
| 124 |
+
"training": {
|
| 125 |
+
"steps": 150000,
|
| 126 |
+
"warmup_steps": 2000,
|
| 127 |
+
"learning_rate": 2e-05,
|
| 128 |
+
"optimizer": "AdamW",
|
| 129 |
+
"scheduler": "cosine_with_restarts",
|
| 130 |
+
"precision": "bfloat16",
|
| 131 |
+
"gradient_accumulation": 8,
|
| 132 |
+
"batch_size": 4,
|
| 133 |
+
"parallelization": {
|
| 134 |
+
"tensor_parallel": 4,
|
| 135 |
+
"pipeline_parallel": 2
|
| 136 |
+
}
|
| 137 |
+
},
|
| 138 |
+
"hardware_requirements": {
|
| 139 |
+
"minimum": {
|
| 140 |
+
"gpus": "2x NVIDIA A100 80GB",
|
| 141 |
+
"vram_gb": 160,
|
| 142 |
+
"ram_gb": 256,
|
| 143 |
+
"storage_gb": 500,
|
| 144 |
+
"network": "10Gbps"
|
| 145 |
+
},
|
| 146 |
+
"recommended": {
|
| 147 |
+
"gpus": "4x NVIDIA H100 80GB",
|
| 148 |
+
"vram_gb": 320,
|
| 149 |
+
"ram_gb": 512,
|
| 150 |
+
"storage_gb": 1000,
|
| 151 |
+
"network": "100Gbps InfiniBand"
|
| 152 |
+
}
|
| 153 |
+
},
|
| 154 |
+
"usage": {
|
| 155 |
+
"intended_uses": [
|
| 156 |
+
"Research and development",
|
| 157 |
+
"Advanced reasoning tasks",
|
| 158 |
+
"Code generation and analysis",
|
| 159 |
+
"Mathematical problem solving",
|
| 160 |
+
"Multilingual applications",
|
| 161 |
+
"Long document understanding",
|
| 162 |
+
"Creative writing",
|
| 163 |
+
"Educational purposes"
|
| 164 |
+
],
|
| 165 |
+
"not_recommended": [
|
| 166 |
+
"Production without validation",
|
| 167 |
+
"Critical decision-making without oversight",
|
| 168 |
+
"Medical diagnosis",
|
| 169 |
+
"Legal advice",
|
| 170 |
+
"Financial advice",
|
| 171 |
+
"Safety-critical systems"
|
| 172 |
+
]
|
| 173 |
+
},
|
| 174 |
+
"limitations": [
|
| 175 |
+
"Research model - requires validation",
|
| 176 |
+
"May exhibit training data biases",
|
| 177 |
+
"Can generate incorrect information",
|
| 178 |
+
"Performance varies by domain",
|
| 179 |
+
"Context degradation beyond 64K tokens",
|
| 180 |
+
"Requires significant compute resources"
|
| 181 |
+
],
|
| 182 |
+
"ethical_considerations": {
|
| 183 |
+
"bias_mitigation": "Ongoing evaluation and monitoring",
|
| 184 |
+
"safety_features": [
|
| 185 |
+
"Content filtering",
|
| 186 |
+
"PII detection",
|
| 187 |
+
"Toxicity monitoring",
|
| 188 |
+
"Prompt injection protection"
|
| 189 |
+
],
|
| 190 |
+
"responsible_use": [
|
| 191 |
+
"Verify outputs for critical applications",
|
| 192 |
+
"Monitor for bias",
|
| 193 |
+
"Implement content filtering",
|
| 194 |
+
"Respect privacy and data protection"
|
| 195 |
+
]
|
| 196 |
+
},
|
| 197 |
+
"license": {
|
| 198 |
+
"type": "Apache-2.0",
|
| 199 |
+
"url": "https://www.apache.org/licenses/LICENSE-2.0",
|
| 200 |
+
"commercial_use": true,
|
| 201 |
+
"modification": true,
|
| 202 |
+
"distribution": true,
|
| 203 |
+
"patent_use": true,
|
| 204 |
+
"private_use": true
|
| 205 |
+
},
|
| 206 |
+
"files": {
|
| 207 |
+
"safetensors": {
|
| 208 |
+
"format": "safetensors",
|
| 209 |
+
"num_shards": 96,
|
| 210 |
+
"pattern": "model-{:05d}-of-00096.safetensors",
|
| 211 |
+
"index_file": "model.safetensors.index.json",
|
| 212 |
+
"checksums_available": true
|
| 213 |
+
},
|
| 214 |
+
"config": [
|
| 215 |
+
"config.json",
|
| 216 |
+
"generation_config.json",
|
| 217 |
+
"tokenizer_config.json",
|
| 218 |
+
"model_config.yaml"
|
| 219 |
+
],
|
| 220 |
+
"inference": [
|
| 221 |
+
"inference/server.py",
|
| 222 |
+
"inference/client.py",
|
| 223 |
+
"inference/utils.py",
|
| 224 |
+
"inference/security.py",
|
| 225 |
+
"inference/evaluate.py",
|
| 226 |
+
"inference/batch_inference.py",
|
| 227 |
+
"inference/optimizer.py",
|
| 228 |
+
"inference/benchmark.py"
|
| 229 |
+
]
|
| 230 |
+
},
|
| 231 |
+
"links": {
|
| 232 |
+
"repository": "https://huggingface.co/DeepXR/Helion-2.5-Rnd",
|
| 233 |
+
"organization": "https://deepxr.ai",
|
| 234 |
+
"documentation": "https://docs.deepxr.ai/helion",
|
| 235 |
+
"paper": null,
|
| 236 |
+
"demo": null
|
| 237 |
+
},
|
| 238 |
+
"contact": {
|
| 239 |
+
"email": "[email protected]",
|
| 240 |
+
"research_email": "[email protected]",
|
| 241 |
+
"security_email": "[email protected]",
|
| 242 |
+
"website": "https://deepxr.ai"
|
| 243 |
+
},
|
| 244 |
+
"citation": {
|
| 245 |
+
"format": "bibtex",
|
| 246 |
+
"text": "@misc{helion-2.5-rnd-2025,\n title={Helion-2.5-Rnd: Advanced Research Language Model},\n author={DeepXR Research Team},\n year={2025},\n publisher={DeepXR},\n url={https://huggingface.co/DeepXR/Helion-2.5-Rnd}\n}"
|
| 247 |
+
},
|
| 248 |
+
"changelog": [
|
| 249 |
+
{
|
| 250 |
+
"version": "2.5.0-rnd",
|
| 251 |
+
"date": "2025-01-30",
|
| 252 |
+
"changes": [
|
| 253 |
+
"Initial research release",
|
| 254 |
+
"70B parameter model",
|
| 255 |
+
"131K context window with YARN",
|
| 256 |
+
"SafeTensors format (96 shards)",
|
| 257 |
+
"Comprehensive inference suite",
|
| 258 |
+
"Security implementation",
|
| 259 |
+
"Optimization tools"
|
| 260 |
+
]
|
| 261 |
+
}
|
| 262 |
+
]
|
| 263 |
+
}
|