Trouter-Library committed on
Commit
e9b17f1
·
verified ·
1 Parent(s): 02ba82e

Create metadata.json

Browse files
Files changed (1) hide show
  1. metadata.json +263 -0
metadata.json ADDED
@@ -0,0 +1,263 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_id": "DeepXR/Helion-2.5-Rnd",
3
+ "model_name": "Helion-2.5-Rnd",
4
+ "full_name": "Helion 2.5 Research and Development",
5
+ "organization": "DeepXR",
6
+ "release_date": "2025-01-30",
7
+ "version": "2.5.0-rnd",
8
+ "status": "research",
9
+ "description": "Advanced research language model with 70B parameters, designed for exceptional performance across reasoning, code generation, mathematics, and multilingual understanding with a 131K context window.",
10
+ "architecture": {
11
+ "type": "transformer",
12
+ "variant": "llama",
13
+ "parameters": "70B",
14
+ "layers": 32,
15
+ "hidden_size": 4096,
16
+ "attention_heads": 32,
17
+ "kv_heads": 8,
18
+ "intermediate_size": 14336,
19
+ "vocabulary_size": 128256,
20
+ "context_length": 131072,
21
+ "rope_theta": 500000,
22
+ "positional_encoding": "YARN",
23
+ "activation": "SiLU",
24
+ "normalization": "RMSNorm"
25
+ },
26
+ "capabilities": {
27
+ "text_generation": {
28
+ "enabled": true,
29
+ "quality": "high",
30
+ "max_length": 131072
31
+ },
32
+ "code_generation": {
33
+ "enabled": true,
34
+ "languages": [
35
+ "Python", "JavaScript", "TypeScript", "Java", "C++", "C#", "Go",
36
+ "Rust", "Swift", "Kotlin", "Ruby", "PHP", "Scala", "R"
37
+ ],
38
+ "quality": "high"
39
+ },
40
+ "mathematics": {
41
+ "enabled": true,
42
+ "capabilities": [
43
+ "arithmetic", "algebra", "calculus", "statistics", "proof_generation"
44
+ ],
45
+ "quality": "high"
46
+ },
47
+ "reasoning": {
48
+ "enabled": true,
49
+ "types": [
50
+ "logical", "analytical", "common_sense", "abstract"
51
+ ],
52
+ "quality": "high"
53
+ },
54
+ "multilingual": {
55
+ "enabled": true,
56
+ "languages": 50,
57
+ "primary_languages": [
58
+ "English", "Spanish", "French", "German", "Chinese", "Japanese",
59
+ "Korean", "Russian", "Arabic", "Hindi", "Portuguese", "Italian"
60
+ ]
61
+ },
62
+ "long_context": {
63
+ "enabled": true,
64
+ "max_tokens": 131072,
65
+ "performance": "optimized"
66
+ }
67
+ },
68
+ "performance": {
69
+ "benchmarks": {
70
+ "mmlu": {
71
+ "score": 0.847,
72
+ "description": "Massive Multitask Language Understanding"
73
+ },
74
+ "gsm8k": {
75
+ "score": 0.892,
76
+ "description": "Grade School Math 8K"
77
+ },
78
+ "humaneval": {
79
+ "score": 0.756,
80
+ "description": "Code Generation Accuracy"
81
+ },
82
+ "mbpp": {
83
+ "score": 0.723,
84
+ "description": "Python Programming Benchmark"
85
+ },
86
+ "arc_challenge": {
87
+ "score": 0.834,
88
+ "description": "ARC Challenge Reasoning"
89
+ },
90
+ "hellaswag": {
91
+ "score": 0.889,
92
+ "description": "Common Sense Inference"
93
+ },
94
+ "winogrande": {
95
+ "score": 0.823,
96
+ "description": "Commonsense Reasoning"
97
+ },
98
+ "truthfulqa": {
99
+ "score": 0.612,
100
+ "description": "Truthfulness in QA"
101
+ }
102
+ },
103
+ "inference": {
104
+ "throughput_tokens_per_second": "30-50",
105
+ "latency_first_token_ms": "100-300",
106
+ "optimal_batch_size": "1-32",
107
+ "memory_requirement_gb": 140
108
+ }
109
+ },
110
+ "technical_details": {
111
+ "precision": "bfloat16",
112
+ "weight_format": "safetensors",
113
+ "total_shards": 96,
114
+ "shard_size_avg_gb": 1.46,
115
+ "total_size_gb": 140,
116
+ "quantization": "none",
117
+ "optimization": [
118
+ "Flash Attention 2",
119
+ "Grouped Query Attention",
120
+ "Tensor Parallelism",
121
+ "Pipeline Parallelism"
122
+ ]
123
+ },
124
+ "training": {
125
+ "steps": 150000,
126
+ "warmup_steps": 2000,
127
+ "learning_rate": 2e-05,
128
+ "optimizer": "AdamW",
129
+ "scheduler": "cosine_with_restarts",
130
+ "precision": "bfloat16",
131
+ "gradient_accumulation": 8,
132
+ "batch_size": 4,
133
+ "parallelization": {
134
+ "tensor_parallel": 4,
135
+ "pipeline_parallel": 2
136
+ }
137
+ },
138
+ "hardware_requirements": {
139
+ "minimum": {
140
+ "gpus": "2x NVIDIA A100 80GB",
141
+ "vram_gb": 160,
142
+ "ram_gb": 256,
143
+ "storage_gb": 500,
144
+ "network": "10Gbps"
145
+ },
146
+ "recommended": {
147
+ "gpus": "4x NVIDIA H100 80GB",
148
+ "vram_gb": 320,
149
+ "ram_gb": 512,
150
+ "storage_gb": 1000,
151
+ "network": "100Gbps InfiniBand"
152
+ }
153
+ },
154
+ "usage": {
155
+ "intended_uses": [
156
+ "Research and development",
157
+ "Advanced reasoning tasks",
158
+ "Code generation and analysis",
159
+ "Mathematical problem solving",
160
+ "Multilingual applications",
161
+ "Long document understanding",
162
+ "Creative writing",
163
+ "Educational purposes"
164
+ ],
165
+ "not_recommended": [
166
+ "Production without validation",
167
+ "Critical decision-making without oversight",
168
+ "Medical diagnosis",
169
+ "Legal advice",
170
+ "Financial advice",
171
+ "Safety-critical systems"
172
+ ]
173
+ },
174
+ "limitations": [
175
+ "Research model - requires validation",
176
+ "May exhibit training data biases",
177
+ "Can generate incorrect information",
178
+ "Performance varies by domain",
179
+ "Context degradation beyond 64K tokens",
180
+ "Requires significant compute resources"
181
+ ],
182
+ "ethical_considerations": {
183
+ "bias_mitigation": "Ongoing evaluation and monitoring",
184
+ "safety_features": [
185
+ "Content filtering",
186
+ "PII detection",
187
+ "Toxicity monitoring",
188
+ "Prompt injection protection"
189
+ ],
190
+ "responsible_use": [
191
+ "Verify outputs for critical applications",
192
+ "Monitor for bias",
193
+ "Implement content filtering",
194
+ "Respect privacy and data protection"
195
+ ]
196
+ },
197
+ "license": {
198
+ "type": "Apache-2.0",
199
+ "url": "https://www.apache.org/licenses/LICENSE-2.0",
200
+ "commercial_use": true,
201
+ "modification": true,
202
+ "distribution": true,
203
+ "patent_use": true,
204
+ "private_use": true
205
+ },
206
+ "files": {
207
+ "safetensors": {
208
+ "format": "safetensors",
209
+ "num_shards": 96,
210
+ "pattern": "model-{:05d}-of-00096.safetensors",
211
+ "index_file": "model.safetensors.index.json",
212
+ "checksums_available": true
213
+ },
214
+ "config": [
215
+ "config.json",
216
+ "generation_config.json",
217
+ "tokenizer_config.json",
218
+ "model_config.yaml"
219
+ ],
220
+ "inference": [
221
+ "inference/server.py",
222
+ "inference/client.py",
223
+ "inference/utils.py",
224
+ "inference/security.py",
225
+ "inference/evaluate.py",
226
+ "inference/batch_inference.py",
227
+ "inference/optimizer.py",
228
+ "inference/benchmark.py"
229
+ ]
230
+ },
231
+ "links": {
232
+ "repository": "https://huggingface.co/DeepXR/Helion-2.5-Rnd",
233
+ "organization": "https://deepxr.ai",
234
+ "documentation": "https://docs.deepxr.ai/helion",
235
+ "paper": null,
236
+ "demo": null
237
+ },
238
+ "contact": {
239
+ "email": "[email protected]",
240
+ "research_email": "[email protected]",
241
+ "security_email": "[email protected]",
242
+ "website": "https://deepxr.ai"
243
+ },
244
+ "citation": {
245
+ "format": "bibtex",
246
+ "text": "@misc{helion-2.5-rnd-2025,\n title={Helion-2.5-Rnd: Advanced Research Language Model},\n author={DeepXR Research Team},\n year={2025},\n publisher={DeepXR},\n url={https://huggingface.co/DeepXR/Helion-2.5-Rnd}\n}"
247
+ },
248
+ "changelog": [
249
+ {
250
+ "version": "2.5.0-rnd",
251
+ "date": "2025-01-30",
252
+ "changes": [
253
+ "Initial research release",
254
+ "70B parameter model",
255
+ "131K context window with YARN",
256
+ "SafeTensors format (96 shards)",
257
+ "Comprehensive inference suite",
258
+ "Security implementation",
259
+ "Optimization tools"
260
+ ]
261
+ }
262
+ ]
263
+ }