Update app.py
app.py CHANGED
@@ -682,16 +682,17 @@ def replace_attention_with_retention(model, use_hierarchical=True, structure_inf
 
 def generate_modeling_phoenix_code():
     """
-    Generate the PHOENIX custom modeling code, v1.4.2
-    ✅ FIX: improved Embedding Tying
+    Generate the PHOENIX custom modeling code, v1.4.3
+    ✅ FIX: Retention conversion included
     """
 
     modeling_code = '''"""
-PHOENIX Retention Model - Custom Implementation v1.4.2
+PHOENIX Retention Model - Custom Implementation v1.4.3
 Auto-loaded by HuggingFace transformers with trust_remote_code=True
 
-✅ FIX v1.4.2: improved Embedding Tying
-✅ FIX v1.4.1: direct State Dict load
+✅ FIX v1.4.3: Retention conversion runs automatically
+✅ FIX v1.4.2: improved Embedding Tying
+✅ FIX v1.4.1: direct State Dict load
 
 VIDraft AI Research Lab
 """
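For context: generate_modeling_phoenix_code() returns the module source above as a string, which the app then writes next to the checkpoint so that trust_remote_code=True can import it. A minimal sketch of that step, assuming a save_dir variable and the conventional modeling_phoenix.py file name (neither appears in this diff):

    import os

    save_dir = "./phoenix_checkpoint"           # hypothetical output directory
    code = generate_modeling_phoenix_code()     # the module source as one string
    with open(os.path.join(save_dir, "modeling_phoenix.py"), "w", encoding="utf-8") as f:
        f.write(code)
    # config.json must also carry an auto_map entry pointing at this file, e.g.
    # "AutoModelForCausalLM": "modeling_phoenix.PhoenixModelForCausalLM".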
@@ -712,7 +713,7 @@ class PhoenixConfig(PretrainedConfig):
     def __init__(
         self,
         use_phoenix_retention=True,
-        phoenix_version="1.4.2",
+        phoenix_version="1.4.3",
         original_architecture=None,
         original_model=None,
         **kwargs
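A quick sketch of how the bumped default surfaces, as hypothetical usage (not part of the diff), assuming PhoenixConfig is importable from the generated module:

    cfg = PhoenixConfig()                        # defaults from the generated code
    print(cfg.use_phoenix_retention)             # True
    print(cfg.phoenix_version)                   # "1.4.3"
    cfg.save_pretrained("./phoenix_checkpoint")  # serialized into config.json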
@@ -724,32 +725,43 @@ class PhoenixConfig(PretrainedConfig):
         self.original_model = original_model
 
 
-# …
-""" …
-if …
+# ✅ CRITICAL: the Retention classes must be included!
+# (insert the full MultiScaleRetention and HierarchicalRetention code here)
 
 
+def replace_attention_with_retention_for_loading(model, use_hierarchical=True):
+    """
+    Automatically converts Attention → Retention when loading from the Hub.
+    """
+    print("🔄 Converting Attention → Retention for loaded model...")
+
+    layers = None
+    if hasattr(model, 'model') and hasattr(model.model, 'layers'):
+        layers = model.model.layers
+
+    if layers is None:
+        print("❌ Cannot find layers")
+        return model, 0, 0
+
+    replaced_count = 0
+    for layer_idx, layer in enumerate(layers):
+        if hasattr(layer, 'self_attn'):
+            if use_hierarchical:
+                new_retention = HierarchicalRetention(model.config, layer_idx)
+            else:
+                new_retention = MultiScaleRetention(model.config, layer_idx)
+
+            layer.self_attn = new_retention
+            replaced_count += 1
+
+    print(f"✅ Converted {replaced_count}/{len(layers)} layers")
+    return model, replaced_count, len(layers)
 
 
 class PhoenixModelForCausalLM(PhoenixPreTrainedModel):
     """
-    PHOENIX Model for Causal Language Modeling v1.4.2
-    ✅ FIX: improved Embedding Tying
+    PHOENIX Model for Causal Language Modeling v1.4.3
+    ✅ FIX: automatic Retention conversion included
     """
 
     def __init__(self, config):
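The swap above only works if the replacement module is call-compatible with the self_attn it displaces. A minimal stub showing that contract, as a sketch; the real MultiScaleRetention and HierarchicalRetention definitions live elsewhere in app.py, and everything below (layer shapes, return tuple) is an assumption about the interface, not the actual implementation:

    import torch.nn as nn

    class MultiScaleRetention(nn.Module):
        """Interface stub only; the full implementation is pasted into the generated file."""

        def __init__(self, config, layer_idx):
            super().__init__()
            self.layer_idx = layer_idx
            self.o_proj = nn.Linear(config.hidden_size, config.hidden_size, bias=False)

        def forward(self, hidden_states, attention_mask=None, position_ids=None,
                    past_key_value=None, output_attentions=False, use_cache=False, **kwargs):
            # Must mirror the (attn_output, attn_weights, past_key_value) tuple
            # that the surrounding decoder layer expects from self_attn.
            return self.o_proj(hidden_states), None, past_key_value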
@@ -760,7 +772,7 @@ class PhoenixModelForCausalLM(PhoenixPreTrainedModel):
 
     @classmethod
     def from_pretrained(cls, pretrained_model_name_or_path, *model_args, **kwargs):
-        """🔥 PHOENIX auto-loading! v1.4.2"""
+        """🔥 PHOENIX auto-loading! v1.4.3"""
         print(f"🔥 Loading PHOENIX model from {pretrained_model_name_or_path}")
 
         config = AutoConfig.from_pretrained(pretrained_model_name_or_path, trust_remote_code=True)
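With this from_pretrained override in place, loading stays one line on the user side. A sketch; the repo id is a placeholder, not a real checkpoint:

    from transformers import AutoModelForCausalLM

    model = AutoModelForCausalLM.from_pretrained(
        "VIDraft/phoenix-demo",   # placeholder repo id
        trust_remote_code=True,   # lets transformers execute modeling_phoenix.py
    )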
@@ -780,9 +792,12 @@ class PhoenixModelForCausalLM(PhoenixPreTrainedModel):
 
         print(f" ✅ Created base structure")
 
-        # …
+        # ✅ CRITICAL FIX: run the Retention conversion!
+        base_model, converted, total = replace_attention_with_retention_for_loading(
+            base_model, use_hierarchical
+        )
 
+        # load the state_dict
         state_dict = None
 
         if os.path.exists(pretrained_model_name_or_path):
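The local-path branch that follows presumably resolves the checkpoint file itself. One common way that resolution looks, as a sketch under stated assumptions (file names assumed; a sharded checkpoint would also need its index file):

    import os
    import torch
    from safetensors.torch import load_file

    def load_local_state_dict(path):
        # Prefer safetensors, fall back to the legacy pickle format.
        st = os.path.join(path, "model.safetensors")
        pt = os.path.join(path, "pytorch_model.bin")
        if os.path.exists(st):
            return load_file(st)
        if os.path.exists(pt):
            return torch.load(pt, map_location="cpu")
        return None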
@@ -830,7 +845,7 @@ class PhoenixModelForCausalLM(PhoenixPreTrainedModel):
             print(f" Missing keys: {len(missing)}")
             print(f" Unexpected keys: {len(unexpected)}")
 
-            # ✅ …
+            # ✅ Embedding Tying
             if 'lm_head.weight' in missing:
                 print(f" ⚠️ lm_head.weight missing - checking tie_word_embeddings...")
 
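For orientation: missing and unexpected here are the two lists a non-strict load returns, e.g.:

    # strict=False tolerates key mismatches and reports them instead of raising
    missing, unexpected = base_model.load_state_dict(state_dict, strict=False)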
@@ -842,7 +857,6 @@ class PhoenixModelForCausalLM(PhoenixPreTrainedModel):
                     print(f" 🔗 Tying lm_head.weight to embed_tokens.weight...")
                     base_model.lm_head.weight = base_model.model.embed_tokens.weight
                     print(f" ✅ Embedding tying applied!")
-                    print(f" Verification: {base_model.lm_head.weight is base_model.model.embed_tokens.weight}")
 
         retention_keys = [k for k in state_dict.keys() if 'retention' in k.lower()]
         if retention_keys:
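The removed verification print only confirmed the aliasing that the assignment already guarantees, since the weight tensor is shared rather than copied. The stock transformers route is tie_weights(); a sketch, assuming the model implements get_input_embeddings/get_output_embeddings and config.tie_word_embeddings is set:

    base_model.config.tie_word_embeddings = True
    base_model.tie_weights()   # re-ties lm_head to the input embeddings
    assert base_model.lm_head.weight is base_model.model.embed_tokens.weight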