Luigi
/

SmolLM2-135M-Instruct-TaiwanChat

Generated from Trainer

Model card Files Files and versions

Metrics Training metrics Community

Luigi committed on Apr 24

Commit

a4e859e

·

verified ·

1 Parent(s): e2fbc94

Model save

Files changed (3) hide show

README.md +2 -2
adapter_config.json +5 -5
adapter_model.safetensors +1 -1

README.md CHANGED Viewed

@@ -15,8 +15,8 @@ model-index:
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 should probably proofread and complete it, then remove this comment. -->
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/pesi/SmolLM2-135M-Instruct-TaiwanChat_CLOUD/runs/3n6j9mm5)
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/pesi/SmolLM2-135M-Instruct-TaiwanChat_CLOUD/runs/3n6j9mm5)
 # SmolLM2-135M-Instruct-TaiwanChat
 This model is a fine-tuned version of [unsloth/SmolLM2-135M-Instruct](https://huggingface.co/unsloth/SmolLM2-135M-Instruct) on an unknown dataset.

 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 should probably proofread and complete it, then remove this comment. -->
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/pesi/SmolLM2-135M-Instruct-TaiwanChat_CLOUD/runs/9fnxruem)
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/pesi/SmolLM2-135M-Instruct-TaiwanChat_CLOUD/runs/9fnxruem)
 # SmolLM2-135M-Instruct-TaiwanChat
 This model is a fine-tuned version of [unsloth/SmolLM2-135M-Instruct](https://huggingface.co/unsloth/SmolLM2-135M-Instruct) on an unknown dataset.

adapter_config.json CHANGED Viewed

@@ -23,13 +23,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "v_proj",
-    "down_proj",
-    "up_proj",
-    "gate_proj",
     "o_proj",
     "q_proj",
-    "k_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "o_proj",
     "q_proj",
+    "down_proj",
+    "v_proj",
+    "gate_proj",
+    "k_proj",
+    "up_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:144ab0069994067311f6d6e928dc4ab81f91ab746e0f7f9655d5f05d1fe092d5
 size 19593064

 version https://git-lfs.github.com/spec/v1
+oid sha256:66579a549c4e35cb144962f30b1a0a5bbcfe42f06a70712a6353882737bfb256
 size 19593064