Luigi
/

SmolLM2-135M-Instruct-TaiwanChat

@@ -16,11 +16,11 @@ from transformers import EvalPrediction
 PROJECT_NAME='SmolLM2-135M-Instruct-TaiwanChat'
 BASE_MODEL_ID="HuggingFaceTB/SmolLM2-135M-Instruct"
 DATASET_ID="yentinglin/TaiwanChat"
-N_SAMPLES=85840
 MAX_LEN=256
 # Tell W&B which project to log runs to, and to upload the model once training ends
-os.environ["WANDB_PROJECT"]    = PROJECT_NAME
 os.environ["WANDB_LOG_MODEL"]  = "end"
 # Detect GPU Type
@@ -139,7 +139,7 @@ training_args = TrainingArguments(
     # ─── W&B integration ───
     logging_dir=f"{PROJECT_NAME}/logs",    # where to store TensorBoard/W&B logs
     report_to=["wandb"],                   # enable W&B reporting
-    run_name=PROJECT_NAME,                 # name this run in your W&B project
     push_to_hub=True,
     gradient_checkpointing=True,

 PROJECT_NAME='SmolLM2-135M-Instruct-TaiwanChat'
 BASE_MODEL_ID="HuggingFaceTB/SmolLM2-135M-Instruct"
 DATASET_ID="yentinglin/TaiwanChat"
+N_SAMPLES=40000
 MAX_LEN=256
 # Tell W&B which project to log runs to, and to upload the model once training ends
+os.environ["WANDB_PROJECT"]    = f"{PROJECT_NAME}_CLOUD"
 os.environ["WANDB_LOG_MODEL"]  = "end"
 # Detect GPU Type
     # ─── W&B integration ───
     logging_dir=f"{PROJECT_NAME}/logs",    # where to store TensorBoard/W&B logs
     report_to=["wandb"],                   # enable W&B reporting
+    run_name=f"{PROJECT_NAME}_CLOUD",                 # name this run in your W&B project
     push_to_hub=True,
     gradient_checkpointing=True,