Spaces:
Running
on
Zero
Running
on
Zero
Update to account for MobileLLM-Pro repository split (#1)
Browse files — Update to account for MobileLLM-Pro repository split (dab7631d3bafef88b7c5376ff04bac0cd38f9cfb)
Co-authored-by: Patrick Huber <[email protected]>
app.py
CHANGED
@@ -9,7 +9,6 @@ from huggingface_hub import login
|
|
9 |
import spaces
|
10 |
|
11 |
MODEL_ID = "facebook/MobileLLM-Pro"
|
12 |
-
SUBFOLDER = "instruct" # use the chat template
|
13 |
MAX_NEW_TOKENS = 256
|
14 |
TEMPERATURE = 0.7
|
15 |
TOP_P = 0.95
|
@@ -32,12 +31,11 @@ def _ensure_loaded():
|
|
32 |
if _tokenizer is not None and _model is not None:
|
33 |
return
|
34 |
_tokenizer = AutoTokenizer.from_pretrained(
|
35 |
-
MODEL_ID, trust_remote_code=True
|
36 |
)
|
37 |
_model = AutoModelForCausalLM.from_pretrained(
|
38 |
MODEL_ID,
|
39 |
trust_remote_code=True,
|
40 |
-
subfolder=SUBFOLDER,
|
41 |
torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
|
42 |
low_cpu_mem_usage=True,
|
43 |
device_map="auto" if torch.cuda.is_available() else None,
|
|
|
9 |
import spaces
|
10 |
|
11 |
MODEL_ID = "facebook/MobileLLM-Pro"
|
|
|
12 |
MAX_NEW_TOKENS = 256
|
13 |
TEMPERATURE = 0.7
|
14 |
TOP_P = 0.95
|
|
|
31 |
if _tokenizer is not None and _model is not None:
|
32 |
return
|
33 |
_tokenizer = AutoTokenizer.from_pretrained(
|
34 |
+
MODEL_ID, trust_remote_code=True
|
35 |
)
|
36 |
_model = AutoModelForCausalLM.from_pretrained(
|
37 |
MODEL_ID,
|
38 |
trust_remote_code=True,
|
|
|
39 |
torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
|
40 |
low_cpu_mem_usage=True,
|
41 |
device_map="auto" if torch.cuda.is_available() else None,
|