michaelfeil
/

ct2fast-flan-alpaca-base

Model card Files Files and versions

michaelfeil committed on May 1, 2023

Commit

3d7749e

·

1 Parent(s): 6614ed4

Update README.md

Files changed (1) hide show

README.md +3 -1

README.md CHANGED Viewed

@@ -1,5 +1,7 @@
 ---
 license: apache-2.0
 ---
 # Fast Inference with CTranslate2
 Speed up inference by 2x-8x using int8 inference in C++
@@ -18,7 +20,7 @@ Checkpoint compatible to [ctranslate2](https://github.com/OpenNMT/CTranslate2) a
 from hf_hub_ctranslate2 import TranslatorCT2fromHfHub, GeneratorCT2fromHfHub
 model_name = "michaelfeil/ct2fast-flan-alpaca-base"
-model = GeneratorCT2fromHfHub(
         # load in int8 on CUDA
         model_name_or_path=model_name,
         device="cuda",

 ---
 license: apache-2.0
+tags:
+- ctranslate2
 ---
 # Fast Inference with CTranslate2
 Speed up inference by 2x-8x using int8 inference in C++
 from hf_hub_ctranslate2 import TranslatorCT2fromHfHub, GeneratorCT2fromHfHub
 model_name = "michaelfeil/ct2fast-flan-alpaca-base"
+model = TranslatorCT2fromHfHub(
         # load in int8 on CUDA
         model_name_or_path=model_name,
         device="cuda",