Update README.md
Browse files
README.md
CHANGED
|
@@ -5577,6 +5577,21 @@ Usage with [Infinity, MIT Licensed Inference Server](https://github.com/michaelf
|
|
| 5577 |
docker run --gpus all -v $PWD/data:/app/.cache \
|
| 5578 |
michaelf34/infinity:0.0.69-trt-onnx \
|
| 5579 |
v2 --model-id dunzhang/stella_en_1.5B_v5 --batch-size 16 --device cuda --engine torch --port 7997
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5580 |
```
|
| 5581 |
|
| 5582 |
# FAQ
|
|
|
|
| 5577 |
docker run --gpus all -v $PWD/data:/app/.cache \
|
| 5578 |
michaelf34/infinity:0.0.69-trt-onnx \
|
| 5579 |
v2 --model-id dunzhang/stella_en_1.5B_v5 --batch-size 16 --device cuda --engine torch --port 7997
|
| 5580 |
+
```
|
| 5581 |
+
# Citation
|
| 5582 |
+
|
| 5583 |
+
```bibtex
|
| 5584 |
+
|
| 5585 |
+
@misc{zhang2025jasperstelladistillationsota,
|
| 5586 |
+
title={Jasper and Stella: distillation of SOTA embedding models},
|
| 5587 |
+
author={Dun Zhang and Jiacheng Li and Ziyang Zeng and Fulong Wang},
|
| 5588 |
+
year={2025},
|
| 5589 |
+
eprint={2412.19048},
|
| 5590 |
+
archivePrefix={arXiv},
|
| 5591 |
+
primaryClass={cs.IR},
|
| 5592 |
+
url={https://arxiv.org/abs/2412.19048},
|
| 5593 |
+
}
|
| 5594 |
+
|
| 5595 |
```
|
| 5596 |
|
| 5597 |
# FAQ
|