Update README.md
Browse files
README.md
CHANGED
@@ -5577,6 +5577,21 @@ Usage with [Infinity, MIT Licensed Inference Server](https://github.com/michaelf
|
|
5577 |
docker run --gpus all -v $PWD/data:/app/.cache \
|
5578 |
michaelf34/infinity:0.0.69-trt-onnx \
|
5579 |
v2 --model-id dunzhang/stella_en_1.5B_v5 --batch-size 16 --device cuda --engine torch --port 7997
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
5580 |
```
|
5581 |
|
5582 |
# FAQ
|
|
|
5577 |
docker run --gpus all -v $PWD/data:/app/.cache \
|
5578 |
michaelf34/infinity:0.0.69-trt-onnx \
|
5579 |
v2 --model-id dunzhang/stella_en_1.5B_v5 --batch-size 16 --device cuda --engine torch --port 7997
|
5580 |
+
```
|
5581 |
+
# Citation
|
5582 |
+
|
5583 |
+
```
|
5584 |
+
|
5585 |
+
@misc{zhang2025jasperstelladistillationsota,
|
5586 |
+
title={Jasper and Stella: distillation of SOTA embedding models},
|
5587 |
+
author={Dun Zhang and Jiacheng Li and Ziyang Zeng and Fulong Wang},
|
5588 |
+
year={2025},
|
5589 |
+
eprint={2412.19048},
|
5590 |
+
archivePrefix={arXiv},
|
5591 |
+
primaryClass={cs.IR},
|
5592 |
+
url={https://arxiv.org/abs/2412.19048},
|
5593 |
+
}
|
5594 |
+
|
5595 |
```
|
5596 |
|
5597 |
# FAQ
|