onnx

This is the ONNX export of the `thenlper/gte-small` embeddings model, created with the DeepSparse Optimum integration (`optimum-deepsparse`).

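To replicate the ONNX export, first install the DeepSparse Optimum integration from a shell:

pip install git+https://github.com/neuralmagic/optimum-deepsparse.git

Then run the following Python script:
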
from optimum.deepsparse import DeepSparseModelForFeatureExtraction
from transformers.onnx.utils import get_preprocessor
from pathlib import Path

# Source checkpoint to export, and the directory that receives the output.
model_id = "thenlper/gte-small"
onnx_path = Path("gte-small-dense")

# Loading with export=True converts the checkpoint to ONNX on the fly.
model = DeepSparseModelForFeatureExtraction.from_pretrained(
    model_id,
    export=True,
)
# Fetch the preprocessor (tokenizer) that belongs to the same checkpoint.
tokenizer = get_preprocessor(model_id)

# Write the ONNX checkpoint first, then the tokenizer, into the same folder.
for artifact in (model, tokenizer):
    artifact.save_pretrained(onnx_path)