From 72743b2c3b5b59976e5d421d512512c6ff23dfdb Mon Sep 17 00:00:00 2001 From: Marcin Antas <antas.marcin@gmail.com> Date: Mon, 22 Apr 2024 07:23:42 +0200 Subject: [PATCH] Add support for Snowflake's Arctic models --- .github/workflows/main.yaml | 24 ++++++++++++++++++++++++ README.md | 8 ++++++++ 2 files changed, 32 insertions(+) diff --git a/.github/workflows/main.yaml b/.github/workflows/main.yaml index 83e39e7..e4c66ac 100644 --- a/.github/workflows/main.yaml +++ b/.github/workflows/main.yaml @@ -103,6 +103,30 @@ jobs: - model_name: mixedbread-ai/mxbai-embed-large-v1 model_tag_name: mixedbread-ai-mxbai-embed-large-v1 onnx_runtime: true + - model_name: Snowflake/snowflake-arctic-embed-xs + model_tag_name: snowflake-snowflake-arctic-embed-xs + onnx_runtime: false + - model_name: Snowflake/snowflake-arctic-embed-xs + model_tag_name: snowflake-snowflake-arctic-embed-xs + onnx_runtime: true + - model_name: Snowflake/snowflake-arctic-embed-s + model_tag_name: snowflake-snowflake-arctic-embed-s + onnx_runtime: false + - model_name: Snowflake/snowflake-arctic-embed-s + model_tag_name: snowflake-snowflake-arctic-embed-s + onnx_runtime: true + - model_name: Snowflake/snowflake-arctic-embed-m + model_tag_name: snowflake-snowflake-arctic-embed-m + onnx_runtime: false + - model_name: Snowflake/snowflake-arctic-embed-m + model_tag_name: snowflake-snowflake-arctic-embed-m + onnx_runtime: true + - model_name: Snowflake/snowflake-arctic-embed-l + model_tag_name: snowflake-snowflake-arctic-embed-l + onnx_runtime: false + - model_name: Snowflake/snowflake-arctic-embed-l + model_tag_name: snowflake-snowflake-arctic-embed-l + onnx_runtime: true env: LOCAL_REPO: transformers-inference REMOTE_REPO: semitechnologies/transformers-inference diff --git a/README.md b/README.md index 3a6336a..254b8d2 100644 --- a/README.md +++ b/README.md @@ -42,6 +42,10 @@ The pre-built models include: |`BAAI/bge-small-en-v1.5` ([Info](https://huggingface.co/BAAI/bge-small-en-v1.5))|`semitechnologies/transformers-inference:baai-bge-small-en-v1.5`| |`BAAI/bge-base-en-v1.5` ([Info](https://huggingface.co/BAAI/bge-base-en-v1.5))|`semitechnologies/transformers-inference:baai-bge-base-en-v1.5`| |`mixedbread-ai/mxbai-embed-large-v1` ([Info](https://huggingface.co/mixedbread-ai/mxbai-embed-large-v1))|`semitechnologies/transformers-inference:mixedbread-ai-mxbai-embed-large-v1`| +|`Snowflake/snowflake-arctic-embed-xs` ([Info](https://huggingface.co/Snowflake/snowflake-arctic-embed-xs))|`semitechnologies/transformers-inference:snowflake-snowflake-arctic-embed-xs`| +|`Snowflake/snowflake-arctic-embed-s` ([Info](https://huggingface.co/Snowflake/snowflake-arctic-embed-s))|`semitechnologies/transformers-inference:snowflake-snowflake-arctic-embed-s`| +|`Snowflake/snowflake-arctic-embed-m` ([Info](https://huggingface.co/Snowflake/snowflake-arctic-embed-m))|`semitechnologies/transformers-inference:snowflake-snowflake-arctic-embed-m`| +|`Snowflake/snowflake-arctic-embed-l` ([Info](https://huggingface.co/Snowflake/snowflake-arctic-embed-l))|`semitechnologies/transformers-inference:snowflake-snowflake-arctic-embed-l`| |DPR Models| |`facebook/dpr-ctx_encoder-single-nq-base` ([Info](https://huggingface.co/facebook/dpr-ctx_encoder-single-nq-base))|`semitechnologies/transformers-inference:facebook-dpr-ctx_encoder-single-nq-base`| |`facebook/dpr-question_encoder-single-nq-base` ([Info](https://huggingface.co/facebook/dpr-question_encoder-single-nq-base))|`semitechnologies/transformers-inference:facebook-dpr-question_encoder-single-nq-base`| @@ -56,6 +60,10 @@ The pre-built models include: |`BAAI/bge-m3` ([Info](https://huggingface.co/BAAI/bge-m3))|`semitechnologies/transformers-inference:baai-bge-m3-onnx`| |`sentence-transformers/all-MiniLM-L6-v2` ([Info](https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2))|`semitechnologies/transformers-inference:sentence-transformers-all-MiniLM-L6-v2-onnx`| |`mixedbread-ai/mxbai-embed-large-v1` ([Info](https://huggingface.co/mixedbread-ai/mxbai-embed-large-v1))|`semitechnologies/transformers-inference:mixedbread-ai-mxbai-embed-large-v1-onnx`| +|`Snowflake/snowflake-arctic-embed-xs` ([Info](https://huggingface.co/Snowflake/snowflake-arctic-embed-xs))|`semitechnologies/transformers-inference:snowflake-snowflake-arctic-embed-xs-onnx`| +|`Snowflake/snowflake-arctic-embed-s` ([Info](https://huggingface.co/Snowflake/snowflake-arctic-embed-s))|`semitechnologies/transformers-inference:snowflake-snowflake-arctic-embed-s-onnx`| +|`Snowflake/snowflake-arctic-embed-m` ([Info](https://huggingface.co/Snowflake/snowflake-arctic-embed-m))|`semitechnologies/transformers-inference:snowflake-snowflake-arctic-embed-m-onnx`| +|`Snowflake/snowflake-arctic-embed-l` ([Info](https://huggingface.co/Snowflake/snowflake-arctic-embed-l))|`semitechnologies/transformers-inference:snowflake-snowflake-arctic-embed-l-onnx`| The above image names always point to the latest version of the inference