Skip to content

Commit 40aeee2

Browse files
shaankhosla and Shaan authored
feat: Added AllMpnetBaseV2 (#195)
* new model
* update readme

---------

Co-authored-by: Shaan <[email protected]>
1 parent 678e27c commit 40aeee2

File tree

4 files changed

+14
-0
lines changed

4 files changed

+14
-0
lines changed

README.md

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -24,6 +24,7 @@
2424

2525
- [**BAAI/bge-small-en-v1.5**](https://huggingface.co/BAAI/bge-small-en-v1.5) - Default
2626
- [**sentence-transformers/all-MiniLM-L6-v2**](https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2)
27+
- [**sentence-transformers/all-mpnet-base-v2**](https://huggingface.co/sentence-transformers/all-mpnet-base-v2)
2728
- [**mixedbread-ai/mxbai-embed-large-v1**](https://huggingface.co/mixedbread-ai/mxbai-embed-large-v1)
2829
- [**Qdrant/clip-ViT-B-32-text**](https://huggingface.co/Qdrant/clip-ViT-B-32-text) - pairs with `clip-ViT-B-32-vision` for image-to-text search
2930
- [**BAAI/bge-large-en-v1.5**](https://huggingface.co/BAAI/bge-large-en-v1.5)

src/models/text_embedding.rs

Lines changed: 11 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -15,6 +15,8 @@ pub enum EmbeddingModel {
1515
AllMiniLML12V2,
1616
/// Quantized sentence-transformers/all-MiniLM-L12-v2
1717
AllMiniLML12V2Q,
18+
/// sentence-transformers/all-mpnet-base-v2
19+
AllMpnetBaseV2,
1820
/// BAAI/bge-base-en-v1.5
1921
BGEBaseENV15,
2022
/// Quantized BAAI/bge-base-en-v1.5
@@ -111,6 +113,15 @@ fn init_models_map() -> HashMap<EmbeddingModel, ModelInfo<EmbeddingModel>> {
111113
additional_files: Vec::new(),
112114
output_key: None,
113115
},
116+
ModelInfo {
117+
model: EmbeddingModel::AllMpnetBaseV2,
118+
dim: 768,
119+
description: String::from("Sentence Transformer model, mpnet-base-v2"),
120+
model_code: String::from("Xenova/all-mpnet-base-v2"),
121+
model_file: String::from("onnx/model.onnx"),
122+
additional_files: Vec::new(),
123+
output_key: None,
124+
},
114125
ModelInfo {
115126
model: EmbeddingModel::BGEBaseENV15,
116127
dim: 768,

src/text_embedding/impl.rs

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -173,6 +173,7 @@ impl TextEmbedding {
173173
EmbeddingModel::ParaphraseMLMiniLML12V2 => Some(Pooling::Mean),
174174
EmbeddingModel::ParaphraseMLMiniLML12V2Q => Some(Pooling::Mean),
175175
EmbeddingModel::ParaphraseMLMpnetBaseV2 => Some(Pooling::Mean),
176+
EmbeddingModel::AllMpnetBaseV2 => Some(Pooling::Mean),
176177

177178
EmbeddingModel::ModernBertEmbedLarge => Some(Pooling::Mean),
178179

tests/embeddings.rs

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -38,6 +38,7 @@ fn verify_embeddings(model: &EmbeddingModel, embeddings: &[Embedding]) -> Result
3838
EmbeddingModel::AllMiniLML12V2Q => [-0.07808663, 0.27919534, -0.0770612, -0.75660324],
3939
EmbeddingModel::AllMiniLML6V2 => [0.59605527, 0.36542925, -0.16450031, -0.40903988],
4040
EmbeddingModel::AllMiniLML6V2Q => [0.5677276, 0.40180072, -0.15454668, -0.4672576],
41+
EmbeddingModel::AllMpnetBaseV2=> [-0.51290065, -0.4844747, -0.53036124, -0.5337459],
4142
EmbeddingModel::BGEBaseENV15 => [-0.51290065, -0.4844747, -0.53036124, -0.5337459],
4243
EmbeddingModel::BGEBaseENV15Q => [-0.5130697, -0.48461288, -0.53067875, -0.5337806],
4344
EmbeddingModel::BGELargeENV15 => [-0.19347441, -0.28394595, -0.1549195, -0.22201893],

0 commit comments

Comments
 (0)