Add new SentenceTransformer model
#1
by
zpn
- opened
- README.md +6 -6
- config.json +2 -2
- model.safetensors +1 -1
README.md
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
---
|
2 |
-
base_model: nomic-ai/nomic-embed-text-v2-moe
|
3 |
library_name: sentence-transformers
|
4 |
pipeline_tag: sentence-similarity
|
5 |
tags:
|
@@ -8,15 +8,15 @@ tags:
|
|
8 |
- feature-extraction
|
9 |
---
|
10 |
|
11 |
-
# SentenceTransformer based on nomic-ai/nomic-embed-text-v2-moe
|
12 |
|
13 |
-
This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [nomic-ai/nomic-embed-text-v2-moe](https://huggingface.co/nomic-ai/nomic-embed-text-v2-moe). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
14 |
|
15 |
## Model Details
|
16 |
|
17 |
### Model Description
|
18 |
- **Model Type:** Sentence Transformer
|
19 |
-
- **Base model:** [nomic-ai/nomic-embed-text-v2-moe](https://huggingface.co/nomic-ai/nomic-embed-text-v2-moe) <!-- at revision (hash truncated in extraction) -->
|
20 |
- **Maximum Sequence Length:** 512 tokens
|
21 |
- **Output Dimensionality:** 768 dimensions
|
22 |
- **Similarity Function:** Cosine Similarity
|
@@ -115,8 +115,8 @@ You can finetune this model on your own dataset.
|
|
115 |
- Sentence Transformers: 3.3.0
|
116 |
- Transformers: 4.44.2
|
117 |
- PyTorch: 2.4.1+cu121
|
118 |
-
- Accelerate: 1.
|
119 |
-
- Datasets: 2.
|
120 |
- Tokenizers: 0.19.1
|
121 |
|
122 |
## Citation
|
|
|
1 |
---
|
2 |
+
base_model: nomic-ai/nomic-embed-text-v2-moe-unsupervised
|
3 |
library_name: sentence-transformers
|
4 |
pipeline_tag: sentence-similarity
|
5 |
tags:
|
|
|
8 |
- feature-extraction
|
9 |
---
|
10 |
|
11 |
+
# SentenceTransformer based on nomic-ai/nomic-embed-text-v2-moe-unsupervised
|
12 |
|
13 |
+
This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [nomic-ai/nomic-embed-text-v2-moe-unsupervised](https://huggingface.co/nomic-ai/nomic-embed-text-v2-moe-unsupervised). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
14 |
|
15 |
## Model Details
|
16 |
|
17 |
### Model Description
|
18 |
- **Model Type:** Sentence Transformer
|
19 |
+
- **Base model:** [nomic-ai/nomic-embed-text-v2-moe-unsupervised](https://huggingface.co/nomic-ai/nomic-embed-text-v2-moe-unsupervised) <!-- at revision e48a32f5906ed18933f85467e57c1dcc02ef401b -->
|
20 |
- **Maximum Sequence Length:** 512 tokens
|
21 |
- **Output Dimensionality:** 768 dimensions
|
22 |
- **Similarity Function:** Cosine Similarity
|
|
|
115 |
- Sentence Transformers: 3.3.0
|
116 |
- Transformers: 4.44.2
|
117 |
- PyTorch: 2.4.1+cu121
|
118 |
+
- Accelerate: 1.2.1
|
119 |
+
- Datasets: 3.2.0
|
120 |
- Tokenizers: 0.19.1
|
121 |
|
122 |
## Citation
|
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "nomic-ai/nomic-
|
3 |
"activation_function": "gelu",
|
4 |
"add_pooling_layer": false,
|
5 |
"architectures": [
|
@@ -55,7 +55,7 @@
|
|
55 |
"rotary_emb_interleaved": false,
|
56 |
"rotary_emb_scale_base": null,
|
57 |
"rotary_scaling_factor": null,
|
58 |
-
"router_aux_loss_coef": 0
|
59 |
"scale_attn_by_inverse_layer_idx": false,
|
60 |
"scale_attn_weights": true,
|
61 |
"summary_activation": null,
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "nomic-ai/nomic-embed-text-v2-moe-unsupervised",
|
3 |
"activation_function": "gelu",
|
4 |
"add_pooling_layer": false,
|
5 |
"architectures": [
|
|
|
55 |
"rotary_emb_interleaved": false,
|
56 |
"rotary_emb_scale_base": null,
|
57 |
"rotary_scaling_factor": null,
|
58 |
+
"router_aux_loss_coef": 1.0,
|
59 |
"scale_attn_by_inverse_layer_idx": false,
|
60 |
"scale_attn_weights": true,
|
61 |
"summary_activation": null,
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1901187232
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d28e71c4128b432588d35ff44b2ad70839cf0c639a8096d2f44cef5018b655ee
|
3 |
size 1901187232
|