Add new SentenceTransformer model

#1
by zpn - opened
Files changed (3) hide show
  1. README.md +6 -6
  2. config.json +2 -2
  3. model.safetensors +1 -1
README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- base_model: nomic-ai/nomic-embed-text-v2-moe
3
  library_name: sentence-transformers
4
  pipeline_tag: sentence-similarity
5
  tags:
@@ -8,15 +8,15 @@ tags:
8
  - feature-extraction
9
  ---
10
 
11
- # SentenceTransformer based on nomic-ai/nomic-embed-text-v2-moe
12
 
13
- This is a [sentence-transformers](https://www.sbert.net) model fine-tuned from [nomic-ai/nomic-embed-text-v2-moe](https://huggingface.co/nomic-ai/nomic-embed-text-v2-moe). It maps sentences and paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
14
 
15
  ## Model Details
16
 
17
  ### Model Description
18
  - **Model Type:** Sentence Transformer
19
- - **Base model:** [nomic-ai/nomic-embed-text-v2-moe](https://huggingface.co/nomic-ai/nomic-embed-text-v2-moe) <!-- at revision 8e109938f32da90ed146077b419bedd5cc6590b7 -->
20
  - **Maximum Sequence Length:** 512 tokens
21
  - **Output Dimensionality:** 768 dimensions
22
  - **Similarity Function:** Cosine Similarity
@@ -115,8 +115,8 @@ You can finetune this model on your own dataset.
115
  - Sentence Transformers: 3.3.0
116
  - Transformers: 4.44.2
117
  - PyTorch: 2.4.1+cu121
118
- - Accelerate: 1.0.0
119
- - Datasets: 2.19.0
120
  - Tokenizers: 0.19.1
121
 
122
  ## Citation
 
1
  ---
2
+ base_model: nomic-ai/nomic-embed-text-v2-moe-unsupervised
3
  library_name: sentence-transformers
4
  pipeline_tag: sentence-similarity
5
  tags:
 
8
  - feature-extraction
9
  ---
10
 
11
+ # SentenceTransformer based on nomic-ai/nomic-embed-text-v2-moe-unsupervised
12
 
13
+ This is a [sentence-transformers](https://www.sbert.net) model fine-tuned from [nomic-ai/nomic-embed-text-v2-moe-unsupervised](https://huggingface.co/nomic-ai/nomic-embed-text-v2-moe-unsupervised). It maps sentences and paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
14
 
15
  ## Model Details
16
 
17
  ### Model Description
18
  - **Model Type:** Sentence Transformer
19
+ - **Base model:** [nomic-ai/nomic-embed-text-v2-moe-unsupervised](https://huggingface.co/nomic-ai/nomic-embed-text-v2-moe-unsupervised) <!-- at revision e48a32f5906ed18933f85467e57c1dcc02ef401b -->
20
  - **Maximum Sequence Length:** 512 tokens
21
  - **Output Dimensionality:** 768 dimensions
22
  - **Similarity Function:** Cosine Similarity
 
115
  - Sentence Transformers: 3.3.0
116
  - Transformers: 4.44.2
117
  - PyTorch: 2.4.1+cu121
118
+ - Accelerate: 1.2.1
119
+ - Datasets: 3.2.0
120
  - Tokenizers: 0.19.1
121
 
122
  ## Citation
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "nomic-ai/nomic-xlm-2048",
3
  "activation_function": "gelu",
4
  "add_pooling_layer": false,
5
  "architectures": [
@@ -55,7 +55,7 @@
55
  "rotary_emb_interleaved": false,
56
  "rotary_emb_scale_base": null,
57
  "rotary_scaling_factor": null,
58
- "router_aux_loss_coef": 0.1,
59
  "scale_attn_by_inverse_layer_idx": false,
60
  "scale_attn_weights": true,
61
  "summary_activation": null,
 
1
  {
2
+ "_name_or_path": "nomic-ai/nomic-embed-text-v2-moe-unsupervised",
3
  "activation_function": "gelu",
4
  "add_pooling_layer": false,
5
  "architectures": [
 
55
  "rotary_emb_interleaved": false,
56
  "rotary_emb_scale_base": null,
57
  "rotary_scaling_factor": null,
58
+ "router_aux_loss_coef": 1.0,
59
  "scale_attn_by_inverse_layer_idx": false,
60
  "scale_attn_weights": true,
61
  "summary_activation": null,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:097012b27af76d80af74fed4bc2ccc9091245286f776adf03ad1758a24ade9a0
3
  size 1901187232
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d28e71c4128b432588d35ff44b2ad70839cf0c639a8096d2f44cef5018b655ee
3
  size 1901187232