meandyou200175 committed
Commit f465c13 · verified · 1 Parent(s): f5ba522

Add new SentenceTransformer model

Files changed (2):
  1. README.md +81 -80
  2. model.safetensors +1 -1
README.md CHANGED
@@ -4,7 +4,7 @@ tags:
 - sentence-similarity
 - feature-extraction
 - generated_from_trainer
-- dataset_size:9316
+- dataset_size:10356
 - loss:MultipleNegativesRankingLoss
 base_model: intfloat/multilingual-e5-large
 widget:
@@ -76,76 +76,76 @@ model-index:
       type: unknown
     metrics:
     - type: cosine_accuracy@1
-      value: 0.8108108108108109
+      value: 0.9073359073359073
       name: Cosine Accuracy@1
     - type: cosine_accuracy@2
-      value: 0.8957528957528957
+      value: 0.9739382239382239
       name: Cosine Accuracy@2
     - type: cosine_accuracy@5
-      value: 0.9382239382239382
+      value: 0.9942084942084942
       name: Cosine Accuracy@5
     - type: cosine_accuracy@10
-      value: 0.9642857142857143
+      value: 0.999034749034749
       name: Cosine Accuracy@10
     - type: cosine_accuracy@100
-      value: 0.9932432432432432
+      value: 1.0
       name: Cosine Accuracy@100
     - type: cosine_precision@1
-      value: 0.8108108108108109
+      value: 0.9073359073359073
       name: Cosine Precision@1
     - type: cosine_precision@2
-      value: 0.44787644787644787
+      value: 0.48696911196911197
       name: Cosine Precision@2
     - type: cosine_precision@5
-      value: 0.18764478764478765
+      value: 0.19884169884169883
       name: Cosine Precision@5
     - type: cosine_precision@10
-      value: 0.09642857142857143
+      value: 0.0999034749034749
       name: Cosine Precision@10
     - type: cosine_precision@100
-      value: 0.009932432432432433
+      value: 0.010000000000000002
      name: Cosine Precision@100
     - type: cosine_recall@1
-      value: 0.8108108108108109
+      value: 0.9073359073359073
       name: Cosine Recall@1
     - type: cosine_recall@2
-      value: 0.8957528957528957
+      value: 0.9739382239382239
       name: Cosine Recall@2
     - type: cosine_recall@5
-      value: 0.9382239382239382
+      value: 0.9942084942084942
       name: Cosine Recall@5
     - type: cosine_recall@10
-      value: 0.9642857142857143
+      value: 0.999034749034749
       name: Cosine Recall@10
     - type: cosine_recall@100
-      value: 0.9932432432432432
+      value: 1.0
       name: Cosine Recall@100
     - type: cosine_ndcg@10
-      value: 0.8923095558988695
+      value: 0.9601842774877813
       name: Cosine Ndcg@10
     - type: cosine_mrr@1
-      value: 0.8108108108108109
+      value: 0.9073359073359073
       name: Cosine Mrr@1
     - type: cosine_mrr@2
-      value: 0.8532818532818532
+      value: 0.9406370656370656
       name: Cosine Mrr@2
     - type: cosine_mrr@5
-      value: 0.8649292149292154
+      value: 0.9462837837837839
       name: Cosine Mrr@5
     - type: cosine_mrr@10
-      value: 0.8687695348409635
+      value: 0.946988570202856
       name: Cosine Mrr@10
     - type: cosine_mrr@100
-      value: 0.8700193430588538
+      value: 0.9470763202906061
       name: Cosine Mrr@100
     - type: cosine_map@100
-      value: 0.8700193430588539
+      value: 0.9470763202906061
       name: Cosine Map@100
 ---
 
 # SentenceTransformer based on intfloat/multilingual-e5-large
 
-This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large) on the [word_embedding](https://huggingface.co/datasets/meandyou200175/word_embedding) dataset. It maps sentences & paragraphs to a 1024-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
+This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large). It maps sentences & paragraphs to a 1024-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
 
 ## Model Details
 
@@ -155,8 +155,7 @@ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [i
 - **Maximum Sequence Length:** 512 tokens
 - **Output Dimensionality:** 1024 dimensions
 - **Similarity Function:** Cosine Similarity
-- **Training Dataset:**
-    - [word_embedding](https://huggingface.co/datasets/meandyou200175/word_embedding)
+<!-- - **Training Dataset:** Unknown -->
 <!-- - **Language:** Unknown -->
 <!-- - **License:** Unknown -->
 
@@ -242,28 +241,28 @@ You can finetune this model on your own dataset.
 
 | Metric               | Value      |
 |:---------------------|:-----------|
-| cosine_accuracy@1    | 0.8108     |
-| cosine_accuracy@2    | 0.8958     |
-| cosine_accuracy@5    | 0.9382     |
-| cosine_accuracy@10   | 0.9643     |
-| cosine_accuracy@100  | 0.9932     |
-| cosine_precision@1   | 0.8108     |
-| cosine_precision@2   | 0.4479     |
-| cosine_precision@5   | 0.1876     |
-| cosine_precision@10  | 0.0964     |
-| cosine_precision@100 | 0.0099     |
-| cosine_recall@1      | 0.8108     |
-| cosine_recall@2      | 0.8958     |
-| cosine_recall@5      | 0.9382     |
-| cosine_recall@10     | 0.9643     |
-| cosine_recall@100    | 0.9932     |
-| **cosine_ndcg@10**   | **0.8923** |
-| cosine_mrr@1         | 0.8108     |
-| cosine_mrr@2         | 0.8533     |
-| cosine_mrr@5         | 0.8649     |
-| cosine_mrr@10        | 0.8688     |
-| cosine_mrr@100       | 0.87       |
-| cosine_map@100       | 0.87       |
+| cosine_accuracy@1    | 0.9073     |
+| cosine_accuracy@2    | 0.9739     |
+| cosine_accuracy@5    | 0.9942     |
+| cosine_accuracy@10   | 0.999      |
+| cosine_accuracy@100  | 1.0        |
+| cosine_precision@1   | 0.9073     |
+| cosine_precision@2   | 0.487      |
+| cosine_precision@5   | 0.1988     |
+| cosine_precision@10  | 0.0999     |
+| cosine_precision@100 | 0.01       |
+| cosine_recall@1      | 0.9073     |
+| cosine_recall@2      | 0.9739     |
+| cosine_recall@5      | 0.9942     |
+| cosine_recall@10     | 0.999      |
+| cosine_recall@100    | 1.0        |
+| **cosine_ndcg@10**   | **0.9602** |
+| cosine_mrr@1         | 0.9073     |
+| cosine_mrr@2         | 0.9406     |
+| cosine_mrr@5         | 0.9463     |
+| cosine_mrr@10        | 0.947      |
+| cosine_mrr@100       | 0.9471     |
+| cosine_map@100       | 0.9471     |
 
 <!--
 ## Bias, Risks and Limitations
@@ -281,10 +280,9 @@ You can finetune this model on your own dataset.
 
 ### Training Dataset
 
-#### word_embedding
+#### Unnamed Dataset
 
-* Dataset: [word_embedding](https://huggingface.co/datasets/meandyou200175/word_embedding) at [af76b11](https://huggingface.co/datasets/meandyou200175/word_embedding/tree/af76b11c1d93542ca76e864a60b1744d5e02b099)
-* Size: 9,316 training samples
+* Size: 10,356 training samples
 * Columns: <code>query</code> and <code>positive</code>
 * Approximate statistics based on the first 1000 samples:
 | | query | positive |
@@ -467,35 +465,38 @@ You can finetune this model on your own dataset.
 | Epoch  | Step | Training Loss | Validation Loss | cosine_ndcg@10 |
 |:------:|:----:|:-------------:|:---------------:|:--------------:|
 | -1     | -1   | -             | -               | 0.7166         |
-| 0.1715 | 100  | 0.8892        | -               | -              |
-| 0.3431 | 200  | 0.1724        | -               | -              |
-| 0.5146 | 300  | 0.1783        | -               | -              |
-| 0.6861 | 400  | 0.1393        | -               | -              |
-| 0.8576 | 500  | 0.1262        | -               | -              |
-| 1.0292 | 600  | 0.1046        | -               | -              |
-| 1.2007 | 700  | 0.0639        | -               | -              |
-| 1.3722 | 800  | 0.0692        | -               | -              |
-| 1.5437 | 900  | 0.043         | -               | -              |
-| 1.7153 | 1000 | 0.0614        | 0.0819          | 0.8774         |
-| 1.8868 | 1100 | 0.0538        | -               | -              |
-| 2.0583 | 1200 | 0.0414        | -               | -              |
-| 2.2298 | 1300 | 0.0146        | -               | -              |
-| 2.4014 | 1400 | 0.0164        | -               | -              |
-| 2.5729 | 1500 | 0.0225        | -               | -              |
-| 2.7444 | 1600 | 0.0215        | -               | -              |
-| 2.9160 | 1700 | 0.0271        | -               | -              |
-| 3.0875 | 1800 | 0.0202        | -               | -              |
-| 3.2590 | 1900 | 0.0194        | -               | -              |
-| 3.4305 | 2000 | 0.0144        | 0.0682          | 0.8923         |
-| 3.6021 | 2100 | 0.0118        | -               | -              |
-| 3.7736 | 2200 | 0.0155        | -               | -              |
-| 3.9451 | 2300 | 0.0177        | -               | -              |
-| 4.1166 | 2400 | 0.0059        | -               | -              |
-| 4.2882 | 2500 | 0.0099        | -               | -              |
-| 4.4597 | 2600 | 0.0056        | -               | -              |
-| 4.6312 | 2700 | 0.0153        | -               | -              |
-| 4.8027 | 2800 | 0.0069        | -               | -              |
-| 4.9743 | 2900 | 0.01          | -               | -              |
+| 0.1543 | 100  | 0.9191        | -               | -              |
+| 0.3086 | 200  | 0.1876        | -               | -              |
+| 0.4630 | 300  | 0.1547        | -               | -              |
+| 0.6173 | 400  | 0.1556        | -               | -              |
+| 0.7716 | 500  | 0.179         | -               | -              |
+| 0.9259 | 600  | 0.1234        | -               | -              |
+| 1.0802 | 700  | 0.087         | -               | -              |
+| 1.2346 | 800  | 0.0576        | -               | -              |
+| 1.3889 | 900  | 0.0564        | -               | -              |
+| 1.5432 | 1000 | 0.0583        | 0.0271          | 0.9198         |
+| 1.6975 | 1100 | 0.0764        | -               | -              |
+| 1.8519 | 1200 | 0.0493        | -               | -              |
+| 2.0062 | 1300 | 0.0481        | -               | -              |
+| 2.1605 | 1400 | 0.0222        | -               | -              |
+| 2.3148 | 1500 | 0.0234        | -               | -              |
+| 2.4691 | 1600 | 0.0283        | -               | -              |
+| 2.6235 | 1700 | 0.0236        | -               | -              |
+| 2.7778 | 1800 | 0.026         | -               | -              |
+| 2.9321 | 1900 | 0.0217        | -               | -              |
+| 3.0864 | 2000 | 0.0193        | 0.0061          | 0.9534         |
+| 3.2407 | 2100 | 0.0135        | -               | -              |
+| 3.3951 | 2200 | 0.0162        | -               | -              |
+| 3.5494 | 2300 | 0.0109        | -               | -              |
+| 3.7037 | 2400 | 0.0107        | -               | -              |
+| 3.8580 | 2500 | 0.0105        | -               | -              |
+| 4.0123 | 2600 | 0.0095        | -               | -              |
+| 4.1667 | 2700 | 0.0146        | -               | -              |
+| 4.3210 | 2800 | 0.0102        | -               | -              |
+| 4.4753 | 2900 | 0.0108        | -               | -              |
+| 4.6296 | 3000 | 0.01          | 0.0061          | 0.9602         |
+| 4.7840 | 3100 | 0.008         | -               | -              |
+| 4.9383 | 3200 | 0.0117        | -               | -              |
 
 
 ### Framework Versions
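A note on the evaluation numbers in this diff: in both the old and the new card, `cosine_recall@k` always equals `cosine_accuracy@k` and `cosine_precision@k` equals `cosine_accuracy@k / k` (e.g. precision@100 is exactly 0.01 when recall@100 is 1.0), which is the signature of an evaluation where each query has exactly one relevant document. A minimal sketch (not from the card; `retrieval_metrics` is a hypothetical helper) of how those metrics reduce in that case, given the 1-based rank of each query's single relevant document:

```python
import math

def retrieval_metrics(ranks, k):
    """Retrieval metrics when each query has exactly one relevant document.

    ranks: 1-based rank of the relevant document for each query.
    Returns (accuracy@k, precision@k, recall@k, mrr@k, ndcg@k).
    """
    n = len(ranks)
    hits = sum(1 for r in ranks if r <= k)
    accuracy = hits / n            # fraction of queries with the doc in the top k
    precision = hits / (n * k)     # one relevant doc -> accuracy@k / k
    recall = hits / n              # one relevant doc -> equals accuracy@k
    mrr = sum(1 / r for r in ranks if r <= k) / n
    # Single relevant doc: DCG is 1/log2(rank+1) and the ideal DCG is 1
    ndcg = sum(1 / math.log2(r + 1) for r in ranks if r <= k) / n
    return accuracy, precision, recall, mrr, ndcg

acc, prec, rec, mrr, ndcg = retrieval_metrics([1, 1, 2, 3, 11], k=10)
```

With this structure, improving accuracy@k (as this commit does, e.g. 0.8108 → 0.9073 at k=1) mechanically lifts precision@k and recall@k by the same factor.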
model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:24854dafae65ef24432ea85eb056628daff94e85bcb8d60730361305c68126c1
+oid sha256:8a156fd71ddd697aac4e8c39e7714f28d7852c7d782f6b21c821d0f433937f07
 size 2239607176
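The `loss:MultipleNegativesRankingLoss` tag in the README refers to in-batch-negatives contrastive training: each (query, positive) pair in a batch treats every other pair's positive as a negative, and a cross-entropy loss is taken over scaled cosine similarities. A minimal NumPy sketch of that objective (an illustration of the idea, not the sentence-transformers implementation; the default scale of 20 is an assumption):

```python
import numpy as np

def multiple_negatives_ranking_loss(query_emb, positive_emb, scale=20.0):
    """In-batch-negatives ranking loss over cosine similarities.

    Row i of query_emb is paired with row i of positive_emb; all other
    rows of positive_emb serve as negatives for query i.
    """
    # L2-normalize so dot products are cosine similarities
    q = query_emb / np.linalg.norm(query_emb, axis=1, keepdims=True)
    p = positive_emb / np.linalg.norm(positive_emb, axis=1, keepdims=True)
    scores = scale * (q @ p.T)                   # (batch, batch) similarity matrix
    # Softmax cross-entropy with target class i for row i
    scores -= scores.max(axis=1, keepdims=True)  # numerical stability
    log_probs = scores - np.log(np.exp(scores).sum(axis=1, keepdims=True))
    idx = np.arange(len(q))
    return -log_probs[idx, idx].mean()
```

The loss is near zero when each query embedding matches its own positive and is dissimilar to the others, which is the regime the training-loss column above converges toward (≈0.01 by epoch 5).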