skfrost19
/

reranker-ModernBERT-base-msmarco-bce-Lion.Cosine-ep-1-3

@@ -27,13 +27,13 @@ model-index:
       type: NanoMSMARCO_R100
     metrics:
     - type: map
-      value: 0.6322
       name: Map
     - type: mrr@10
-      value: 0.6257
       name: Mrr@10
     - type: ndcg@10
-      value: 0.6902
       name: Ndcg@10
   - task:
       type: cross-encoder-reranking
@@ -43,13 +43,13 @@ model-index:
       type: NanoNFCorpus_R100
     metrics:
     - type: map
-      value: 0.3433
       name: Map
     - type: mrr@10
-      value: 0.5436
       name: Mrr@10
     - type: ndcg@10
-      value: 0.3796
       name: Ndcg@10
   - task:
       type: cross-encoder-reranking
@@ -59,13 +59,13 @@ model-index:
       type: NanoNQ_R100
     metrics:
     - type: map
-      value: 0.6859
       name: Map
     - type: mrr@10
-      value: 0.7007
       name: Mrr@10
     - type: ndcg@10
-      value: 0.7323
       name: Ndcg@10
   - task:
       type: cross-encoder-nano-beir
@@ -75,13 +75,13 @@ model-index:
       type: NanoBEIR_R100_mean
     metrics:
     - type: map
-      value: 0.5538
       name: Map
     - type: mrr@10
-      value: 0.6233
       name: Mrr@10
     - type: ndcg@10
-      value: 0.6007
       name: Ndcg@10
 ---
@@ -191,9 +191,9 @@ You can finetune this model on your own dataset.
 | Metric      | NanoMSMARCO_R100     | NanoNFCorpus_R100    | NanoNQ_R100          |
 |:------------|:---------------------|:---------------------|:---------------------|
-| map         | 0.6322 (+0.1426)     | 0.3433 (+0.0823)     | 0.6859 (+0.2663)     |
-| mrr@10      | 0.6257 (+0.1482)     | 0.5436 (+0.0437)     | 0.7007 (+0.2740)     |
-| **ndcg@10** | **0.6902 (+0.1498)** | **0.3796 (+0.0546)** | **0.7323 (+0.2316)** |
 #### Cross Encoder Nano BEIR
@@ -214,9 +214,9 @@ You can finetune this model on your own dataset.
 | Metric      | Value                |
 |:------------|:---------------------|
-| map         | 0.5538 (+0.1637)     |
-| mrr@10      | 0.6233 (+0.1553)     |
-| **ndcg@10** | **0.6007 (+0.1453)** |
 <!--
 ## Bias, Risks and Limitations
@@ -421,23 +421,21 @@ You can finetune this model on your own dataset.
 </details>
 ### Training Logs
-| Epoch   | Step      | Training Loss | Validation Loss | NanoMSMARCO_R100_ndcg@10 | NanoNFCorpus_R100_ndcg@10 | NanoNQ_R100_ndcg@10  | NanoBEIR_R100_mean_ndcg@10 |
-|:-------:|:---------:|:-------------:|:---------------:|:------------------------:|:-------------------------:|:--------------------:|:--------------------------:|
-| -1      | -1        | -             | -               | 0.0186 (-0.5218)         | 0.2940 (-0.0310)          | 0.0428 (-0.4579)     | 0.1185 (-0.3369)           |
-| 0.0001  | 1         | 0.7403        | -               | -                        | -                         | -                    | -                          |
-| 0.3860  | 4000      | 0.2255        | -               | -                        | -                         | -                    | -                          |
-| 0.7719  | 8000      | 0.153         | -               | -                        | -                         | -                    | -                          |
-| **1.0** | **10364** | **-**         | **0.1429**      | **0.6902 (+0.1498)**     | **0.3796 (+0.0546)**      | **0.7323 (+0.2316)** | **0.6007 (+0.1453)**       |
-| 1.1579  | 12000     | 0.1356        | -               | -                        | -                         | -                    | -                          |
-| 1.5438  | 16000     | 0.122         | -               | -                        | -                         | -                    | -                          |
-| 1.9298  | 20000     | 0.1158        | -               | -                        | -                         | -                    | -                          |
-| 2.0     | 20728     | -             | 0.1267          | 0.6900 (+0.1495)         | 0.3621 (+0.0370)          | 0.7013 (+0.2007)     | 0.5844 (+0.1291)           |
-| 2.3157  | 24000     | 0.0993        | -               | -                        | -                         | -                    | -                          |
-| 2.7017  | 28000     | 0.0945        | -               | -                        | -                         | -                    | -                          |
-| 3.0     | 31092     | -             | 0.1184          | 0.6916 (+0.1512)         | 0.3806 (+0.0556)          | 0.7025 (+0.2018)     | 0.5916 (+0.1362)           |
-| -1      | -1        | -             | -               | 0.6902 (+0.1498)         | 0.3796 (+0.0546)          | 0.7323 (+0.2316)     | 0.6007 (+0.1453)           |
-* The bold row denotes the saved checkpoint.
 ### Framework Versions
 - Python: 3.11.5

       type: NanoMSMARCO_R100
     metrics:
     - type: map
+      value: 0.6266
       name: Map
     - type: mrr@10
+      value: 0.622
       name: Mrr@10
     - type: ndcg@10
+      value: 0.6916
       name: Ndcg@10
   - task:
       type: cross-encoder-reranking
       type: NanoNFCorpus_R100
     metrics:
     - type: map
+      value: 0.3574
       name: Map
     - type: mrr@10
+      value: 0.5321
       name: Mrr@10
     - type: ndcg@10
+      value: 0.3806
       name: Ndcg@10
   - task:
       type: cross-encoder-reranking
       type: NanoNQ_R100
     metrics:
     - type: map
+      value: 0.6437
       name: Map
     - type: mrr@10
+      value: 0.6663
       name: Mrr@10
     - type: ndcg@10
+      value: 0.7025
       name: Ndcg@10
   - task:
       type: cross-encoder-nano-beir
       type: NanoBEIR_R100_mean
     metrics:
     - type: map
+      value: 0.5426
       name: Map
     - type: mrr@10
+      value: 0.6068
       name: Mrr@10
     - type: ndcg@10
+      value: 0.5916
       name: Ndcg@10
 ---
 | Metric      | NanoMSMARCO_R100     | NanoNFCorpus_R100    | NanoNQ_R100          |
 |:------------|:---------------------|:---------------------|:---------------------|
+| map         | 0.6266 (+0.1371)     | 0.3574 (+0.0964)     | 0.6437 (+0.2241)     |
+| mrr@10      | 0.6220 (+0.1445)     | 0.5321 (+0.0322)     | 0.6663 (+0.2396)     |
+| **ndcg@10** | **0.6916 (+0.1512)** | **0.3806 (+0.0556)** | **0.7025 (+0.2018)** |
 #### Cross Encoder Nano BEIR
 | Metric      | Value                |
 |:------------|:---------------------|
+| map         | 0.5426 (+0.1525)     |
+| mrr@10      | 0.6068 (+0.1388)     |
+| **ndcg@10** | **0.5916 (+0.1362)** |
 <!--
 ## Bias, Risks and Limitations
 </details>
 ### Training Logs
+| Epoch  | Step  | Training Loss | Validation Loss | NanoMSMARCO_R100_ndcg@10 | NanoNFCorpus_R100_ndcg@10 | NanoNQ_R100_ndcg@10 | NanoBEIR_R100_mean_ndcg@10 |
+|:------:|:-----:|:-------------:|:---------------:|:------------------------:|:-------------------------:|:-------------------:|:--------------------------:|
+| -1     | -1    | -             | -               | 0.0186 (-0.5218)         | 0.2940 (-0.0310)          | 0.0428 (-0.4579)    | 0.1185 (-0.3369)           |
+| 0.0001 | 1     | 0.7403        | -               | -                        | -                         | -                   | -                          |
+| 0.3860 | 4000  | 0.2255        | -               | -                        | -                         | -                   | -                          |
+| 0.7719 | 8000  | 0.153         | -               | -                        | -                         | -                   | -                          |
+| 1.0    | 10364 | -             | 0.1429          | 0.6902 (+0.1498)         | 0.3796 (+0.0546)          | 0.7323 (+0.2316)    | 0.6007 (+0.1453)           |
+| 1.1579 | 12000 | 0.1356        | -               | -                        | -                         | -                   | -                          |
+| 1.5438 | 16000 | 0.122         | -               | -                        | -                         | -                   | -                          |
+| 1.9298 | 20000 | 0.1158        | -               | -                        | -                         | -                   | -                          |
+| 2.0    | 20728 | -             | 0.1267          | 0.6900 (+0.1495)         | 0.3621 (+0.0370)          | 0.7013 (+0.2007)    | 0.5844 (+0.1291)           |
+| 2.3157 | 24000 | 0.0993        | -               | -                        | -                         | -                   | -                          |
+| 2.7017 | 28000 | 0.0945        | -               | -                        | -                         | -                   | -                          |
+| 3.0    | 31092 | -             | 0.1184          | 0.6916 (+0.1512)         | 0.3806 (+0.0556)          | 0.7025 (+0.2018)    | 0.5916 (+0.1362)           |
 ### Framework Versions
 - Python: 3.11.5

config.json CHANGED Viewed

@@ -41,16 +41,15 @@
   "num_hidden_layers": 22,
   "pad_token_id": 50283,
   "position_embedding_type": "absolute",
-  "reference_compile": true,
   "repad_logits_with_grad": false,
   "sentence_transformers": {
     "activation_fn": "torch.nn.modules.activation.Sigmoid",
-    "version": "4.0.1"
   },
   "sep_token_id": 50282,
   "sparse_pred_ignore_index": -100,
   "sparse_prediction": false,
   "torch_dtype": "float32",
-  "transformers_version": "4.50.3",
   "vocab_size": 50368
 }

   "num_hidden_layers": 22,
   "pad_token_id": 50283,
   "position_embedding_type": "absolute",
   "repad_logits_with_grad": false,
   "sentence_transformers": {
     "activation_fn": "torch.nn.modules.activation.Sigmoid",
+    "version": "4.0.2"
   },
   "sep_token_id": 50282,
   "sparse_pred_ignore_index": -100,
   "sparse_prediction": false,
   "torch_dtype": "float32",
+  "transformers_version": "4.51.0",
   "vocab_size": 50368
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f4cffca4b22f3dee1801eedc43b6390a7148e160d29c1bb412fceae36fef7f27
 size 598436708

 version https://git-lfs.github.com/spec/v1
+oid sha256:fb68e7aaba743a9bafcf7fd76ee9097328acc5e550b2c18209b302ecb6ef5c8c
 size 598436708

tokenizer_config.json CHANGED Viewed

@@ -933,13 +933,20 @@
   "cls_token": "[CLS]",
   "extra_special_tokens": {},
   "mask_token": "[MASK]",
   "model_input_names": [
     "input_ids",
     "attention_mask"
   ],
   "model_max_length": 8192,
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
   "tokenizer_class": "PreTrainedTokenizer",
   "unk_token": "[UNK]"
 }

   "cls_token": "[CLS]",
   "extra_special_tokens": {},
   "mask_token": "[MASK]",
+  "max_length": 8192,
   "model_input_names": [
     "input_ids",
     "attention_mask"
   ],
   "model_max_length": 8192,
+  "pad_to_multiple_of": null,
   "pad_token": "[PAD]",
+  "pad_token_type_id": 0,
+  "padding_side": "right",
   "sep_token": "[SEP]",
+  "stride": 0,
   "tokenizer_class": "PreTrainedTokenizer",
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first",
   "unk_token": "[UNK]"
 }