Update model with fully trained weights from checkpoint-31092
Browse files
- README.md +33 -35
- config.json +2 -3
- model.safetensors +1 -1
- tokenizer_config.json +7 -0
README.md
CHANGED
@@ -27,13 +27,13 @@ model-index:
|
|
27 |
type: NanoMSMARCO_R100
|
28 |
metrics:
|
29 |
- type: map
|
30 |
-
value: 0.
|
31 |
name: Map
|
32 |
- type: mrr@10
|
33 |
-
value: 0.
|
34 |
name: Mrr@10
|
35 |
- type: ndcg@10
|
36 |
-
value: 0.
|
37 |
name: Ndcg@10
|
38 |
- task:
|
39 |
type: cross-encoder-reranking
|
@@ -43,13 +43,13 @@ model-index:
|
|
43 |
type: NanoNFCorpus_R100
|
44 |
metrics:
|
45 |
- type: map
|
46 |
-
value: 0.
|
47 |
name: Map
|
48 |
- type: mrr@10
|
49 |
-
value: 0.
|
50 |
name: Mrr@10
|
51 |
- type: ndcg@10
|
52 |
-
value: 0.
|
53 |
name: Ndcg@10
|
54 |
- task:
|
55 |
type: cross-encoder-reranking
|
@@ -59,13 +59,13 @@ model-index:
|
|
59 |
type: NanoNQ_R100
|
60 |
metrics:
|
61 |
- type: map
|
62 |
-
value: 0.
|
63 |
name: Map
|
64 |
- type: mrr@10
|
65 |
-
value: 0.
|
66 |
name: Mrr@10
|
67 |
- type: ndcg@10
|
68 |
-
value: 0.
|
69 |
name: Ndcg@10
|
70 |
- task:
|
71 |
type: cross-encoder-nano-beir
|
@@ -75,13 +75,13 @@ model-index:
|
|
75 |
type: NanoBEIR_R100_mean
|
76 |
metrics:
|
77 |
- type: map
|
78 |
-
value: 0.
|
79 |
name: Map
|
80 |
- type: mrr@10
|
81 |
-
value: 0.
|
82 |
name: Mrr@10
|
83 |
- type: ndcg@10
|
84 |
-
value: 0.
|
85 |
name: Ndcg@10
|
86 |
---
|
87 |
|
@@ -191,9 +191,9 @@ You can finetune this model on your own dataset.
|
|
191 |
|
192 |
| Metric | NanoMSMARCO_R100 | NanoNFCorpus_R100 | NanoNQ_R100 |
|
193 |
|:------------|:---------------------|:---------------------|:---------------------|
|
194 |
-
| map | 0.
|
195 |
-
| mrr@10 | 0.
|
196 |
-
| **ndcg@10** | **0.
|
197 |
|
198 |
#### Cross Encoder Nano BEIR
|
199 |
|
@@ -214,9 +214,9 @@ You can finetune this model on your own dataset.
|
|
214 |
|
215 |
| Metric | Value |
|
216 |
|:------------|:---------------------|
|
217 |
-
| map | 0.
|
218 |
-
| mrr@10 | 0.
|
219 |
-
| **ndcg@10** | **0.
|
220 |
|
221 |
<!--
|
222 |
## Bias, Risks and Limitations
|
@@ -421,23 +421,21 @@ You can finetune this model on your own dataset.
|
|
421 |
</details>
|
422 |
|
423 |
### Training Logs
|
424 |
-
| Epoch
|
425 |
-
|
426 |
-
| -1
|
427 |
-
| 0.0001
|
428 |
-
| 0.3860
|
429 |
-
| 0.7719
|
430 |
-
|
|
431 |
-
| 1.1579
|
432 |
-
| 1.5438
|
433 |
-
| 1.9298
|
434 |
-
| 2.0
|
435 |
-
| 2.3157
|
436 |
-
| 2.7017
|
437 |
-
| 3.0
|
438 |
-
|
439 |
-
|
440 |
-
* The bold row denotes the saved checkpoint.
|
441 |
|
442 |
### Framework Versions
|
443 |
- Python: 3.11.5
|
|
|
27 |
type: NanoMSMARCO_R100
|
28 |
metrics:
|
29 |
- type: map
|
30 |
+
value: 0.6266
|
31 |
name: Map
|
32 |
- type: mrr@10
|
33 |
+
value: 0.622
|
34 |
name: Mrr@10
|
35 |
- type: ndcg@10
|
36 |
+
value: 0.6916
|
37 |
name: Ndcg@10
|
38 |
- task:
|
39 |
type: cross-encoder-reranking
|
|
|
43 |
type: NanoNFCorpus_R100
|
44 |
metrics:
|
45 |
- type: map
|
46 |
+
value: 0.3574
|
47 |
name: Map
|
48 |
- type: mrr@10
|
49 |
+
value: 0.5321
|
50 |
name: Mrr@10
|
51 |
- type: ndcg@10
|
52 |
+
value: 0.3806
|
53 |
name: Ndcg@10
|
54 |
- task:
|
55 |
type: cross-encoder-reranking
|
|
|
59 |
type: NanoNQ_R100
|
60 |
metrics:
|
61 |
- type: map
|
62 |
+
value: 0.6437
|
63 |
name: Map
|
64 |
- type: mrr@10
|
65 |
+
value: 0.6663
|
66 |
name: Mrr@10
|
67 |
- type: ndcg@10
|
68 |
+
value: 0.7025
|
69 |
name: Ndcg@10
|
70 |
- task:
|
71 |
type: cross-encoder-nano-beir
|
|
|
75 |
type: NanoBEIR_R100_mean
|
76 |
metrics:
|
77 |
- type: map
|
78 |
+
value: 0.5426
|
79 |
name: Map
|
80 |
- type: mrr@10
|
81 |
+
value: 0.6068
|
82 |
name: Mrr@10
|
83 |
- type: ndcg@10
|
84 |
+
value: 0.5916
|
85 |
name: Ndcg@10
|
86 |
---
|
87 |
|
|
|
191 |
|
192 |
| Metric | NanoMSMARCO_R100 | NanoNFCorpus_R100 | NanoNQ_R100 |
|
193 |
|:------------|:---------------------|:---------------------|:---------------------|
|
194 |
+
| map | 0.6266 (+0.1371) | 0.3574 (+0.0964) | 0.6437 (+0.2241) |
|
195 |
+
| mrr@10 | 0.6220 (+0.1445) | 0.5321 (+0.0322) | 0.6663 (+0.2396) |
|
196 |
+
| **ndcg@10** | **0.6916 (+0.1512)** | **0.3806 (+0.0556)** | **0.7025 (+0.2018)** |
|
197 |
|
198 |
#### Cross Encoder Nano BEIR
|
199 |
|
|
|
214 |
|
215 |
| Metric | Value |
|
216 |
|:------------|:---------------------|
|
217 |
+
| map | 0.5426 (+0.1525) |
|
218 |
+
| mrr@10 | 0.6068 (+0.1388) |
|
219 |
+
| **ndcg@10** | **0.5916 (+0.1362)** |
|
220 |
|
221 |
<!--
|
222 |
## Bias, Risks and Limitations
|
|
|
421 |
</details>
|
422 |
|
423 |
### Training Logs
|
424 |
+
| Epoch | Step | Training Loss | Validation Loss | NanoMSMARCO_R100_ndcg@10 | NanoNFCorpus_R100_ndcg@10 | NanoNQ_R100_ndcg@10 | NanoBEIR_R100_mean_ndcg@10 |
|
425 |
+
|:------:|:-----:|:-------------:|:---------------:|:------------------------:|:-------------------------:|:-------------------:|:--------------------------:|
|
426 |
+
| -1 | -1 | - | - | 0.0186 (-0.5218) | 0.2940 (-0.0310) | 0.0428 (-0.4579) | 0.1185 (-0.3369) |
|
427 |
+
| 0.0001 | 1 | 0.7403 | - | - | - | - | - |
|
428 |
+
| 0.3860 | 4000 | 0.2255 | - | - | - | - | - |
|
429 |
+
| 0.7719 | 8000 | 0.153 | - | - | - | - | - |
|
430 |
+
| 1.0 | 10364 | - | 0.1429 | 0.6902 (+0.1498) | 0.3796 (+0.0546) | 0.7323 (+0.2316) | 0.6007 (+0.1453) |
|
431 |
+
| 1.1579 | 12000 | 0.1356 | - | - | - | - | - |
|
432 |
+
| 1.5438 | 16000 | 0.122 | - | - | - | - | - |
|
433 |
+
| 1.9298 | 20000 | 0.1158 | - | - | - | - | - |
|
434 |
+
| 2.0 | 20728 | - | 0.1267 | 0.6900 (+0.1495) | 0.3621 (+0.0370) | 0.7013 (+0.2007) | 0.5844 (+0.1291) |
|
435 |
+
| 2.3157 | 24000 | 0.0993 | - | - | - | - | - |
|
436 |
+
| 2.7017 | 28000 | 0.0945 | - | - | - | - | - |
|
437 |
+
| 3.0 | 31092 | - | 0.1184 | 0.6916 (+0.1512) | 0.3806 (+0.0556) | 0.7025 (+0.2018) | 0.5916 (+0.1362) |
|
438 |
+
|
|
|
|
|
439 |
|
440 |
### Framework Versions
|
441 |
- Python: 3.11.5
|
config.json
CHANGED
@@ -41,16 +41,15 @@
|
|
41 |
"num_hidden_layers": 22,
|
42 |
"pad_token_id": 50283,
|
43 |
"position_embedding_type": "absolute",
|
44 |
-
"reference_compile": true,
|
45 |
"repad_logits_with_grad": false,
|
46 |
"sentence_transformers": {
|
47 |
"activation_fn": "torch.nn.modules.activation.Sigmoid",
|
48 |
-
"version": "4.0.
|
49 |
},
|
50 |
"sep_token_id": 50282,
|
51 |
"sparse_pred_ignore_index": -100,
|
52 |
"sparse_prediction": false,
|
53 |
"torch_dtype": "float32",
|
54 |
-
"transformers_version": "4.
|
55 |
"vocab_size": 50368
|
56 |
}
|
|
|
41 |
"num_hidden_layers": 22,
|
42 |
"pad_token_id": 50283,
|
43 |
"position_embedding_type": "absolute",
|
|
|
44 |
"repad_logits_with_grad": false,
|
45 |
"sentence_transformers": {
|
46 |
"activation_fn": "torch.nn.modules.activation.Sigmoid",
|
47 |
+
"version": "4.0.2"
|
48 |
},
|
49 |
"sep_token_id": 50282,
|
50 |
"sparse_pred_ignore_index": -100,
|
51 |
"sparse_prediction": false,
|
52 |
"torch_dtype": "float32",
|
53 |
+
"transformers_version": "4.51.0",
|
54 |
"vocab_size": 50368
|
55 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 598436708
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb68e7aaba743a9bafcf7fd76ee9097328acc5e550b2c18209b302ecb6ef5c8c
|
3 |
size 598436708
|
tokenizer_config.json
CHANGED
@@ -933,13 +933,20 @@
|
|
933 |
"cls_token": "[CLS]",
|
934 |
"extra_special_tokens": {},
|
935 |
"mask_token": "[MASK]",
|
|
|
936 |
"model_input_names": [
|
937 |
"input_ids",
|
938 |
"attention_mask"
|
939 |
],
|
940 |
"model_max_length": 8192,
|
|
|
941 |
"pad_token": "[PAD]",
|
|
|
|
|
942 |
"sep_token": "[SEP]",
|
|
|
943 |
"tokenizer_class": "PreTrainedTokenizer",
|
|
|
|
|
944 |
"unk_token": "[UNK]"
|
945 |
}
|
|
|
933 |
"cls_token": "[CLS]",
|
934 |
"extra_special_tokens": {},
|
935 |
"mask_token": "[MASK]",
|
936 |
+
"max_length": 8192,
|
937 |
"model_input_names": [
|
938 |
"input_ids",
|
939 |
"attention_mask"
|
940 |
],
|
941 |
"model_max_length": 8192,
|
942 |
+
"pad_to_multiple_of": null,
|
943 |
"pad_token": "[PAD]",
|
944 |
+
"pad_token_type_id": 0,
|
945 |
+
"padding_side": "right",
|
946 |
"sep_token": "[SEP]",
|
947 |
+
"stride": 0,
|
948 |
"tokenizer_class": "PreTrainedTokenizer",
|
949 |
+
"truncation_side": "right",
|
950 |
+
"truncation_strategy": "longest_first",
|
951 |
"unk_token": "[UNK]"
|
952 |
}
|