Training in progress, step 500

Browse files

Files changed (11) hide show

config.json +23 -15
merges.txt +0 -0
pytorch_model.bin +2 -2
runs/Jul20_15-14-30_13a322e3f7f6/events.out.tfevents.1658330179.13a322e3f7f6.80.0 +2 -2
runs/Jul20_15-50-39_13a322e3f7f6/1658332243.7114267/events.out.tfevents.1658332243.13a322e3f7f6.80.3 +3 -0
runs/Jul20_15-50-39_13a322e3f7f6/events.out.tfevents.1658332243.13a322e3f7f6.80.2 +3 -0
special_tokens_map.json +49 -5
tokenizer.json +0 -0
tokenizer_config.json +63 -10
training_args.bin +1 -1
vocab.json +0 -0

config.json CHANGED Viewed

@@ -1,30 +1,38 @@
 {
-  "_name_or_path": "distilbert-base-uncased",
-  "activation": "gelu",
   "architectures": [
-    "DistilBertForSequenceClassification"
   ],
-  "attention_dropout": 0.1,
-  "dim": 768,
-  "dropout": 0.1,
-  "hidden_dim": 3072,
   "id2label": {
     "0": "LABEL_0"
   },
   "initializer_range": 0.02,
   "label2id": {
     "LABEL_0": 0
   },
   "max_position_embeddings": 512,
-  "model_type": "distilbert",
-  "n_heads": 12,
-  "n_layers": 6,
   "pad_token_id": 0,
-  "qa_dropout": 0.1,
-  "seq_classif_dropout": 0.2,
-  "sinusoidal_pos_embds": false,
-  "tie_weights_": true,
   "torch_dtype": "float32",
   "transformers_version": "4.20.1",
-  "vocab_size": 30522
 }

 {
+  "_name_or_path": "microsoft/deberta-base",
   "architectures": [
+    "DebertaForSequenceClassification"
   ],
+  "attention_probs_dropout_prob": 0.1,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
   "id2label": {
     "0": "LABEL_0"
   },
   "initializer_range": 0.02,
+  "intermediate_size": 3072,
   "label2id": {
     "LABEL_0": 0
   },
+  "layer_norm_eps": 1e-07,
   "max_position_embeddings": 512,
+  "max_relative_positions": -1,
+  "model_type": "deberta",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
   "pad_token_id": 0,
+  "pooler_dropout": 0,
+  "pooler_hidden_act": "gelu",
+  "pooler_hidden_size": 768,
+  "pos_att_type": [
+    "c2p",
+    "p2c"
+  ],
+  "position_biased_input": false,
+  "relative_attention": true,
   "torch_dtype": "float32",
   "transformers_version": "4.20.1",
+  "type_vocab_size": 0,
+  "vocab_size": 50265
 }

merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:51da89b344836b15b2f124e392d5bef6ecad1f9b57917b652549fc7584dc36c5
-size 267851249

 version https://git-lfs.github.com/spec/v1
+oid sha256:3dd41efbc575dd0687d31ce9ee305cc891349538fb6b6dfab1357de8b958cbd8
+size 556843759

runs/Jul20_15-14-30_13a322e3f7f6/events.out.tfevents.1658330179.13a322e3f7f6.80.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b8e68a0e9ae15ff125a5a8a28c8a58d328538595f3b48e451addad410796ad12
-size 4180

 version https://git-lfs.github.com/spec/v1
+oid sha256:a69c22d53ad344d58de4ea64c2a92f426e0890e418084d6895fe9b053586cab3
+size 21540

runs/Jul20_15-50-39_13a322e3f7f6/1658332243.7114267/events.out.tfevents.1658332243.13a322e3f7f6.80.3 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a8d7342dbf1853c2c394a71078a1e69f7197c9d09e79ef167dd8a0811854930b
+size 5327

runs/Jul20_15-50-39_13a322e3f7f6/events.out.tfevents.1658332243.13a322e3f7f6.80.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b00214a3c3652502a1f506a4aa55f72843c8f3cc0b449cf961fb638b346f97f9
+size 4350

special_tokens_map.json CHANGED Viewed

@@ -1,7 +1,51 @@
 {
-  "cls_token": "[CLS]",
-  "mask_token": "[MASK]",
-  "pad_token": "[PAD]",
-  "sep_token": "[SEP]",
-  "unk_token": "[UNK]"
 }

 {
+  "bos_token": {
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "cls_token": {
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "[MASK]",
+    "lstrip": true,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
 }

tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json CHANGED Viewed

@@ -1,14 +1,67 @@
 {
-  "cls_token": "[CLS]",
-  "do_lower_case": true,
-  "mask_token": "[MASK]",
   "model_max_length": 512,
-  "name_or_path": "distilbert-base-uncased",
-  "pad_token": "[PAD]",
-  "sep_token": "[SEP]",
   "special_tokens_map_file": null,
-  "strip_accents": null,
-  "tokenize_chinese_chars": true,
-  "tokenizer_class": "DistilBertTokenizer",
-  "unk_token": "[UNK]"
 }

 {
+  "add_bos_token": false,
+  "add_prefix_space": false,
+  "bos_token": {
+    "__type": "AddedToken",
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "cls_token": {
+    "__type": "AddedToken",
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "do_lower_case": false,
+  "eos_token": {
+    "__type": "AddedToken",
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "errors": "replace",
+  "mask_token": {
+    "__type": "AddedToken",
+    "content": "[MASK]",
+    "lstrip": true,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
   "model_max_length": 512,
+  "name_or_path": "microsoft/deberta-base",
+  "pad_token": {
+    "__type": "AddedToken",
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "__type": "AddedToken",
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
   "special_tokens_map_file": null,
+  "tokenizer_class": "DebertaTokenizer",
+  "unk_token": {
+    "__type": "AddedToken",
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "vocab_type": "gpt2"
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:49a7f70d73b3d125ded65a39442cdfac9759bbc7a749eacb29a4029a96f4e8aa
 size 3247

 version https://git-lfs.github.com/spec/v1
+oid sha256:ebff1b2578d1a609fbff8f596d5266adde7240d5506f8aa5559e22b3db7fa4c5
 size 3247

vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff