diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..52373fe24473b1aa44333d318f578ae6bf04b49b 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a136721311d1c1d4fc27d7946d5cb8297e9ec495 --- /dev/null +++ b/config.json @@ -0,0 +1,35 @@ +{ + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "bos_token_id": 128000, + "eos_token_id": 128001, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 3072, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "num_attention_heads": 24, + "num_hidden_layers": 28, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "torch_dtype": "bfloat16", + "transformers_version": "4.55.4", + "use_cache": false, + "vocab_size": 128256 +} diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00000-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00000-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..6b30abd0299b140102f80ccf183becc0c2a92bc0 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00000-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13fceebe5fc4b5abc6c4c97bb5657655ebd0e6ecd515452174fba1e9fd7e7b83 +size 6917672 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00001-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00001-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..c0f86aa6d595f1eb1e6df2a4c9af605be6e6e6a7 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00001-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c036edd5778dd904665ba34ae451890786d5a59170d8edbd7fcad883d8ef0382 +size 6825952 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00002-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00002-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..70eaa2bfad43afcdd0e9cc0d0926bd1b7497e5f6 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00002-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23be0816f6776858ad7392838c8bb01856a6b9737043ce9c7162b1c913c8f151 +size 6859424 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00003-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00003-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..e52798963001c7813b9bf59ede39a4253eaef8a6 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00003-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2c5f531ad82f221c205ffdfd5380ffec53a0d36d6e66df498c35541e9831652 +size 6933168 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00004-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00004-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..b183d7c4b091bb3de9b5850d285bebecdf5e9178 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00004-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d02dba8d27a67206fcdbf06b137718b70fdf164f24ec804a1ee97565345049 +size 6703448 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00005-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00005-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..d21165a04698eca7a0fa7a6e815ad9032c7a6047 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00005-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:082933d31f79bb7b3b05d00cfc7350146c30c754d72e61dbcf951f4e8d6591f4 +size 6912016 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00006-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00006-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..21f15d03d72a9be66cde1e95faa3497469071243 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00006-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c2ad7ffa261a201cde6648cf6bbb52335330a6aa6140168da604feb2da5849 +size 6867792 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00007-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00007-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..cf29bc0441659116bf229586ed99e973d23f487f --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00007-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f602652d4b781e24fcb795b804b66269a8fcbb943d01a1c5520bdfd726ffff5 +size 7061616 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00008-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00008-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..709239387c5cd1b84dc767cddf40a07fe56570a5 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00008-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ec0db8129bdde35d5421fe4a0006e96f54dfb94589650bcebed5c8b6ac9dfc5 +size 6849160 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00009-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00009-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..682757070b018882a73449e4816b32b24f6a792e --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00009-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:582e54605c4e0b429b97f717a548c238261441d3afdccb1ff93443cffdfa32f6 +size 6780472 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00010-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00010-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..20b5f8fee2fad229ee07dc537100409aae0b639f --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00010-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c074820939af0bf6d31e57be2d02f98d62422f518618c78093ac375ce384823 +size 6875072 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00011-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00011-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..6d92c0ccff38a2060defc519f793efc163c4e2f5 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00011-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4a4665472917c3b8afc2f1ba802bbaccb29728724f1200238b14dbf25222bcd +size 6973824 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00012-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00012-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..7f94e5e8dce6b7289e6a193b430fdf255cbeec8c --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00012-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0653333e6b112c8a3d6648fee97fd900621358bb372261bc3492ccc218aea280 +size 6904480 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00013-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00013-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..bfeb3803d460a9a9126305f5b932154fe775e48d --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00013-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dce31ad7e07c62d7b247dede34138421c5e908ae8317c1c6f1d0d6acf8c909a +size 6948976 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00014-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00014-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..01e4d9d287569ac4c5b11606fb069b3705df36d8 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00014-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25b913f903de5cfae743dce45d43efe9b9ffaf5aec8add388d953a8972510efd +size 6937328 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00015-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00015-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..5fb976284b2a6492dbbcb55dcd79d16cb10ef5f4 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00015-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e329498cd850f0f3163c0535fc62f5b02e5a93caea727f7f7bd3c31464f6a189 +size 7158560 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00016-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00016-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..9818fc4365627aab2d87f3700efb8a58a68ffd3a --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00016-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4cc4255bead8ec94c7e3d245cdeed8e957d1b5e23cf0864e28dd3e7cd41fb69 +size 7046512 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00017-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00017-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..c1375a4d2cb39ac1ef32f5310a8d18433e47cc78 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00017-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a89c12b9a140ae6a25276820c5401262f0e3c9f9492a71982170cc63af0bb19d +size 6867960 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00018-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00018-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..b454f662fc2e60107e910d17d9db8f97ab98a529 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00018-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db1bd66d83dba50d987ef182cf132add642c2137f960fb4126b07c3495950ae9 +size 6904392 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00019-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00019-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..9579c846d26058a154488e21fae239f10411ad28 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00019-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b97082992fb288254493f688d6866758174c0cce905803a012f2f17b2c5f1a9 +size 7017248 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00020-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00020-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..6663fc2e6d4de943415b712e77957ba14e13ffe8 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00020-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cd775ca10234be618f5eb54c623cc6d2cfdd473a36bae72fae7a1b5e7a24407 +size 7085272 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00021-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00021-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..7073ee62e2e890504b6ba63da84a439ec23f403a --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00021-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7a1b6396bc87bda2a2becc9880a165eb01552b1872e85f5cab9baca6360387f +size 7202112 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00022-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00022-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..2014e0fed19780823f3eb108f393616fc3b62e78 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00022-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:133490047030ec7e295613f02a6d7767079ceacbb449a57ad5e7b5279e148891 +size 7076888 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00023-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00023-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..8603e3402d631d73fb2d274c729deedc113f5dcd --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00023-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05517673ae62fa233fa2e52be76359e15b017a3bc19cb273d157bff49d162063 +size 7054312 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00024-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00024-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..006836f06656303812fae54e942794d52d461f98 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00024-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af7a7f143ab1d3f4bf8fccdf05d68232a5fbca6b9fdbfa470a3eadcedc3d1950 +size 6994248 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00025-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00025-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..231a11bdf674012b529bb869018d404a81c10a9a --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00025-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5800aeb87cdc31b8d377ed5e3bcac2551264b562128ca34bec335d3cc0388c9d +size 6839208 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00026-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00026-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..df0dc85e418ad7eb725a7d109d11f6989c7eb2de --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00026-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a273ced942be54a02d6d751d8b9a31831903154b2cb5f8e7af8672b82d7c0e8b +size 6973208 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00027-of-00028.arrow b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00027-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..6cffd09d14cf6c2f0a5df39ca843bdab82db5b62 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/data-00027-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:271a44ac87198d71091872779399729e0bd72ec5f773a845f9dc79ef1b6864af +size 7046528 diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/dataset_info.json b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..2c93369e7a9b746589b7dbc435dd643bc02d8d6c --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/dataset_info.json @@ -0,0 +1,40 @@ +{ + "citation": "", + "description": "", + "features": { + "input_ids": { + "feature": { + "dtype": "int32", + "_type": "Value" + }, + "_type": "List" + }, + "attention_mask": { + "feature": { + "dtype": "int8", + "_type": "Value" + }, + "_type": "List" + }, + "labels": { + "feature": { + "dtype": "int64", + "_type": "Value" + }, + "_type": "List" + }, + "position_ids": { + "feature": { + "dtype": "int64", + "_type": "Value" + }, + "_type": "List" + }, + "length": { + "dtype": "int64", + "_type": "Value" + } + }, + "homepage": "", + "license": "" +} \ No newline at end of file diff --git a/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/state.json b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/state.json new file mode 100644 index 0000000000000000000000000000000000000000..d350727d34a8229b82d209275206fe7da630e1f6 --- /dev/null +++ b/dataset_prepared/0d17ed7654ff305aa19c77e503fc1265/state.json @@ -0,0 +1,94 @@ +{ + "_data_files": [ + { + "filename": "data-00000-of-00028.arrow" + }, + { + "filename": "data-00001-of-00028.arrow" + }, + { + "filename": "data-00002-of-00028.arrow" + }, + { + "filename": "data-00003-of-00028.arrow" + }, + { + "filename": "data-00004-of-00028.arrow" + }, + { + "filename": "data-00005-of-00028.arrow" + }, + { + "filename": "data-00006-of-00028.arrow" + }, + { + "filename": "data-00007-of-00028.arrow" + }, + { + "filename": "data-00008-of-00028.arrow" + }, + { + "filename": "data-00009-of-00028.arrow" + }, + { + "filename": "data-00010-of-00028.arrow" + }, + { + "filename": "data-00011-of-00028.arrow" + }, + { + "filename": "data-00012-of-00028.arrow" + }, + { + "filename": "data-00013-of-00028.arrow" + }, + { + "filename": "data-00014-of-00028.arrow" + }, + { + "filename": "data-00015-of-00028.arrow" + }, + { + "filename": "data-00016-of-00028.arrow" + }, + { + "filename": "data-00017-of-00028.arrow" + }, + { + "filename": "data-00018-of-00028.arrow" + }, + { + "filename": "data-00019-of-00028.arrow" + }, + { + "filename": "data-00020-of-00028.arrow" + }, + { + "filename": "data-00021-of-00028.arrow" + }, + { + "filename": "data-00022-of-00028.arrow" + }, + { + "filename": "data-00023-of-00028.arrow" + }, + { + "filename": "data-00024-of-00028.arrow" + }, + { + "filename": "data-00025-of-00028.arrow" + }, + { + "filename": "data-00026-of-00028.arrow" + }, + { + "filename": "data-00027-of-00028.arrow" + } + ], + "_fingerprint": "d9cfb4a95203cd78", + "_format_columns": null, + "_format_kwargs": {}, + "_format_type": null, + "_output_all_columns": false, + "_split": null +} \ No newline at end of file diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00000-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00000-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..71890e93083f66fb69eb28e86ac3ecfe4476f631 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00000-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed50a45a97932f9b301c5960db14496c7a770c62eaa4353a882bbad1775e8480 +size 4256104 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00001-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00001-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..585b3a4339d7a4433757d9cfdf3a7a261f9aec93 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00001-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:859b8371be178104f881bbfae81745966d5f8b89597ef636bf48d67cc97be6a4 +size 4329376 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00002-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00002-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..b4db74794f314848b4026e81479067bf3a1a5b94 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00002-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35eb72eed75e16f397e450f301619b9edde042d73c40b4fc0a1194b90cd708a1 +size 4229312 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00003-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00003-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..05f2530d6358d0057ff4da0cf1b747223fc0816e --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00003-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0c85a4604ca251367d92caea18c07ebd55351bffa2b86492646bfac4b987627 +size 4195952 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00004-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00004-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..a788687eca682a8be09790e7589351ab14fa0d15 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00004-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6c07d894e78863bd12244912cfdd88b87fae6732e64945188edb87683e42f8d +size 4374608 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00005-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00005-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..a1b151b1a1e0f0a96c98e37004dd7ccd62c85bb6 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00005-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8a93d6aec3f2e84fa94e742506b510ec08c7fe1d9bcab6f253a49b0ac5a87db +size 4316656 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00006-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00006-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..041ea55b7e04246688747acbf4d9b08fa1e3b49e --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00006-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71f7e0c89910704e2acf6900077aaf8436d74ea0226065dd0b73d8f6f35c146b +size 4407544 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00007-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00007-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..9559c94d68bb944078a3274abd15510850e7fe22 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00007-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:781c7dc9f7dcbcd5a2cdee471d2ccd340e0bbf6a9e5d2f943a8bd9bacc2875cf +size 4270040 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00008-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00008-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..2debbfe9326a9afd5bb5229be8184368bf3041cd --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00008-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c77ec8363b77c97b2d6727040624dc8367b58196c3a5346daad876f0343196bc +size 4302048 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00009-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00009-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..8be370ca9b35bc47bcd82e83e6b9b446bd11c51d --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00009-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ce9902c943e1ab7b5cfd2bb6c14d2c9f80ad6f55085273a9b72151484fb6926 +size 4334336 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00010-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00010-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..b47eacda9949d689d63467a375db47dc93d7ce30 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00010-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:661c143c0a4b1b2c4795114882b88d28bf9c3b713ef99b1027b603e7f95deb3c +size 4297032 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00011-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00011-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..b1c3dc007f7b4da943f665d7d8cee6060fa3d92a --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00011-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcb7c50aa9ef171afacf3fb9c7ecb46cf9fcc0e7b4faa0a6d38e57031ec64f33 +size 4312624 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00012-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00012-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..5338ffbbfe0a74883a61e6f27658afad80166e36 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00012-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43d3ee09c7d0094f9a49b1c4e767a1696a56a0b02eda7f1de3de286860051ca4 +size 4274608 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00013-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00013-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..91da614389c895689fe707a9518ef882f19db3f6 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00013-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:342483149fb99f2f5f2a82fa991bb2ba075a5bdd00a77468cf556b8bebd5f29c +size 4331336 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00014-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00014-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..5fd5bca39d06a7ec416754d528b5173908d0bca0 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00014-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:079532d6452e53fa6706ca47f0e52ef125725c59be9ece47cdbd0b59fa043e94 +size 4341456 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00015-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00015-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..3382c7c54c9c0264eba3daf983240edc0fc377a1 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00015-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6512490f51e0d26840e3f6bbe2371709e5709e145fb5a48532a31593e81756 +size 4286616 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00016-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00016-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..80632e3833d4106a22dfb7c90da3cd199d979cee --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00016-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa9756b4cc7bc036161ccd7034a538ec1a771c099c979c6fe9392f7f2bdfe445 +size 4360440 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00017-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00017-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..3ac632e9409be9c118f9cbaa11bb7713cd674a72 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00017-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8644aea002ab00f8aa9d3b4299e4a35d3d3b0ed69c7224ce07ad2ccd685c770 +size 4200408 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00018-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00018-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..3ce8c5b0bb288debfba2ebb6604a296ec12eeb65 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00018-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52d8482586a945fb08942ecbe22266a6af4e9fb274e350fdbcea98fc7cf94f45 +size 4289720 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00019-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00019-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..e3334a5b94db5a87c7993e1a13ce8b6a9b8a0e46 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00019-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88945a1674fdf85be0fdb83feeeb472eb961378e8e189be0d96900277d19b0b6 +size 4254104 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00020-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00020-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..d426d0fe3c2dded6fe004cff67c05f673b27b40b --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00020-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1dbc3029baa42dd775c445d0a85782dcc8f3871a590b88a602a0962829ff9ae +size 4253040 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00021-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00021-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..7f002810f925aca96e09e2d95a71cefe1a9e2d92 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00021-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4921fa64b5223f0ab1b4ad4eaf0e1c3149aedec884f5d481c235289adb1e340d +size 4319336 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00022-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00022-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..7f115ec9979d9599be249a0028c27c4abcc28d50 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00022-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0097ab40452b0df2dc4f4563e8a293c6651c8d91f115a99d177d787448c10609 +size 4341136 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00023-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00023-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..b28945ca35dbe82b9aafc19dca283b423ee7e103 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00023-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:326415c6cc5c728ad61d9c6890fd4b50fdbee7a1a27a0f7e539f5104859c1c7b +size 4397448 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00024-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00024-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..ea36f09c930985dafa88678b4980da48cb35b9e2 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00024-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7efab1233d963c4b8d4af9f442447b67c420acf8d16b4ac41adac2628026201 +size 4234240 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00025-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00025-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..9c4c1e5c62cc09579c5c3ceeecbfe2e56170384d --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00025-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ea2fa0dac995c63ce6c3ce95638240368d03c352ba7266eeb842fbeb30f095f +size 4264896 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00026-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00026-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..f5d4119b46bdec3600d0d5bc0ab4e532090b6303 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00026-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6224f61b7d6fd1ee6e56a462d9bad4dc6985cad34680648d8d9b0e726da1bc2f +size 4292560 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00027-of-00028.arrow b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00027-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..2b434f7e597f0b08593c9b70a0c9456647fa627f --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/data-00027-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfbe92285819e9eafbb32310b0d8bfc418fe8f9ae52ef4510731bdf9c3413a7a +size 4275888 diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/dataset_info.json b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..0dc0cb28b8abc3a16a2403e346f17f2db870eccd --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/dataset_info.json @@ -0,0 +1,29 @@ +{ + "citation": "", + "description": "", + "features": { + "input_ids": { + "feature": { + "dtype": "int32", + "_type": "Value" + }, + "_type": "List" + }, + "attention_mask": { + "feature": { + "dtype": "int8", + "_type": "Value" + }, + "_type": "List" + }, + "labels": { + "feature": { + "dtype": "int64", + "_type": "Value" + }, + "_type": "List" + } + }, + "homepage": "", + "license": "" +} \ No newline at end of file diff --git a/dataset_prepared/9bc662aed65b76546b2d635b3957a343/state.json b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/state.json new file mode 100644 index 0000000000000000000000000000000000000000..cbb25799112fe91cfc54051fba4f4b009e23c6f0 --- /dev/null +++ b/dataset_prepared/9bc662aed65b76546b2d635b3957a343/state.json @@ -0,0 +1,94 @@ +{ + "_data_files": [ + { + "filename": "data-00000-of-00028.arrow" + }, + { + "filename": "data-00001-of-00028.arrow" + }, + { + "filename": "data-00002-of-00028.arrow" + }, + { + "filename": "data-00003-of-00028.arrow" + }, + { + "filename": "data-00004-of-00028.arrow" + }, + { + "filename": "data-00005-of-00028.arrow" + }, + { + "filename": "data-00006-of-00028.arrow" + }, + { + "filename": "data-00007-of-00028.arrow" + }, + { + "filename": "data-00008-of-00028.arrow" + }, + { + "filename": "data-00009-of-00028.arrow" + }, + { + "filename": "data-00010-of-00028.arrow" + }, + { + "filename": "data-00011-of-00028.arrow" + }, + { + "filename": "data-00012-of-00028.arrow" + }, + { + "filename": "data-00013-of-00028.arrow" + }, + { + "filename": "data-00014-of-00028.arrow" + }, + { + "filename": "data-00015-of-00028.arrow" + }, + { + "filename": "data-00016-of-00028.arrow" + }, + { + "filename": "data-00017-of-00028.arrow" + }, + { + "filename": "data-00018-of-00028.arrow" + }, + { + "filename": "data-00019-of-00028.arrow" + }, + { + "filename": "data-00020-of-00028.arrow" + }, + { + "filename": "data-00021-of-00028.arrow" + }, + { + "filename": "data-00022-of-00028.arrow" + }, + { + "filename": "data-00023-of-00028.arrow" + }, + { + "filename": "data-00024-of-00028.arrow" + }, + { + "filename": "data-00025-of-00028.arrow" + }, + { + "filename": "data-00026-of-00028.arrow" + }, + { + "filename": "data-00027-of-00028.arrow" + } + ], + "_fingerprint": "91eb925f8773717a", + "_format_columns": null, + "_format_kwargs": {}, + "_format_type": null, + "_output_all_columns": false, + "_split": null +} \ No newline at end of file diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00000-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00000-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..57d0e06f57ab611fa58a8481f63f2a78f6d07d49 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00000-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ece875b9a47f181a21a3ba9461769a3ed6542b0b26a9b0ac1898ce3f4a696ab +size 4252024 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00001-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00001-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..8885b38be0f0497b89429d3ca40982b0557f0167 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00001-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:851131dba92edbb0886ac34119dafc6cd5115816d19540b3336384cd552c463c +size 4170016 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00002-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00002-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..ec1e5945128195ad2940d60d26dc79d0eef47c6d --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00002-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46706a50a1026910268963c6b150750e75f6dc3c2d993d9961fffe43e33824d7 +size 4274936 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00003-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00003-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..7beb2370e71fdb2d429b1c0b6cefc071e37f6581 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00003-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a1853b8c7b1c61bc71f1ce87e1b23e8265703c6ead4bbfcdf8a2679d6a2cce7 +size 4354480 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00004-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00004-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..e709cdbd5a104e96c9c71366256b2c6e03572650 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00004-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc0cd4a9035fb29fa4e8673a775250ef7a6a02dc31e7a7a1881b0789413c24ae +size 4232496 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00005-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00005-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..7292294c8b9d6f27e09c3b59b94c9edebe1e6105 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00005-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ce81795b814bde101af1bf9f7e9bb9533f8e12083ba1015f9d746f025d43036 +size 4317080 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00006-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00006-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..38c9d0479dd18261037c49556b43fc1dc6f52e33 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00006-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5613e3551f7ddcf1bd56c823c89aef8b5a183fc2c2fb9e26befc1dfa883ded74 +size 4371000 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00007-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00007-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..ea8cce3ee2a89978719fed3ab1b539425e6721d8 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00007-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e462da793b444b5234787c6a7d85fd7b82c4c527dc224a175ffb570237dec23 +size 4273168 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00008-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00008-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..8e07e223c18cb559cd9eed3392663459fa6a94ce --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00008-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:096de7f3a34869a28b50b35c4bb97d415f2a606d84a82c9ba4713ff5cd3866f4 +size 4319240 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00009-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00009-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..694c86b2dd017453ccdc37eb687b509a28e7932e --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00009-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22eec843f9fe9bcdc6de5192e160e3a7c2d66e3436783922f5be469a36388a3f +size 4220840 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00010-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00010-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..c5f61472986c14555f73d5f2614d8aeadbdd3730 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00010-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bf2f1c19cf5a8f83301076d34c7cc384e70f780db185d5ad9c5002b314ad928 +size 4361872 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00011-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00011-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..2a3a4c0f5c46ebdbfceb91fbd104f723d1e96c10 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00011-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8455a6e031a17d6cc9bda895dec3121db7d25b179510d77fe2c5eb1ded0c8fe +size 4339848 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00012-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00012-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..d71cae8c784ec218562e697a596ef50c9f5b13f3 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00012-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da37250592d009faea37475abf27f8582a4fe6e313e4f427be464ab9d7c1fcb0 +size 4246928 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00013-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00013-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..461b71a7ef6cce7bc7c24158448446b44646a90d --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00013-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:238efc1bbd637c7e6b4a2525adc455fb8d92f9e96b0d9d330b40255dba6965d9 +size 4264536 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00014-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00014-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..45ceee6d3e0e9f5a11ac1c62a06c0abce28460c9 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00014-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d9c0ae6d0e442038db7de67e3d56d071ac185cfac2b86d70d38a86dbe0a95bb +size 4273960 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00015-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00015-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..e5df30eeff53cd5635e816623bd7512748b87d28 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00015-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4132174c84ed843f097ef3bd817db9ec5fc204f364f356ca7fc16d510e1eb689 +size 4260432 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00016-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00016-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..a9e6b2a86634a69240929a4dc45da2639222ded1 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00016-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:372a23b8cbe82d9b0423c36a9ac1086e38e9db845ecf1011cd28159f25019e74 +size 4286712 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00017-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00017-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..118be1f1e22a15cc11f784bc990551437765ead8 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00017-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2849ffc027a7f7e3ad7c7a3df75168e062869d982e11b0b6a5d61f33e4aa7106 +size 4406904 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00018-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00018-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..a6edf2400f969d2cdba5f0c099763a6501275255 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00018-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb9ce21e9ec2b8254b887aac14c279268ab6c8237b39c5b598c01db1a982bdcb +size 4366688 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00019-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00019-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..ba3c37c6085834b2be660e60bde52882dc65651c --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00019-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6d0a9625940fac25380a3e1b8af0372813cf4918594e71a8e29aa228ce3c112 +size 4263992 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00020-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00020-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..b0cb51a8f79733a2c0d730eddaa29b9c006dd454 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00020-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c19f4dbecb15e977c0c75d18742824796553510831c0b8244ea9f3876c425dc +size 4384344 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00021-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00021-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..dccd0d9820e9c999795c4091a7030d4dd7537abd --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00021-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:347f4c7d9f4ddadfe6bd7a5041565f43141f7504dca14be0877adacee6b4dba2 +size 4310888 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00022-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00022-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..4501e6472bfff1b240a3b16c129e461f1a9b7d46 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00022-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4afaf16306c321b54ab1f4396bc3cc1e7cf879373af7d835cf856ed8049fe57c +size 4331792 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00023-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00023-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..b3fc002deb9f27b245724305133a2ed044c06cd2 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00023-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e07cdef1b5c5cf52a530f6daebbfb5ebe2a49877de8196a9b87d2a4be7b4b3b6 +size 4201064 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00024-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00024-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..6a6590f5bbdccf0fb7f859af9fd6e5a43d29108f --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00024-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4959889937973e0d9dd787c0a0a1ed376659cb6cf74eb3996faaae7b9ed289c +size 4336352 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00025-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00025-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..15bd3b0761e86c84e50ae47b8ab69c45e5577a79 --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00025-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88aa5c30d5866d4e29d09d0fef3c910eb3c8d9cbfd4b9220465b5f8097daa849 +size 4290936 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00026-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00026-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..c9bfad4769586a405adf96aa670bad811023d13a --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00026-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54834458e3a0fe199b72e9f18d931f8e0474aea7dd79062759750420ee48c619 +size 4346848 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00027-of-00028.arrow b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00027-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..e1d24517c911709dc71f529adf380e7bea27e91a --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/data-00027-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0009ce9cae5ba053e2efa0974b6c04f4c8b2ddfbec2000cd26af48eb41d9774b +size 4283504 diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/dataset_info.json b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..0dc0cb28b8abc3a16a2403e346f17f2db870eccd --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/dataset_info.json @@ -0,0 +1,29 @@ +{ + "citation": "", + "description": "", + "features": { + "input_ids": { + "feature": { + "dtype": "int32", + "_type": "Value" + }, + "_type": "List" + }, + "attention_mask": { + "feature": { + "dtype": "int8", + "_type": "Value" + }, + "_type": "List" + }, + "labels": { + "feature": { + "dtype": "int64", + "_type": "Value" + }, + "_type": "List" + } + }, + "homepage": "", + "license": "" +} \ No newline at end of file diff --git a/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/state.json b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/state.json new file mode 100644 index 0000000000000000000000000000000000000000..1995d045a557e61e95e025caa1bd6470ef9c24de --- /dev/null +++ b/dataset_prepared/a50226d4b4361e66bb091ddd7857cd71/state.json @@ -0,0 +1,94 @@ +{ + "_data_files": [ + { + "filename": "data-00000-of-00028.arrow" + }, + { + "filename": "data-00001-of-00028.arrow" + }, + { + "filename": "data-00002-of-00028.arrow" + }, + { + "filename": "data-00003-of-00028.arrow" + }, + { + "filename": "data-00004-of-00028.arrow" + }, + { + "filename": "data-00005-of-00028.arrow" + }, + { + "filename": "data-00006-of-00028.arrow" + }, + { + "filename": "data-00007-of-00028.arrow" + }, + { + "filename": "data-00008-of-00028.arrow" + }, + { + "filename": "data-00009-of-00028.arrow" + }, + { + "filename": "data-00010-of-00028.arrow" + }, + { + "filename": "data-00011-of-00028.arrow" + }, + { + "filename": "data-00012-of-00028.arrow" + }, + { + "filename": "data-00013-of-00028.arrow" + }, + { + "filename": "data-00014-of-00028.arrow" + }, + { + "filename": "data-00015-of-00028.arrow" + }, + { + "filename": "data-00016-of-00028.arrow" + }, + { + "filename": "data-00017-of-00028.arrow" + }, + { + "filename": "data-00018-of-00028.arrow" + }, + { + "filename": "data-00019-of-00028.arrow" + }, + { + "filename": "data-00020-of-00028.arrow" + }, + { + "filename": "data-00021-of-00028.arrow" + }, + { + "filename": "data-00022-of-00028.arrow" + }, + { + "filename": "data-00023-of-00028.arrow" + }, + { + "filename": "data-00024-of-00028.arrow" + }, + { + "filename": "data-00025-of-00028.arrow" + }, + { + "filename": "data-00026-of-00028.arrow" + }, + { + "filename": "data-00027-of-00028.arrow" + } + ], + "_fingerprint": "f6c319a09007ccf8", + "_format_columns": null, + "_format_kwargs": {}, + "_format_type": null, + "_output_all_columns": false, + "_split": null +} \ No newline at end of file diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00000-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00000-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..b277a21b3cf7f47d0572a1b00b19481d70f64cd2 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00000-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2be71087455f3418aa32acfc779e52c0a08f07eded32de3f1130513b8fa56eb1 +size 7234504 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00001-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00001-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..5de0247559a6c7ed12fc5c62808aa54b5a645466 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00001-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57e69ae8ac18c9b45276438f47cdda7fa07a854088e37388c2c8a2135bfbcaed +size 6803304 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00002-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00002-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..3c7d1cd83363a32be2dbd62fc18d63a31fec3244 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00002-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c91674ce32fb10612c43fdf7ef6882a043096b4c614312fedf8ad19e634ed3c +size 6995384 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00003-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00003-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..a28df0a0ff7c4dd065d65de8e56d3c3c2d762a8c --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00003-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:161dfe2212c103551eb4ddc932ae892addf455ea4d015f6d5ffe61aca0accdc6 +size 6756608 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00004-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00004-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..1f0ecd52073231a4af70e9a7efa7a36ddf0285f1 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00004-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c731a83ee2cd49911c7c2ee472526f973328c289c57872b74231b289104ca438 +size 7052384 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00005-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00005-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..8e988ad089b6fb69390ec141ae1cdc2797aaa98d --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00005-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd7e4f7cca735f56fd5d20009eb7be6095e75bbcc5a1ce7fbd6bab4324535f0e +size 6899208 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00006-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00006-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..800a3dbff495216a0a066b0f7cb8bbf770b9fe79 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00006-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d43a3945f47222be8acd77fd013545af630737e08a9b2fb1a158709b805ebfce +size 7102712 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00007-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00007-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..bf2d63e199d550e8eea323018fc7707a442bb497 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00007-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4244ae2fc11e02dbc413ac013e73ecbede813bd022aa98b49503db4c22c814ff +size 6678048 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00008-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00008-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..5d387d989df13e19a95f646c79e7104945ccffaf --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00008-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84b22bd08867796ad779f8216b3f89e4b634290ad5459c1a0cbb7435d1d8d825 +size 7019912 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00009-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00009-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..76abcd3cb5aeae2731ff282934cb9403662c8359 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00009-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20c66f0f7e4d67d0ffe6e20a62e654f3cebadabd004a2b9335ea332144bd7d54 +size 6927632 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00010-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00010-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..390abe34077d0ef39c96c5c63080f0914e5e6397 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00010-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab7585ab715e960e492b60377fbeb842353c4f1fb4f5e3dff62397ad754f5ebc +size 6911448 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00011-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00011-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..6abe23c9be5aad18932a7545d3340c6873da641f --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00011-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03682ceeb039bb405a97fbc7d58734126867faa426b113668972771997526b51 +size 6958496 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00012-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00012-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..b314a8bd7f8809fffb94fa4a5df7538428fc3ddc --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00012-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95738bd380a95938e95323ae7672c7b5eae38d8fe4bf164907537e39048d1f3c +size 6910992 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00013-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00013-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..6b2701702de4991df1ed9993fa82ac41a2d75863 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00013-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0fcbae0666cf46878a14e2942467e2f83ebb6a73542ecb19b2ae3aad1dbe44 +size 7038000 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00014-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00014-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..3725d4395ca483a5df08d20352278408c4653b9a --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00014-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07e705ab9076dd80029ceabc7a5b1304497bb16a7c81b57ea497e4c92d582819 +size 6797272 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00015-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00015-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..be898e536a69e882005a47c0b0a23a7db0e5d65b --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00015-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64b05a8332f333a95c036006331ff66727c992654cc6930b42cbbe1bdbf201b0 +size 6968088 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00016-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00016-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..898732f67232d2b18b6e9a5015af332d2856fc8c --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00016-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e207ee06c6e0c33750423fe700c951c9235ad6a73be741674aae1e17463261ce +size 7039640 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00017-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00017-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..ae79c6fb05c28661c8229dc87a36bf32a4a707de --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00017-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aa7459cb37a05382666246873456d1add929525ae9836b0525f6c7d0f1b3c73 +size 6914704 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00018-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00018-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..f3fc9c940947a871aca60baebffe60428898398d --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00018-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d68c3f2dc9bf80b2bdc559e0a8e866c6618353a6f4b3fb5c8f1de273a89a4980 +size 6925192 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00019-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00019-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..135e666c549c6a570dfb220d8edafb9d6762d1d8 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00019-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60ae4c82efc67e53acc244bc5f7b7827843560f8b0ee249326bb1e4156622f3d +size 6880968 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00020-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00020-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..43caf915b31dfbbe89aa762fcb449d7d3a742342 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00020-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e53b281a547c422db43e75a96dc5a12f0916978cd305e0cd80e3e6285729f70 +size 6943032 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00021-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00021-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..44be8e5eb7ec3b98ed886b304778df237cc14c1f --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00021-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f59622abbb8cef5643c94e37a02e967d2fff82ad338d943f46127e1ec02e768 +size 6846520 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00022-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00022-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..76e8d22d02857e16801bdac31f5beb08bde2f996 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00022-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e7eaea778f877efcbf05684a11774ccfadc6fadc8533ecf3530a3619f78a582 +size 6992464 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00023-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00023-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..f5f3083d92621796ed368ddbbfd83f577df885de --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00023-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38ee9b617348414f9f70e341b8e6e79d2224d50f8e291ab541dba664b8b62cd3 +size 7164632 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00024-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00024-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..6f1a9230d501de6a889f25d26d1074653b07d7fb --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00024-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f330955a83214c96826af80efca68d22b34b5621d38f8ffb48c6ff480f6f2315 +size 7000568 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00025-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00025-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..111c2db19ddb455dcd0c9609d67889748ae3e3b2 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00025-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41631a959ce7d95880f671dadd896a4a4389bde7deea8048bc39a961488fe5f1 +size 6944984 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00026-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00026-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..aa2016956d54e96437c82b7eb87b848028321221 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00026-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:568c90437eb068d5a13aa1f9d02c2c5d287c59ea141be9b8cefbd5f3c5f03fe9 +size 6939488 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00027-of-00028.arrow b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00027-of-00028.arrow new file mode 100644 index 0000000000000000000000000000000000000000..72ae13abee66dfb09556e540edb8f5ea4f1359a6 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/data-00027-of-00028.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aa184a02f7a75c5ddd9122459f41421ed66c598f8db92b19e61d06c67379509 +size 6970712 diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/dataset_info.json b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..2c93369e7a9b746589b7dbc435dd643bc02d8d6c --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/dataset_info.json @@ -0,0 +1,40 @@ +{ + "citation": "", + "description": "", + "features": { + "input_ids": { + "feature": { + "dtype": "int32", + "_type": "Value" + }, + "_type": "List" + }, + "attention_mask": { + "feature": { + "dtype": "int8", + "_type": "Value" + }, + "_type": "List" + }, + "labels": { + "feature": { + "dtype": "int64", + "_type": "Value" + }, + "_type": "List" + }, + "position_ids": { + "feature": { + "dtype": "int64", + "_type": "Value" + }, + "_type": "List" + }, + "length": { + "dtype": "int64", + "_type": "Value" + } + }, + "homepage": "", + "license": "" +} \ No newline at end of file diff --git a/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/state.json b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/state.json new file mode 100644 index 0000000000000000000000000000000000000000..e93555290eeb2a63290ed407d618652c1dccafa6 --- /dev/null +++ b/dataset_prepared/a54435349df4e7483d0519bb93d7fd9a/state.json @@ -0,0 +1,94 @@ +{ + "_data_files": [ + { + "filename": "data-00000-of-00028.arrow" + }, + { + "filename": "data-00001-of-00028.arrow" + }, + { + "filename": "data-00002-of-00028.arrow" + }, + { + "filename": "data-00003-of-00028.arrow" + }, + { + "filename": "data-00004-of-00028.arrow" + }, + { + "filename": "data-00005-of-00028.arrow" + }, + { + "filename": "data-00006-of-00028.arrow" + }, + { + "filename": "data-00007-of-00028.arrow" + }, + { + "filename": "data-00008-of-00028.arrow" + }, + { + "filename": "data-00009-of-00028.arrow" + }, + { + "filename": "data-00010-of-00028.arrow" + }, + { + "filename": "data-00011-of-00028.arrow" + }, + { + "filename": "data-00012-of-00028.arrow" + }, + { + "filename": "data-00013-of-00028.arrow" + }, + { + "filename": "data-00014-of-00028.arrow" + }, + { + "filename": "data-00015-of-00028.arrow" + }, + { + "filename": "data-00016-of-00028.arrow" + }, + { + "filename": "data-00017-of-00028.arrow" + }, + { + "filename": "data-00018-of-00028.arrow" + }, + { + "filename": "data-00019-of-00028.arrow" + }, + { + "filename": "data-00020-of-00028.arrow" + }, + { + "filename": "data-00021-of-00028.arrow" + }, + { + "filename": "data-00022-of-00028.arrow" + }, + { + "filename": "data-00023-of-00028.arrow" + }, + { + "filename": "data-00024-of-00028.arrow" + }, + { + "filename": "data-00025-of-00028.arrow" + }, + { + "filename": "data-00026-of-00028.arrow" + }, + { + "filename": "data-00027-of-00028.arrow" + } + ], + "_fingerprint": "d741c22fac48027d", + "_format_columns": null, + "_format_kwargs": {}, + "_format_type": null, + "_output_all_columns": false, + "_split": null +} \ No newline at end of file diff --git a/dataset_prepared/datasets_prep.lock b/dataset_prepared/datasets_prep.lock new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9468708525d51476d9de6e9d801d64e45ca25817 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,9 @@ +{ + "_from_model_config": true, + "bos_token_id": 128000, + "do_sample": true, + "eos_token_id": 128001, + "temperature": 0.6, + "top_p": 0.9, + "transformers_version": "4.55.4" +} diff --git a/model-00001-of-00002.safetensors b/model-00001-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f6569eb868a1b8b6f5b11c0c9c64311a74b8df9d --- /dev/null +++ b/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:449488eb379733f4e1e90ba1ff3b8ca79eb1de645e56abfd2dd1514f7dde4b26 +size 4965799096 diff --git a/model-00002-of-00002.safetensors b/model-00002-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c9b6131e8b4b54ddc83b8c9ddb784e57b40a4c83 --- /dev/null +++ b/model-00002-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4620123f28be3355abd208704f2dc2047b09670b5fefd0480ce5c505a5bcb43 +size 1459729952 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000000000000000000000000000000000000..f84d97fd898b58f94bee86f87fd1ea4ce22e86f3 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,262 @@ +{ + "metadata": { + "total_parameters": 3212749824, + "total_size": 6425499648 + }, + "weight_map": { + "model.embed_tokens.weight": "model-00001-of-00002.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.10.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.11.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.12.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.13.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.14.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.15.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.16.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.17.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.18.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.19.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.20.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.20.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.21.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.21.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.21.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.22.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.23.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.24.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.25.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.26.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.27.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.3.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.3.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.4.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.5.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.6.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.7.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.8.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.9.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.norm.weight": "model-00002-of-00002.safetensors" + } +} diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..68b10c7f0a479eae0c358eac6a14959b3f9acdf1 --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,23 @@ +{ + "bos_token": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "eos_token": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|finetune_right_pad_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1c1d8d5c9024994f1d3b00f9662b8dd89ca13cf2 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9e4e7fb171f92fd137b777cc2714bf87d11576700a1dcd7a399e7bbe39537b +size 17209920 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e876241357e9b7a9d01ac27b79a203d26713f24e --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,2063 @@ +{ + "added_tokens_decoder": { + "128000": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128001": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128002": { + "content": "<|reserved_special_token_0|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128003": { + "content": "<|reserved_special_token_1|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128004": { + "content": "<|finetune_right_pad_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128005": { + "content": "<|reserved_special_token_2|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128006": { + "content": "<|start_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128007": { + "content": "<|end_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128008": { + "content": "<|eom_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128009": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128010": { + "content": "<|python_tag|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128011": { + "content": "<|reserved_special_token_3|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128012": { + "content": "<|reserved_special_token_4|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128013": { + "content": "<|reserved_special_token_5|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128014": { + "content": "<|reserved_special_token_6|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128015": { + "content": "<|reserved_special_token_7|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128016": { + "content": "<|reserved_special_token_8|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128017": { + "content": "<|reserved_special_token_9|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128018": { + "content": "<|reserved_special_token_10|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128019": { + "content": "<|reserved_special_token_11|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128020": { + "content": "<|reserved_special_token_12|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128021": { + "content": "<|reserved_special_token_13|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128022": { + "content": "<|reserved_special_token_14|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128023": { + "content": "<|reserved_special_token_15|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128024": { + "content": "<|reserved_special_token_16|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128025": { + "content": "<|reserved_special_token_17|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128026": { + "content": "<|reserved_special_token_18|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128027": { + "content": "<|reserved_special_token_19|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128028": { + "content": "<|reserved_special_token_20|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128029": { + "content": "<|reserved_special_token_21|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128030": { + "content": "<|reserved_special_token_22|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128031": { + "content": "<|reserved_special_token_23|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128032": { + "content": "<|reserved_special_token_24|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128033": { + "content": "<|reserved_special_token_25|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128034": { + "content": "<|reserved_special_token_26|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128035": { + "content": "<|reserved_special_token_27|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128036": { + "content": "<|reserved_special_token_28|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128037": { + "content": "<|reserved_special_token_29|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128038": { + "content": "<|reserved_special_token_30|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128039": { + "content": "<|reserved_special_token_31|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128040": { + "content": "<|reserved_special_token_32|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128041": { + "content": "<|reserved_special_token_33|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128042": { + "content": "<|reserved_special_token_34|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128043": { + "content": "<|reserved_special_token_35|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128044": { + "content": "<|reserved_special_token_36|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128045": { + "content": "<|reserved_special_token_37|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128046": { + "content": "<|reserved_special_token_38|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128047": { + "content": "<|reserved_special_token_39|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128048": { + "content": "<|reserved_special_token_40|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128049": { + "content": "<|reserved_special_token_41|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128050": { + "content": "<|reserved_special_token_42|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128051": { + "content": "<|reserved_special_token_43|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128052": { + "content": "<|reserved_special_token_44|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128053": { + "content": "<|reserved_special_token_45|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128054": { + "content": "<|reserved_special_token_46|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128055": { + "content": "<|reserved_special_token_47|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128056": { + "content": "<|reserved_special_token_48|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128057": { + "content": "<|reserved_special_token_49|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128058": { + "content": "<|reserved_special_token_50|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128059": { + "content": "<|reserved_special_token_51|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128060": { + "content": "<|reserved_special_token_52|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128061": { + "content": "<|reserved_special_token_53|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128062": { + "content": "<|reserved_special_token_54|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128063": { + "content": "<|reserved_special_token_55|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128064": { + "content": "<|reserved_special_token_56|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128065": { + "content": "<|reserved_special_token_57|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128066": { + "content": "<|reserved_special_token_58|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128067": { + "content": "<|reserved_special_token_59|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128068": { + "content": "<|reserved_special_token_60|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128069": { + "content": "<|reserved_special_token_61|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128070": { + "content": "<|reserved_special_token_62|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128071": { + "content": "<|reserved_special_token_63|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128072": { + "content": "<|reserved_special_token_64|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128073": { + "content": "<|reserved_special_token_65|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128074": { + "content": "<|reserved_special_token_66|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128075": { + "content": "<|reserved_special_token_67|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128076": { + "content": "<|reserved_special_token_68|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128077": { + "content": "<|reserved_special_token_69|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128078": { + "content": "<|reserved_special_token_70|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128079": { + "content": "<|reserved_special_token_71|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128080": { + "content": "<|reserved_special_token_72|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128081": { + "content": "<|reserved_special_token_73|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128082": { + "content": "<|reserved_special_token_74|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128083": { + "content": "<|reserved_special_token_75|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128084": { + "content": "<|reserved_special_token_76|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128085": { + "content": "<|reserved_special_token_77|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128086": { + "content": "<|reserved_special_token_78|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128087": { + "content": "<|reserved_special_token_79|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128088": { + "content": "<|reserved_special_token_80|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128089": { + "content": "<|reserved_special_token_81|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128090": { + "content": "<|reserved_special_token_82|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128091": { + "content": "<|reserved_special_token_83|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128092": { + "content": "<|reserved_special_token_84|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128093": { + "content": "<|reserved_special_token_85|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128094": { + "content": "<|reserved_special_token_86|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128095": { + "content": "<|reserved_special_token_87|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128096": { + "content": "<|reserved_special_token_88|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128097": { + "content": "<|reserved_special_token_89|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128098": { + "content": "<|reserved_special_token_90|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128099": { + "content": "<|reserved_special_token_91|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128100": { + "content": "<|reserved_special_token_92|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128101": { + "content": "<|reserved_special_token_93|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128102": { + "content": "<|reserved_special_token_94|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128103": { + "content": "<|reserved_special_token_95|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128104": { + "content": "<|reserved_special_token_96|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128105": { + "content": "<|reserved_special_token_97|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128106": { + "content": "<|reserved_special_token_98|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128107": { + "content": "<|reserved_special_token_99|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128108": { + "content": "<|reserved_special_token_100|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128109": { + "content": "<|reserved_special_token_101|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128110": { + "content": "<|reserved_special_token_102|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128111": { + "content": "<|reserved_special_token_103|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128112": { + "content": "<|reserved_special_token_104|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128113": { + "content": "<|reserved_special_token_105|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128114": { + "content": "<|reserved_special_token_106|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128115": { + "content": "<|reserved_special_token_107|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128116": { + "content": "<|reserved_special_token_108|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128117": { + "content": "<|reserved_special_token_109|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128118": { + "content": "<|reserved_special_token_110|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128119": { + "content": "<|reserved_special_token_111|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128120": { + "content": "<|reserved_special_token_112|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128121": { + "content": "<|reserved_special_token_113|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128122": { + "content": "<|reserved_special_token_114|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128123": { + "content": "<|reserved_special_token_115|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128124": { + "content": "<|reserved_special_token_116|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128125": { + "content": "<|reserved_special_token_117|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128126": { + "content": "<|reserved_special_token_118|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128127": { + "content": "<|reserved_special_token_119|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128128": { + "content": "<|reserved_special_token_120|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128129": { + "content": "<|reserved_special_token_121|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128130": { + "content": "<|reserved_special_token_122|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128131": { + "content": "<|reserved_special_token_123|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128132": { + "content": "<|reserved_special_token_124|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128133": { + "content": "<|reserved_special_token_125|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128134": { + "content": "<|reserved_special_token_126|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128135": { + "content": "<|reserved_special_token_127|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128136": { + "content": "<|reserved_special_token_128|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128137": { + "content": "<|reserved_special_token_129|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128138": { + "content": "<|reserved_special_token_130|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128139": { + "content": "<|reserved_special_token_131|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128140": { + "content": "<|reserved_special_token_132|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128141": { + "content": "<|reserved_special_token_133|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128142": { + "content": "<|reserved_special_token_134|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128143": { + "content": "<|reserved_special_token_135|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128144": { + "content": "<|reserved_special_token_136|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128145": { + "content": "<|reserved_special_token_137|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128146": { + "content": "<|reserved_special_token_138|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128147": { + "content": "<|reserved_special_token_139|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128148": { + "content": "<|reserved_special_token_140|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128149": { + "content": "<|reserved_special_token_141|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128150": { + "content": "<|reserved_special_token_142|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128151": { + "content": "<|reserved_special_token_143|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128152": { + "content": "<|reserved_special_token_144|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128153": { + "content": "<|reserved_special_token_145|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128154": { + "content": "<|reserved_special_token_146|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128155": { + "content": "<|reserved_special_token_147|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128156": { + "content": "<|reserved_special_token_148|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128157": { + "content": "<|reserved_special_token_149|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128158": { + "content": "<|reserved_special_token_150|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128159": { + "content": "<|reserved_special_token_151|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128160": { + "content": "<|reserved_special_token_152|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128161": { + "content": "<|reserved_special_token_153|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128162": { + "content": "<|reserved_special_token_154|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128163": { + "content": "<|reserved_special_token_155|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128164": { + "content": "<|reserved_special_token_156|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128165": { + "content": "<|reserved_special_token_157|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128166": { + "content": "<|reserved_special_token_158|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128167": { + "content": "<|reserved_special_token_159|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128168": { + "content": "<|reserved_special_token_160|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128169": { + "content": "<|reserved_special_token_161|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128170": { + "content": "<|reserved_special_token_162|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128171": { + "content": "<|reserved_special_token_163|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128172": { + "content": "<|reserved_special_token_164|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128173": { + "content": "<|reserved_special_token_165|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128174": { + "content": "<|reserved_special_token_166|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128175": { + "content": "<|reserved_special_token_167|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128176": { + "content": "<|reserved_special_token_168|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128177": { + "content": "<|reserved_special_token_169|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128178": { + "content": "<|reserved_special_token_170|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128179": { + "content": "<|reserved_special_token_171|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128180": { + "content": "<|reserved_special_token_172|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128181": { + "content": "<|reserved_special_token_173|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128182": { + "content": "<|reserved_special_token_174|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128183": { + "content": "<|reserved_special_token_175|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128184": { + "content": "<|reserved_special_token_176|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128185": { + "content": "<|reserved_special_token_177|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128186": { + "content": "<|reserved_special_token_178|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128187": { + "content": "<|reserved_special_token_179|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128188": { + "content": "<|reserved_special_token_180|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128189": { + "content": "<|reserved_special_token_181|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128190": { + "content": "<|reserved_special_token_182|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128191": { + "content": "<|reserved_special_token_183|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128192": { + "content": "<|reserved_special_token_184|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128193": { + "content": "<|reserved_special_token_185|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128194": { + "content": "<|reserved_special_token_186|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128195": { + "content": "<|reserved_special_token_187|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128196": { + "content": "<|reserved_special_token_188|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128197": { + "content": "<|reserved_special_token_189|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128198": { + "content": "<|reserved_special_token_190|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128199": { + "content": "<|reserved_special_token_191|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128200": { + "content": "<|reserved_special_token_192|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128201": { + "content": "<|reserved_special_token_193|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128202": { + "content": "<|reserved_special_token_194|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128203": { + "content": "<|reserved_special_token_195|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128204": { + "content": "<|reserved_special_token_196|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128205": { + "content": "<|reserved_special_token_197|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128206": { + "content": "<|reserved_special_token_198|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128207": { + "content": "<|reserved_special_token_199|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128208": { + "content": "<|reserved_special_token_200|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128209": { + "content": "<|reserved_special_token_201|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128210": { + "content": "<|reserved_special_token_202|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128211": { + "content": "<|reserved_special_token_203|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128212": { + "content": "<|reserved_special_token_204|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128213": { + "content": "<|reserved_special_token_205|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128214": { + "content": "<|reserved_special_token_206|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128215": { + "content": "<|reserved_special_token_207|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128216": { + "content": "<|reserved_special_token_208|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128217": { + "content": "<|reserved_special_token_209|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128218": { + "content": "<|reserved_special_token_210|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128219": { + "content": "<|reserved_special_token_211|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128220": { + "content": "<|reserved_special_token_212|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128221": { + "content": "<|reserved_special_token_213|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128222": { + "content": "<|reserved_special_token_214|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128223": { + "content": "<|reserved_special_token_215|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128224": { + "content": "<|reserved_special_token_216|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128225": { + "content": "<|reserved_special_token_217|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128226": { + "content": "<|reserved_special_token_218|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128227": { + "content": "<|reserved_special_token_219|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128228": { + "content": "<|reserved_special_token_220|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128229": { + "content": "<|reserved_special_token_221|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128230": { + "content": "<|reserved_special_token_222|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128231": { + "content": "<|reserved_special_token_223|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128232": { + "content": "<|reserved_special_token_224|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128233": { + "content": "<|reserved_special_token_225|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128234": { + "content": "<|reserved_special_token_226|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128235": { + "content": "<|reserved_special_token_227|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128236": { + "content": "<|reserved_special_token_228|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128237": { + "content": "<|reserved_special_token_229|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128238": { + "content": "<|reserved_special_token_230|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128239": { + "content": "<|reserved_special_token_231|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128240": { + "content": "<|reserved_special_token_232|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128241": { + "content": "<|reserved_special_token_233|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128242": { + "content": "<|reserved_special_token_234|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128243": { + "content": "<|reserved_special_token_235|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128244": { + "content": "<|reserved_special_token_236|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128245": { + "content": "<|reserved_special_token_237|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128246": { + "content": "<|reserved_special_token_238|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128247": { + "content": "<|reserved_special_token_239|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128248": { + "content": "<|reserved_special_token_240|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128249": { + "content": "<|reserved_special_token_241|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128250": { + "content": "<|reserved_special_token_242|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128251": { + "content": "<|reserved_special_token_243|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128252": { + "content": "<|reserved_special_token_244|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128253": { + "content": "<|reserved_special_token_245|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128254": { + "content": "<|reserved_special_token_246|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128255": { + "content": "<|reserved_special_token_247|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + } + }, + "bos_token": "<|begin_of_text|>", + "clean_up_tokenization_spaces": true, + "eos_token": "<|end_of_text|>", + "extra_special_tokens": {}, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 131072, + "pad_token": "<|finetune_right_pad_id|>", + "tokenizer_class": "PreTrainedTokenizerFast" +} diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..04285aca1175741e2ccf42f80d38ae8c1a3c7800 --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b50e110bea2cc8ea6f214573221d89a6f808a946a2fc9f68cfcdd88b873f24f +size 7313