Update README.md
Browse files
README.md
CHANGED
@@ -3,6 +3,10 @@ license: mit
|
|
3 |
tags:
|
4 |
- text-game
|
5 |
- world-model
|
|
|
|
|
|
|
|
|
6 |
---
|
7 |
|
8 |
See https://github.com/thuml/RLVR-World for examples of how to use this model.
|
@@ -15,4 +19,4 @@ See https://github.com/thuml/RLVR-World for examples for using this model.
|
|
15 |
author={Jialong Wu and Shaofeng Yin and Ningya Feng and Mingsheng Long},
|
16 |
journal={arXiv preprint arXiv:2505.13934},
|
17 |
year={2025},
|
18 |
-
}
|
|
|
3 |
tags:
|
4 |
- text-game
|
5 |
- world-model
|
6 |
+
datasets:
|
7 |
+
- thuml/bytesized32-world-model-cot
|
8 |
+
base_model:
|
9 |
+
- deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
|
10 |
---
|
11 |
|
12 |
See https://github.com/thuml/RLVR-World for examples of how to use this model.
|
|
|
19 |
author={Jialong Wu and Shaofeng Yin and Ningya Feng and Mingsheng Long},
|
20 |
journal={arXiv preprint arXiv:2505.13934},
|
21 |
year={2025},
|
22 |
+
}
|