Upload 15 files
Browse files- agent_cppo_100_epochs_20k_steps.pth +3 -0
- agent_cppo_20_epochs_20k_steps.pth +3 -0
- agent_cppo_deepseek_100_epochs_20k_steps.pth +3 -0
- agent_cppo_deepseek_100_epochs_20k_steps_01.pth +3 -0
- agent_cppo_deepseek_100_epochs_20k_steps_1.pth +3 -0
- agent_cppo_llama_20_epochs_20k_steps.pth +3 -0
- agent_deepseek_20_epochs_20k_steps.pth +3 -0
- agent_ppo_100_epochs_20k_steps.pth +3 -0
- agent_ppo_20_epochs_20k_steps.pth +3 -0
- agent_ppo_deepseek_100_epochs_20k_steps.pth +3 -0
- agent_ppo_deepseek_100_epochs_20k_steps_01.pth +3 -0
- agent_ppo_deepseek_100_epochs_20k_steps_1.pth +3 -0
- agent_ppo_deepseek_20_epochs_20k_steps.pth +3 -0
- agent_ppo_llama_100_epochs_20k_steps.pth +3 -0
- agent_ppo_llama_20_epochs_20k_steps.pth +3 -0
agent_cppo_100_epochs_20k_steps.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7017d10df45958f1a09ee8e009d8c99346be867ff312b03876ed1b8cfb289b1
|
3 |
+
size 5730119
|
agent_cppo_20_epochs_20k_steps.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c9771b11a99c389877c35317ef7d542208a35264c47051ce460791e207ec985
|
3 |
+
size 5730102
|
agent_cppo_deepseek_100_epochs_20k_steps.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8dc3e1cc247a16c258d6940644008f3a491f0dd962145d37659a66c55b99d44
|
3 |
+
size 6418400
|
agent_cppo_deepseek_100_epochs_20k_steps_01.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:672fa6bfc0e656f724833fac2046f04f5598fd9a87a1ea457bcaf9b1a2edcda0
|
3 |
+
size 6418349
|
agent_cppo_deepseek_100_epochs_20k_steps_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0995acb84653b5ffbfaab13fed295ff1efa8443df66f6dfe80e0ac82280fe53d
|
3 |
+
size 6418519
|
agent_cppo_llama_20_epochs_20k_steps.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9f0fb6fe944f01a6f5e38c6fe6a1e92369b92252e29ed16101766e92b9d8087
|
3 |
+
size 6418332
|
agent_deepseek_20_epochs_20k_steps.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98d4c116d6e17ade1ed6710488446c3d10fe01fbd7350974bbf146641868b693
|
3 |
+
size 6418298
|
agent_ppo_100_epochs_20k_steps.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f138a91c36e0b88b27d58bf41549de24717aec48e7107641f3dfa1838b51177b
|
3 |
+
size 5730102
|
agent_ppo_20_epochs_20k_steps.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:238632dc96b40aa21a3993e1cac90578b7f84ea8e6811aebcfc4cbf3ac37443e
|
3 |
+
size 5730085
|
agent_ppo_deepseek_100_epochs_20k_steps.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae05dd713d1c0e8a880daad0a3be49db0314c50211805272f8a61dd84794ef84
|
3 |
+
size 6074319
|
agent_ppo_deepseek_100_epochs_20k_steps_01.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0969fc0b9d4c49aa816b2ec88dd321ffa619d765df27d79ef8975797747b8d5b
|
3 |
+
size 6074370
|
agent_ppo_deepseek_100_epochs_20k_steps_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f54f756654dc9a23c9c6fe6836a0be5ac03cc1fecf8952f020e58f63291fb8c
|
3 |
+
size 6074540
|
agent_ppo_deepseek_20_epochs_20k_steps.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e799bdf91c48654b4e7a0f3c090abff69b45a5ec88f592511c1dd34bc446d41
|
3 |
+
size 6074302
|
agent_ppo_llama_100_epochs_20k_steps.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06a1dbc0e65a7868c9c98db19c53311fc23ffc954faab3b913df4f4c05aa7cd9
|
3 |
+
size 6074268
|
agent_ppo_llama_20_epochs_20k_steps.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67c515df96ed32e57a37566d86c3547c63987d9e758ebe2984749a6f771cedfe
|
3 |
+
size 6074251
|