Upload folder using huggingface_hub
Browse files
- README.md +1 -1
- replay.mp4 +2 -2
- sf_log.txt +82 -0
README.md
CHANGED
@@ -15,7 +15,7 @@ model-index:
|
|
15 |
type: doom_health_gathering_supreme
|
16 |
metrics:
|
17 |
- type: mean_reward
|
18 |
-
value: 3.
|
19 |
name: mean_reward
|
20 |
verified: false
|
21 |
---
|
|
|
15 |
type: doom_health_gathering_supreme
|
16 |
metrics:
|
17 |
- type: mean_reward
|
18 |
+
value: 3.97 +/- 0.86
|
19 |
name: mean_reward
|
20 |
verified: false
|
21 |
---
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a549007a1480ea6dd428a375c9b56de16c0ca8c8ffd505c0e983c3953b63f755
|
3 |
+
size 6158905
|
sf_log.txt
CHANGED
@@ -1696,3 +1696,85 @@ main_loop: 1200.1674
|
|
1696 |
[2025-08-17 21:19:25,200][08154] Avg episode rewards: #0: 4.013, true rewards: #0: 3.813
|
1697 |
[2025-08-17 21:19:25,201][08154] Avg episode reward: 4.013, avg true_objective: 3.813
|
1698 |
[2025-08-17 21:19:30,114][08154] Replay video saved to /home/dmin/HuggingFace/notebooks/unit8/part_2/train_dir/default_experiment/replay.mp4!
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1696 |
[2025-08-17 21:19:25,200][08154] Avg episode rewards: #0: 4.013, true rewards: #0: 3.813
|
1697 |
[2025-08-17 21:19:25,201][08154] Avg episode reward: 4.013, avg true_objective: 3.813
|
1698 |
[2025-08-17 21:19:30,114][08154] Replay video saved to /home/dmin/HuggingFace/notebooks/unit8/part_2/train_dir/default_experiment/replay.mp4!
|
1699 |
+
[2025-08-17 21:19:35,417][08154] The model has been pushed to https://huggingface.co/LizardAPN/rl_course_vizdoom_health_gathering_supreme
|
1700 |
+
[2025-08-17 21:20:16,176][08154] Loading existing experiment configuration from /home/dmin/HuggingFace/notebooks/unit8/part_2/train_dir/default_experiment/config.json
|
1701 |
+
[2025-08-17 21:20:16,177][08154] Overriding arg 'num_workers' with value 4 passed from command line
|
1702 |
+
[2025-08-17 21:20:16,178][08154] Adding new argument 'no_render'=True that is not in the saved config file!
|
1703 |
+
[2025-08-17 21:20:16,179][08154] Adding new argument 'save_video'=True that is not in the saved config file!
|
1704 |
+
[2025-08-17 21:20:16,180][08154] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file!
|
1705 |
+
[2025-08-17 21:20:16,181][08154] Adding new argument 'video_name'=None that is not in the saved config file!
|
1706 |
+
[2025-08-17 21:20:16,182][08154] Adding new argument 'max_num_frames'=100000 that is not in the saved config file!
|
1707 |
+
[2025-08-17 21:20:16,183][08154] Adding new argument 'max_num_episodes'=10 that is not in the saved config file!
|
1708 |
+
[2025-08-17 21:20:16,184][08154] Adding new argument 'push_to_hub'=True that is not in the saved config file!
|
1709 |
+
[2025-08-17 21:20:16,185][08154] Adding new argument 'hf_repository'='LizardAPN/rl_course_vizdoom_health_gathering_supreme' that is not in the saved config file!
|
1710 |
+
[2025-08-17 21:20:16,186][08154] Adding new argument 'policy_index'=0 that is not in the saved config file!
|
1711 |
+
[2025-08-17 21:20:16,186][08154] Adding new argument 'eval_deterministic'=False that is not in the saved config file!
|
1712 |
+
[2025-08-17 21:20:16,188][08154] Adding new argument 'train_script'=None that is not in the saved config file!
|
1713 |
+
[2025-08-17 21:20:16,189][08154] Adding new argument 'enjoy_script'=None that is not in the saved config file!
|
1714 |
+
[2025-08-17 21:20:16,190][08154] Using frameskip 1 and render_action_repeat=4 for evaluation
|
1715 |
+
[2025-08-17 21:20:16,211][08154] RunningMeanStd input shape: (3, 72, 128)
|
1716 |
+
[2025-08-17 21:20:16,213][08154] RunningMeanStd input shape: (1,)
|
1717 |
+
[2025-08-17 21:20:16,245][08154] ConvEncoder: input_channels=3
|
1718 |
+
[2025-08-17 21:20:16,294][08154] Conv encoder output size: 512
|
1719 |
+
[2025-08-17 21:20:16,295][08154] Policy head output size: 512
|
1720 |
+
[2025-08-17 21:20:16,330][08154] Loading state from checkpoint /home/dmin/HuggingFace/notebooks/unit8/part_2/train_dir/default_experiment/checkpoint_p0/checkpoint_000000000_0.pth...
|
1721 |
+
[2025-08-17 21:20:16,820][08154] Num frames 100...
|
1722 |
+
[2025-08-17 21:20:17,032][08154] Num frames 200...
|
1723 |
+
[2025-08-17 21:20:17,186][08154] Num frames 300...
|
1724 |
+
[2025-08-17 21:20:17,379][08154] Avg episode rewards: #0: 3.840, true rewards: #0: 3.840
|
1725 |
+
[2025-08-17 21:20:17,381][08154] Avg episode reward: 3.840, avg true_objective: 3.840
|
1726 |
+
[2025-08-17 21:20:17,408][08154] Num frames 400...
|
1727 |
+
[2025-08-17 21:20:17,610][08154] Num frames 500...
|
1728 |
+
[2025-08-17 21:20:17,779][08154] Num frames 600...
|
1729 |
+
[2025-08-17 21:20:17,942][08154] Num frames 700...
|
1730 |
+
[2025-08-17 21:20:18,102][08154] Num frames 800...
|
1731 |
+
[2025-08-17 21:20:18,211][08154] Avg episode rewards: #0: 4.660, true rewards: #0: 4.160
|
1732 |
+
[2025-08-17 21:20:18,212][08154] Avg episode reward: 4.660, avg true_objective: 4.160
|
1733 |
+
[2025-08-17 21:20:18,336][08154] Num frames 900...
|
1734 |
+
[2025-08-17 21:20:18,516][08154] Num frames 1000...
|
1735 |
+
[2025-08-17 21:20:18,679][08154] Num frames 1100...
|
1736 |
+
[2025-08-17 21:20:18,846][08154] Num frames 1200...
|
1737 |
+
[2025-08-17 21:20:18,928][08154] Avg episode rewards: #0: 4.387, true rewards: #0: 4.053
|
1738 |
+
[2025-08-17 21:20:18,929][08154] Avg episode reward: 4.387, avg true_objective: 4.053
|
1739 |
+
[2025-08-17 21:20:19,095][08154] Num frames 1300...
|
1740 |
+
[2025-08-17 21:20:19,298][08154] Num frames 1400...
|
1741 |
+
[2025-08-17 21:20:19,499][08154] Num frames 1500...
|
1742 |
+
[2025-08-17 21:20:19,669][08154] Num frames 1600...
|
1743 |
+
[2025-08-17 21:20:19,855][08154] Num frames 1700...
|
1744 |
+
[2025-08-17 21:20:20,021][08154] Avg episode rewards: #0: 5.150, true rewards: #0: 4.400
|
1745 |
+
[2025-08-17 21:20:20,022][08154] Avg episode reward: 5.150, avg true_objective: 4.400
|
1746 |
+
[2025-08-17 21:20:20,107][08154] Num frames 1800...
|
1747 |
+
[2025-08-17 21:20:20,299][08154] Num frames 1900...
|
1748 |
+
[2025-08-17 21:20:20,495][08154] Num frames 2000...
|
1749 |
+
[2025-08-17 21:20:20,584][08154] Avg episode rewards: #0: 4.632, true rewards: #0: 4.032
|
1750 |
+
[2025-08-17 21:20:20,585][08154] Avg episode reward: 4.632, avg true_objective: 4.032
|
1751 |
+
[2025-08-17 21:20:20,732][08154] Num frames 2100...
|
1752 |
+
[2025-08-17 21:20:20,918][08154] Num frames 2200...
|
1753 |
+
[2025-08-17 21:20:21,101][08154] Avg episode rewards: #0: 4.287, true rewards: #0: 3.787
|
1754 |
+
[2025-08-17 21:20:21,102][08154] Avg episode reward: 4.287, avg true_objective: 3.787
|
1755 |
+
[2025-08-17 21:20:21,157][08154] Num frames 2300...
|
1756 |
+
[2025-08-17 21:20:21,334][08154] Num frames 2400...
|
1757 |
+
[2025-08-17 21:20:21,506][08154] Num frames 2500...
|
1758 |
+
[2025-08-17 21:20:21,685][08154] Num frames 2600...
|
1759 |
+
[2025-08-17 21:20:21,860][08154] Num frames 2700...
|
1760 |
+
[2025-08-17 21:20:21,951][08154] Avg episode rewards: #0: 4.457, true rewards: #0: 3.886
|
1761 |
+
[2025-08-17 21:20:21,951][08154] Avg episode reward: 4.457, avg true_objective: 3.886
|
1762 |
+
[2025-08-17 21:20:22,085][08154] Num frames 2800...
|
1763 |
+
[2025-08-17 21:20:22,259][08154] Num frames 2900...
|
1764 |
+
[2025-08-17 21:20:22,430][08154] Num frames 3000...
|
1765 |
+
[2025-08-17 21:20:22,631][08154] Num frames 3100...
|
1766 |
+
[2025-08-17 21:20:22,695][08154] Avg episode rewards: #0: 4.380, true rewards: #0: 3.880
|
1767 |
+
[2025-08-17 21:20:22,696][08154] Avg episode reward: 4.380, avg true_objective: 3.880
|
1768 |
+
[2025-08-17 21:20:22,891][08154] Num frames 3200...
|
1769 |
+
[2025-08-17 21:20:23,094][08154] Num frames 3300...
|
1770 |
+
[2025-08-17 21:20:23,269][08154] Num frames 3400...
|
1771 |
+
[2025-08-17 21:20:23,466][08154] Avg episode rewards: #0: 4.320, true rewards: #0: 3.876
|
1772 |
+
[2025-08-17 21:20:23,467][08154] Avg episode reward: 4.320, avg true_objective: 3.876
|
1773 |
+
[2025-08-17 21:20:23,492][08154] Num frames 3500...
|
1774 |
+
[2025-08-17 21:20:23,653][08154] Num frames 3600...
|
1775 |
+
[2025-08-17 21:20:23,813][08154] Num frames 3700...
|
1776 |
+
[2025-08-17 21:20:23,970][08154] Num frames 3800...
|
1777 |
+
[2025-08-17 21:20:24,129][08154] Num frames 3900...
|
1778 |
+
[2025-08-17 21:20:24,306][08154] Avg episode rewards: #0: 4.468, true rewards: #0: 3.968
|
1779 |
+
[2025-08-17 21:20:24,307][08154] Avg episode reward: 4.468, avg true_objective: 3.968
|
1780 |
+
[2025-08-17 21:20:29,751][08154] Replay video saved to /home/dmin/HuggingFace/notebooks/unit8/part_2/train_dir/default_experiment/replay.mp4!
|