Upload folder using huggingface_hub
Browse files
.summary/0/events.out.tfevents.1688878853.snowflake
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:440f3682432896f32d41a122192825803e3ee49b39e95ec081ddda42a7105474
|
3 |
+
size 4526
|
.summary/0/events.out.tfevents.1688879192.snowflake
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34e11fa2e82dffd054eaec8e49fef1ca9028159b42f5eb78b05f554c8e50e21c
|
3 |
+
size 16844
|
README.md
CHANGED
@@ -15,7 +15,7 @@ model-index:
|
|
15 |
type: doom_health_gathering_supreme
|
16 |
metrics:
|
17 |
- type: mean_reward
|
18 |
-
value: 3.
|
19 |
name: mean_reward
|
20 |
verified: false
|
21 |
---
|
|
|
15 |
type: doom_health_gathering_supreme
|
16 |
metrics:
|
17 |
- type: mean_reward
|
18 |
+
value: 3.94 +/- 0.61
|
19 |
name: mean_reward
|
20 |
verified: false
|
21 |
---
|
checkpoint_p0/checkpoint_000000000_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f546634a38180cb4a57aec199213e3b845b90a5ebb8206ddaa081c2c9d4ba854
|
3 |
+
size 41231900
|
checkpoint_p0/checkpoint_000466273_3819708416.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad911b64da964df63b10a6c450dbf67193cd2e4eb0163db5a9e46fa8946e6efb
|
3 |
+
size 41232964
|
config.json
CHANGED
@@ -63,7 +63,7 @@
|
|
63 |
"summaries_use_frameskip": true,
|
64 |
"heartbeat_interval": 10,
|
65 |
"heartbeat_reporting_interval": 300,
|
66 |
-
"train_for_env_steps":
|
67 |
"train_for_seconds": 1000000,
|
68 |
"save_every_sec": 120,
|
69 |
"keep_checkpoints": 2,
|
@@ -130,8 +130,8 @@
|
|
130 |
"cli_args": {},
|
131 |
"git_hash": "0401714b01ee832562a0930e3744117f1ba51e10",
|
132 |
"git_repo_name": "https://github.com/tenkara/HF-DeepRL.git",
|
133 |
-
"command_line": "--env=doom_health_gathering_supreme --train_for_env_steps=
|
134 |
-
"env_gpu_observations": true,
|
135 |
"lr_adaptive_min": 1e-06,
|
136 |
-
"lr_adaptive_max": 0.01
|
|
|
137 |
}
|
|
|
63 |
"summaries_use_frameskip": true,
|
64 |
"heartbeat_interval": 10,
|
65 |
"heartbeat_reporting_interval": 300,
|
66 |
+
"train_for_env_steps": 20,
|
67 |
"train_for_seconds": 1000000,
|
68 |
"save_every_sec": 120,
|
69 |
"keep_checkpoints": 2,
|
|
|
130 |
"cli_args": {},
|
131 |
"git_hash": "0401714b01ee832562a0930e3744117f1ba51e10",
|
132 |
"git_repo_name": "https://github.com/tenkara/HF-DeepRL.git",
|
133 |
+
"command_line": "--env=doom_health_gathering_supreme --train_for_env_steps=20",
|
|
|
134 |
"lr_adaptive_min": 1e-06,
|
135 |
+
"lr_adaptive_max": 0.01,
|
136 |
+
"env_gpu_observations": true
|
137 |
}
|
git.diff
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8b97eeeb6021f14696de0a65f48c22164dbc358a9a63500114e3970e8a301d7
|
3 |
+
size 211342672
|
sf_log.txt
CHANGED
@@ -701,3 +701,278 @@ Compile with `TORCH_USE_CUDA_DSA` to enable device-side assertions.
|
|
701 |
[2023-07-08 22:48:57,115][18621] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000000000_0.pth...
|
702 |
[2023-07-08 22:48:57,152][18621] Stopping LearnerWorker_p0...
|
703 |
[2023-07-08 22:48:57,152][18621] Loop learner_proc0_evt_loop terminating...
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
701 |
[2023-07-08 22:48:57,115][18621] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000000000_0.pth...
|
702 |
[2023-07-08 22:48:57,152][18621] Stopping LearnerWorker_p0...
|
703 |
[2023-07-08 22:48:57,152][18621] Loop learner_proc0_evt_loop terminating...
|
704 |
+
[2023-07-08 23:01:01,233][19220] Using GPUs [0] for process 0 (actually maps to GPUs [0])
|
705 |
+
[2023-07-08 23:01:01,234][19220] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0
|
706 |
+
[2023-07-08 23:01:01,277][19220] Num visible devices: 1
|
707 |
+
[2023-07-08 23:01:01,412][19220] Setting fixed seed 42
|
708 |
+
[2023-07-08 23:01:01,412][19220] Using GPUs [0] for process 0 (actually maps to GPUs [0])
|
709 |
+
[2023-07-08 23:01:01,412][19220] Initializing actor-critic model on device cuda:0
|
710 |
+
[2023-07-08 23:01:01,413][19220] RunningMeanStd input shape: (3, 72, 128)
|
711 |
+
[2023-07-08 23:01:01,413][19220] RunningMeanStd input shape: (1,)
|
712 |
+
[2023-07-08 23:01:01,420][19220] ConvEncoder: input_channels=3
|
713 |
+
[2023-07-08 23:01:01,502][19241] Worker 0 uses CPU cores [0]
|
714 |
+
[2023-07-08 23:01:01,550][19242] Worker 2 uses CPU cores [2]
|
715 |
+
[2023-07-08 23:01:01,609][19243] Worker 1 uses CPU cores [1]
|
716 |
+
[2023-07-08 23:01:01,648][19244] Worker 3 uses CPU cores [3]
|
717 |
+
[2023-07-08 23:01:01,649][19240] Using GPUs [0] for process 0 (actually maps to GPUs [0])
|
718 |
+
[2023-07-08 23:01:01,649][19240] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0
|
719 |
+
[2023-07-08 23:01:01,737][19240] Num visible devices: 1
|
720 |
+
[2023-07-08 23:01:01,782][19246] Worker 4 uses CPU cores [0]
|
721 |
+
[2023-07-08 23:01:01,741][19220] Conv encoder output size: 512
|
722 |
+
[2023-07-08 23:01:01,787][19220] Policy head output size: 512
|
723 |
+
[2023-07-08 23:01:01,794][19252] Worker 11 uses CPU cores [3]
|
724 |
+
[2023-07-08 23:01:01,800][19250] Worker 9 uses CPU cores [1]
|
725 |
+
[2023-07-08 23:01:01,807][19220] Created Actor Critic model with architecture:
|
726 |
+
[2023-07-08 23:01:01,831][19248] Worker 7 uses CPU cores [3]
|
727 |
+
[2023-07-08 23:01:01,849][19249] Worker 8 uses CPU cores [0]
|
728 |
+
[2023-07-08 23:01:01,862][19251] Worker 10 uses CPU cores [2]
|
729 |
+
[2023-07-08 23:01:01,891][19220] ActorCriticSharedWeights(
|
730 |
+
(obs_normalizer): ObservationNormalizer(
|
731 |
+
(running_mean_std): RunningMeanStdDictInPlace(
|
732 |
+
(running_mean_std): ModuleDict(
|
733 |
+
(obs): RunningMeanStdInPlace()
|
734 |
+
)
|
735 |
+
)
|
736 |
+
)
|
737 |
+
(returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace)
|
738 |
+
(encoder): VizdoomEncoder(
|
739 |
+
(basic_encoder): ConvEncoder(
|
740 |
+
(enc): RecursiveScriptModule(
|
741 |
+
original_name=ConvEncoderImpl
|
742 |
+
(conv_head): RecursiveScriptModule(
|
743 |
+
original_name=Sequential
|
744 |
+
(0): RecursiveScriptModule(original_name=Conv2d)
|
745 |
+
(1): RecursiveScriptModule(original_name=ReLU)
|
746 |
+
(2): RecursiveScriptModule(original_name=Conv2d)
|
747 |
+
(3): RecursiveScriptModule(original_name=ReLU)
|
748 |
+
(4): RecursiveScriptModule(original_name=Conv2d)
|
749 |
+
(5): RecursiveScriptModule(original_name=ReLU)
|
750 |
+
)
|
751 |
+
(mlp_layers): RecursiveScriptModule(
|
752 |
+
original_name=Sequential
|
753 |
+
(0): RecursiveScriptModule(original_name=Linear)
|
754 |
+
(1): RecursiveScriptModule(original_name=ReLU)
|
755 |
+
)
|
756 |
+
)
|
757 |
+
)
|
758 |
+
)
|
759 |
+
(core): ModelCoreRNN(
|
760 |
+
(core): LSTM(512, 512)
|
761 |
+
)
|
762 |
+
(decoder): MlpDecoder(
|
763 |
+
(mlp): Identity()
|
764 |
+
)
|
765 |
+
(critic_linear): Linear(in_features=512, out_features=1, bias=True)
|
766 |
+
(action_parameterization): ActionParameterizationDefault(
|
767 |
+
(distribution_linear): Linear(in_features=512, out_features=5, bias=True)
|
768 |
+
)
|
769 |
+
)
|
770 |
+
[2023-07-08 23:01:01,903][19253] Worker 12 uses CPU cores [0]
|
771 |
+
[2023-07-08 23:01:01,925][19247] Worker 6 uses CPU cores [2]
|
772 |
+
[2023-07-08 23:01:01,943][19254] Worker 13 uses CPU cores [1]
|
773 |
+
[2023-07-08 23:01:01,967][19256] Worker 15 uses CPU cores [3]
|
774 |
+
[2023-07-08 23:01:01,975][19259] Worker 18 uses CPU cores [2]
|
775 |
+
[2023-07-08 23:01:01,991][19255] Worker 14 uses CPU cores [2]
|
776 |
+
[2023-07-08 23:01:02,001][19257] Worker 16 uses CPU cores [0]
|
777 |
+
[2023-07-08 23:01:02,021][19260] Worker 19 uses CPU cores [3]
|
778 |
+
[2023-07-08 23:01:02,041][19245] Worker 5 uses CPU cores [1]
|
779 |
+
[2023-07-08 23:01:02,052][19258] Worker 17 uses CPU cores [1]
|
780 |
+
[2023-07-08 23:01:02,219][19220] Using optimizer <class 'torch.optim.adam.Adam'>
|
781 |
+
[2023-07-08 23:01:02,220][19220] No checkpoints found
|
782 |
+
[2023-07-08 23:01:02,220][19220] Did not load from checkpoint, starting from scratch!
|
783 |
+
[2023-07-08 23:01:02,220][19220] Initialized policy 0 weights for model version 0
|
784 |
+
[2023-07-08 23:01:02,223][19220] Using GPUs [0] for process 0 (actually maps to GPUs [0])
|
785 |
+
[2023-07-08 23:01:02,236][19220] LearnerWorker_p0 finished initialization!
|
786 |
+
[2023-07-08 23:01:02,356][19240] Unhandled exception CUDA error: OS call failed or operation not supported on this OS
|
787 |
+
CUDA kernel errors might be asynchronously reported at some other API call, so the stacktrace below might be incorrect.
|
788 |
+
For debugging consider passing CUDA_LAUNCH_BLOCKING=1.
|
789 |
+
Compile with `TORCH_USE_CUDA_DSA` to enable device-side assertions.
|
790 |
+
in evt loop inference_proc0-0_evt_loop
|
791 |
+
[2023-07-08 23:02:53,735][19220] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000000000_0.pth...
|
792 |
+
[2023-07-08 23:04:53,736][19220] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000000000_0.pth...
|
793 |
+
[2023-07-08 23:05:29,863][19259] Stopping RolloutWorker_w18...
|
794 |
+
[2023-07-08 23:05:29,864][19259] Loop rollout_proc18_evt_loop terminating...
|
795 |
+
[2023-07-08 23:05:29,864][19260] Stopping RolloutWorker_w19...
|
796 |
+
[2023-07-08 23:05:29,864][19260] Loop rollout_proc19_evt_loop terminating...
|
797 |
+
[2023-07-08 23:05:29,872][19252] Stopping RolloutWorker_w11...
|
798 |
+
[2023-07-08 23:05:29,872][19249] Stopping RolloutWorker_w8...
|
799 |
+
[2023-07-08 23:05:29,872][19251] Stopping RolloutWorker_w10...
|
800 |
+
[2023-07-08 23:05:29,872][19252] Loop rollout_proc11_evt_loop terminating...
|
801 |
+
[2023-07-08 23:05:29,872][19249] Loop rollout_proc8_evt_loop terminating...
|
802 |
+
[2023-07-08 23:05:29,872][19251] Loop rollout_proc10_evt_loop terminating...
|
803 |
+
[2023-07-08 23:05:29,882][19255] Stopping RolloutWorker_w14...
|
804 |
+
[2023-07-08 23:05:29,882][19248] Stopping RolloutWorker_w7...
|
805 |
+
[2023-07-08 23:05:29,882][19257] Stopping RolloutWorker_w16...
|
806 |
+
[2023-07-08 23:05:29,882][19255] Loop rollout_proc14_evt_loop terminating...
|
807 |
+
[2023-07-08 23:05:29,882][19248] Loop rollout_proc7_evt_loop terminating...
|
808 |
+
[2023-07-08 23:05:29,882][19257] Loop rollout_proc16_evt_loop terminating...
|
809 |
+
[2023-07-08 23:05:29,882][19220] Stopping Batcher_0...
|
810 |
+
[2023-07-08 23:05:29,883][19220] Loop batcher_evt_loop terminating...
|
811 |
+
[2023-07-08 23:05:29,892][19244] Stopping RolloutWorker_w3...
|
812 |
+
[2023-07-08 23:05:29,892][19241] Stopping RolloutWorker_w0...
|
813 |
+
[2023-07-08 23:05:29,892][19244] Loop rollout_proc3_evt_loop terminating...
|
814 |
+
[2023-07-08 23:05:29,892][19241] Loop rollout_proc0_evt_loop terminating...
|
815 |
+
[2023-07-08 23:05:29,892][19220] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000000000_0.pth...
|
816 |
+
[2023-07-08 23:05:29,895][19256] Stopping RolloutWorker_w15...
|
817 |
+
[2023-07-08 23:05:29,895][19247] Stopping RolloutWorker_w6...
|
818 |
+
[2023-07-08 23:05:29,895][19256] Loop rollout_proc15_evt_loop terminating...
|
819 |
+
[2023-07-08 23:05:29,896][19253] Stopping RolloutWorker_w12...
|
820 |
+
[2023-07-08 23:05:29,896][19247] Loop rollout_proc6_evt_loop terminating...
|
821 |
+
[2023-07-08 23:05:29,896][19253] Loop rollout_proc12_evt_loop terminating...
|
822 |
+
[2023-07-08 23:05:29,901][19246] Stopping RolloutWorker_w4...
|
823 |
+
[2023-07-08 23:05:29,902][19246] Loop rollout_proc4_evt_loop terminating...
|
824 |
+
[2023-07-08 23:05:29,903][19242] Stopping RolloutWorker_w2...
|
825 |
+
[2023-07-08 23:05:29,905][19242] Loop rollout_proc2_evt_loop terminating...
|
826 |
+
[2023-07-08 23:05:29,956][19220] Stopping LearnerWorker_p0...
|
827 |
+
[2023-07-08 23:05:29,956][19220] Loop learner_proc0_evt_loop terminating...
|
828 |
+
[2023-07-08 23:05:30,040][19250] Stopping RolloutWorker_w9...
|
829 |
+
[2023-07-08 23:05:30,041][19250] Loop rollout_proc9_evt_loop terminating...
|
830 |
+
[2023-07-08 23:05:30,042][19254] Stopping RolloutWorker_w13...
|
831 |
+
[2023-07-08 23:05:30,042][19254] Loop rollout_proc13_evt_loop terminating...
|
832 |
+
[2023-07-08 23:05:30,052][19245] Stopping RolloutWorker_w5...
|
833 |
+
[2023-07-08 23:05:30,052][19245] Loop rollout_proc5_evt_loop terminating...
|
834 |
+
[2023-07-08 23:05:30,062][19258] Stopping RolloutWorker_w17...
|
835 |
+
[2023-07-08 23:05:30,062][19258] Loop rollout_proc17_evt_loop terminating...
|
836 |
+
[2023-07-08 23:05:30,072][19243] Stopping RolloutWorker_w1...
|
837 |
+
[2023-07-08 23:05:30,072][19243] Loop rollout_proc1_evt_loop terminating...
|
838 |
+
[2023-07-08 23:06:39,079][19475] Using GPUs [0] for process 0 (actually maps to GPUs [0])
|
839 |
+
[2023-07-08 23:06:39,079][19475] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0
|
840 |
+
[2023-07-08 23:06:39,116][19475] Num visible devices: 1
|
841 |
+
[2023-07-08 23:06:39,240][19475] Setting fixed seed 42
|
842 |
+
[2023-07-08 23:06:39,241][19475] Using GPUs [0] for process 0 (actually maps to GPUs [0])
|
843 |
+
[2023-07-08 23:06:39,241][19475] Initializing actor-critic model on device cuda:0
|
844 |
+
[2023-07-08 23:06:39,241][19475] RunningMeanStd input shape: (3, 72, 128)
|
845 |
+
[2023-07-08 23:06:39,242][19475] RunningMeanStd input shape: (1,)
|
846 |
+
[2023-07-08 23:06:39,248][19475] ConvEncoder: input_channels=3
|
847 |
+
[2023-07-08 23:06:39,280][19499] Worker 3 uses CPU cores [3]
|
848 |
+
[2023-07-08 23:06:39,412][19496] Using GPUs [0] for process 0 (actually maps to GPUs [0])
|
849 |
+
[2023-07-08 23:06:39,412][19496] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0
|
850 |
+
[2023-07-08 23:06:39,470][19496] Num visible devices: 1
|
851 |
+
[2023-07-08 23:06:39,462][19500] Worker 4 uses CPU cores [0]
|
852 |
+
[2023-07-08 23:06:39,527][19495] Worker 0 uses CPU cores [0]
|
853 |
+
[2023-07-08 23:06:39,541][19497] Worker 1 uses CPU cores [1]
|
854 |
+
[2023-07-08 23:06:39,541][19502] Worker 6 uses CPU cores [2]
|
855 |
+
[2023-07-08 23:06:39,604][19475] Conv encoder output size: 512
|
856 |
+
[2023-07-08 23:06:39,605][19475] Policy head output size: 512
|
857 |
+
[2023-07-08 23:06:39,608][19507] Worker 12 uses CPU cores [0]
|
858 |
+
[2023-07-08 23:06:39,646][19475] Created Actor Critic model with architecture:
|
859 |
+
[2023-07-08 23:06:39,646][19475] ActorCriticSharedWeights(
|
860 |
+
(obs_normalizer): ObservationNormalizer(
|
861 |
+
(running_mean_std): RunningMeanStdDictInPlace(
|
862 |
+
(running_mean_std): ModuleDict(
|
863 |
+
(obs): RunningMeanStdInPlace()
|
864 |
+
)
|
865 |
+
)
|
866 |
+
)
|
867 |
+
(returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace)
|
868 |
+
(encoder): VizdoomEncoder(
|
869 |
+
(basic_encoder): ConvEncoder(
|
870 |
+
(enc): RecursiveScriptModule(
|
871 |
+
original_name=ConvEncoderImpl
|
872 |
+
(conv_head): RecursiveScriptModule(
|
873 |
+
original_name=Sequential
|
874 |
+
(0): RecursiveScriptModule(original_name=Conv2d)
|
875 |
+
(1): RecursiveScriptModule(original_name=ReLU)
|
876 |
+
(2): RecursiveScriptModule(original_name=Conv2d)
|
877 |
+
(3): RecursiveScriptModule(original_name=ReLU)
|
878 |
+
(4): RecursiveScriptModule(original_name=Conv2d)
|
879 |
+
(5): RecursiveScriptModule(original_name=ReLU)
|
880 |
+
)
|
881 |
+
(mlp_layers): RecursiveScriptModule(
|
882 |
+
original_name=Sequential
|
883 |
+
(0): RecursiveScriptModule(original_name=Linear)
|
884 |
+
(1): RecursiveScriptModule(original_name=ReLU)
|
885 |
+
)
|
886 |
+
)
|
887 |
+
)
|
888 |
+
)
|
889 |
+
(core): ModelCoreRNN(
|
890 |
+
(core): LSTM(512, 512)
|
891 |
+
)
|
892 |
+
(decoder): MlpDecoder(
|
893 |
+
(mlp): Identity()
|
894 |
+
)
|
895 |
+
(critic_linear): Linear(in_features=512, out_features=1, bias=True)
|
896 |
+
(action_parameterization): ActionParameterizationDefault(
|
897 |
+
(distribution_linear): Linear(in_features=512, out_features=5, bias=True)
|
898 |
+
)
|
899 |
+
)
|
900 |
+
[2023-07-08 23:06:39,648][19498] Worker 2 uses CPU cores [2]
|
901 |
+
[2023-07-08 23:06:39,753][19513] Worker 15 uses CPU cores [3]
|
902 |
+
[2023-07-08 23:06:39,774][19503] Worker 7 uses CPU cores [3]
|
903 |
+
[2023-07-08 23:06:39,781][19510] Worker 14 uses CPU cores [2]
|
904 |
+
[2023-07-08 23:06:39,800][19511] Worker 16 uses CPU cores [0]
|
905 |
+
[2023-07-08 23:06:39,801][19506] Worker 10 uses CPU cores [2]
|
906 |
+
[2023-07-08 23:06:39,804][19508] Worker 13 uses CPU cores [1]
|
907 |
+
[2023-07-08 23:06:39,805][19505] Worker 9 uses CPU cores [1]
|
908 |
+
[2023-07-08 23:06:39,811][19501] Worker 5 uses CPU cores [1]
|
909 |
+
[2023-07-08 23:06:39,821][19509] Worker 11 uses CPU cores [3]
|
910 |
+
[2023-07-08 23:06:39,888][19514] Worker 17 uses CPU cores [1]
|
911 |
+
[2023-07-08 23:06:39,899][19515] Worker 19 uses CPU cores [3]
|
912 |
+
[2023-07-08 23:06:39,901][19512] Worker 18 uses CPU cores [2]
|
913 |
+
[2023-07-08 23:06:39,968][19504] Worker 8 uses CPU cores [0]
|
914 |
+
[2023-07-08 23:06:40,230][19475] Using optimizer <class 'torch.optim.adam.Adam'>
|
915 |
+
[2023-07-08 23:06:40,230][19475] Loading state from checkpoint /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000000000_0.pth...
|
916 |
+
[2023-07-08 23:06:40,254][19475] Loading model from checkpoint
|
917 |
+
[2023-07-08 23:06:40,257][19475] Loaded experiment state at self.train_step=466273, self.env_steps=3819708416
|
918 |
+
[2023-07-08 23:06:40,257][19475] Initialized policy 0 weights for model version 466273
|
919 |
+
[2023-07-08 23:06:40,260][19475] LearnerWorker_p0 finished initialization!
|
920 |
+
[2023-07-08 23:06:40,260][19475] Using GPUs [0] for process 0 (actually maps to GPUs [0])
|
921 |
+
[2023-07-08 23:06:40,402][19496] Unhandled exception CUDA error: OS call failed or operation not supported on this OS
|
922 |
+
CUDA kernel errors might be asynchronously reported at some other API call, so the stacktrace below might be incorrect.
|
923 |
+
For debugging consider passing CUDA_LAUNCH_BLOCKING=1.
|
924 |
+
Compile with `TORCH_USE_CUDA_DSA` to enable device-side assertions.
|
925 |
+
in evt loop inference_proc0-0_evt_loop
|
926 |
+
[2023-07-08 23:08:32,108][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
|
927 |
+
[2023-07-08 23:10:32,106][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
|
928 |
+
[2023-07-08 23:12:32,106][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
|
929 |
+
[2023-07-08 23:14:32,106][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
|
930 |
+
[2023-07-08 23:16:32,106][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
|
931 |
+
[2023-07-08 23:18:32,106][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
|
932 |
+
[2023-07-08 23:20:32,106][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
|
933 |
+
[2023-07-08 23:21:32,107][19507] Stopping RolloutWorker_w12...
|
934 |
+
[2023-07-08 23:21:32,107][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
|
935 |
+
[2023-07-08 23:21:32,107][19513] Stopping RolloutWorker_w15...
|
936 |
+
[2023-07-08 23:21:32,107][19507] Loop rollout_proc12_evt_loop terminating...
|
937 |
+
[2023-07-08 23:21:32,108][19513] Loop rollout_proc15_evt_loop terminating...
|
938 |
+
[2023-07-08 23:21:32,108][19505] Stopping RolloutWorker_w9...
|
939 |
+
[2023-07-08 23:21:32,108][19508] Stopping RolloutWorker_w13...
|
940 |
+
[2023-07-08 23:21:32,109][19514] Stopping RolloutWorker_w17...
|
941 |
+
[2023-07-08 23:21:32,109][19501] Stopping RolloutWorker_w5...
|
942 |
+
[2023-07-08 23:21:32,109][19501] Loop rollout_proc5_evt_loop terminating...
|
943 |
+
[2023-07-08 23:21:32,109][19502] Stopping RolloutWorker_w6...
|
944 |
+
[2023-07-08 23:21:32,109][19502] Loop rollout_proc6_evt_loop terminating...
|
945 |
+
[2023-07-08 23:21:32,107][19497] Stopping RolloutWorker_w1...
|
946 |
+
[2023-07-08 23:21:32,112][19497] Loop rollout_proc1_evt_loop terminating...
|
947 |
+
[2023-07-08 23:21:32,112][19509] Stopping RolloutWorker_w11...
|
948 |
+
[2023-07-08 23:21:32,112][19495] Stopping RolloutWorker_w0...
|
949 |
+
[2023-07-08 23:21:32,112][19512] Stopping RolloutWorker_w18...
|
950 |
+
[2023-07-08 23:21:32,112][19495] Loop rollout_proc0_evt_loop terminating...
|
951 |
+
[2023-07-08 23:21:32,112][19509] Loop rollout_proc11_evt_loop terminating...
|
952 |
+
[2023-07-08 23:21:32,112][19512] Loop rollout_proc18_evt_loop terminating...
|
953 |
+
[2023-07-08 23:21:32,117][19499] Stopping RolloutWorker_w3...
|
954 |
+
[2023-07-08 23:21:32,117][19506] Stopping RolloutWorker_w10...
|
955 |
+
[2023-07-08 23:21:32,107][19515] Stopping RolloutWorker_w19...
|
956 |
+
[2023-07-08 23:21:32,116][19503] Stopping RolloutWorker_w7...
|
957 |
+
[2023-07-08 23:21:32,117][19506] Loop rollout_proc10_evt_loop terminating...
|
958 |
+
[2023-07-08 23:21:32,117][19499] Loop rollout_proc3_evt_loop terminating...
|
959 |
+
[2023-07-08 23:21:32,117][19503] Loop rollout_proc7_evt_loop terminating...
|
960 |
+
[2023-07-08 23:21:32,122][19505] Loop rollout_proc9_evt_loop terminating...
|
961 |
+
[2023-07-08 23:21:32,122][19498] Stopping RolloutWorker_w2...
|
962 |
+
[2023-07-08 23:21:32,122][19511] Stopping RolloutWorker_w16...
|
963 |
+
[2023-07-08 23:21:32,118][19515] Loop rollout_proc19_evt_loop terminating...
|
964 |
+
[2023-07-08 23:21:32,122][19511] Loop rollout_proc16_evt_loop terminating...
|
965 |
+
[2023-07-08 23:21:32,122][19498] Loop rollout_proc2_evt_loop terminating...
|
966 |
+
[2023-07-08 23:21:32,129][19510] Stopping RolloutWorker_w14...
|
967 |
+
[2023-07-08 23:21:32,129][19510] Loop rollout_proc14_evt_loop terminating...
|
968 |
+
[2023-07-08 23:21:32,132][19514] Loop rollout_proc17_evt_loop terminating...
|
969 |
+
[2023-07-08 23:21:32,132][19504] Stopping RolloutWorker_w8...
|
970 |
+
[2023-07-08 23:21:32,132][19504] Loop rollout_proc8_evt_loop terminating...
|
971 |
+
[2023-07-08 23:21:32,132][19475] Stopping Batcher_0...
|
972 |
+
[2023-07-08 23:21:32,132][19475] Loop batcher_evt_loop terminating...
|
973 |
+
[2023-07-08 23:21:32,136][19508] Loop rollout_proc13_evt_loop terminating...
|
974 |
+
[2023-07-08 23:21:32,142][19500] Stopping RolloutWorker_w4...
|
975 |
+
[2023-07-08 23:21:32,142][19500] Loop rollout_proc4_evt_loop terminating...
|
976 |
+
[2023-07-08 23:21:32,239][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
|
977 |
+
[2023-07-08 23:21:32,373][19475] Stopping LearnerWorker_p0...
|
978 |
+
[2023-07-08 23:21:32,373][19475] Loop learner_proc0_evt_loop terminating...
|