RajkNakka committed on
Commit
0012f0a
1 Parent(s): b4a9e85

Upload folder using huggingface_hub

Browse files
.summary/0/events.out.tfevents.1688878853.snowflake ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:440f3682432896f32d41a122192825803e3ee49b39e95ec081ddda42a7105474
3
+ size 4526
.summary/0/events.out.tfevents.1688879192.snowflake ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34e11fa2e82dffd054eaec8e49fef1ca9028159b42f5eb78b05f554c8e50e21c
3
+ size 16844
README.md CHANGED
@@ -15,7 +15,7 @@ model-index:
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
- value: 3.97 +/- 0.26
19
  name: mean_reward
20
  verified: false
21
  ---
 
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
+ value: 3.94 +/- 0.61
19
  name: mean_reward
20
  verified: false
21
  ---
checkpoint_p0/checkpoint_000000000_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd947d392e08465a103e5c4243c9f5c9277099b2304fc1ba5c09a1ad1867e86d
3
- size 14040084
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f546634a38180cb4a57aec199213e3b845b90a5ebb8206ddaa081c2c9d4ba854
3
+ size 41231900
checkpoint_p0/checkpoint_000466273_3819708416.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad911b64da964df63b10a6c450dbf67193cd2e4eb0163db5a9e46fa8946e6efb
3
+ size 41232964
config.json CHANGED
@@ -63,7 +63,7 @@
63
  "summaries_use_frameskip": true,
64
  "heartbeat_interval": 10,
65
  "heartbeat_reporting_interval": 300,
66
- "train_for_env_steps": 20000,
67
  "train_for_seconds": 1000000,
68
  "save_every_sec": 120,
69
  "keep_checkpoints": 2,
@@ -130,8 +130,8 @@
130
  "cli_args": {},
131
  "git_hash": "0401714b01ee832562a0930e3744117f1ba51e10",
132
  "git_repo_name": "https://github.com/tenkara/HF-DeepRL.git",
133
- "command_line": "--env=doom_health_gathering_supreme --train_for_env_steps=2000000",
134
- "env_gpu_observations": true,
135
  "lr_adaptive_min": 1e-06,
136
- "lr_adaptive_max": 0.01
 
137
  }
 
63
  "summaries_use_frameskip": true,
64
  "heartbeat_interval": 10,
65
  "heartbeat_reporting_interval": 300,
66
+ "train_for_env_steps": 20,
67
  "train_for_seconds": 1000000,
68
  "save_every_sec": 120,
69
  "keep_checkpoints": 2,
 
130
  "cli_args": {},
131
  "git_hash": "0401714b01ee832562a0930e3744117f1ba51e10",
132
  "git_repo_name": "https://github.com/tenkara/HF-DeepRL.git",
133
+ "command_line": "--env=doom_health_gathering_supreme --train_for_env_steps=20",
 
134
  "lr_adaptive_min": 1e-06,
135
+ "lr_adaptive_max": 0.01,
136
+ "env_gpu_observations": true
137
  }
git.diff CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72fd3c87dce5ac3afe8766d7caea74393f7369ee1e0f7a4adff360d24911b999
3
- size 211383812
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8b97eeeb6021f14696de0a65f48c22164dbc358a9a63500114e3970e8a301d7
3
+ size 211342672
sf_log.txt CHANGED
@@ -701,3 +701,278 @@ Compile with `TORCH_USE_CUDA_DSA` to enable device-side assertions.
701
  [2023-07-08 22:48:57,115][18621] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000000000_0.pth...
702
  [2023-07-08 22:48:57,152][18621] Stopping LearnerWorker_p0...
703
  [2023-07-08 22:48:57,152][18621] Loop learner_proc0_evt_loop terminating...
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
701
  [2023-07-08 22:48:57,115][18621] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000000000_0.pth...
702
  [2023-07-08 22:48:57,152][18621] Stopping LearnerWorker_p0...
703
  [2023-07-08 22:48:57,152][18621] Loop learner_proc0_evt_loop terminating...
704
+ [2023-07-08 23:01:01,233][19220] Using GPUs [0] for process 0 (actually maps to GPUs [0])
705
+ [2023-07-08 23:01:01,234][19220] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0
706
+ [2023-07-08 23:01:01,277][19220] Num visible devices: 1
707
+ [2023-07-08 23:01:01,412][19220] Setting fixed seed 42
708
+ [2023-07-08 23:01:01,412][19220] Using GPUs [0] for process 0 (actually maps to GPUs [0])
709
+ [2023-07-08 23:01:01,412][19220] Initializing actor-critic model on device cuda:0
710
+ [2023-07-08 23:01:01,413][19220] RunningMeanStd input shape: (3, 72, 128)
711
+ [2023-07-08 23:01:01,413][19220] RunningMeanStd input shape: (1,)
712
+ [2023-07-08 23:01:01,420][19220] ConvEncoder: input_channels=3
713
+ [2023-07-08 23:01:01,502][19241] Worker 0 uses CPU cores [0]
714
+ [2023-07-08 23:01:01,550][19242] Worker 2 uses CPU cores [2]
715
+ [2023-07-08 23:01:01,609][19243] Worker 1 uses CPU cores [1]
716
+ [2023-07-08 23:01:01,648][19244] Worker 3 uses CPU cores [3]
717
+ [2023-07-08 23:01:01,649][19240] Using GPUs [0] for process 0 (actually maps to GPUs [0])
718
+ [2023-07-08 23:01:01,649][19240] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0
719
+ [2023-07-08 23:01:01,737][19240] Num visible devices: 1
720
+ [2023-07-08 23:01:01,782][19246] Worker 4 uses CPU cores [0]
721
+ [2023-07-08 23:01:01,741][19220] Conv encoder output size: 512
722
+ [2023-07-08 23:01:01,787][19220] Policy head output size: 512
723
+ [2023-07-08 23:01:01,794][19252] Worker 11 uses CPU cores [3]
724
+ [2023-07-08 23:01:01,800][19250] Worker 9 uses CPU cores [1]
725
+ [2023-07-08 23:01:01,807][19220] Created Actor Critic model with architecture:
726
+ [2023-07-08 23:01:01,831][19248] Worker 7 uses CPU cores [3]
727
+ [2023-07-08 23:01:01,849][19249] Worker 8 uses CPU cores [0]
728
+ [2023-07-08 23:01:01,862][19251] Worker 10 uses CPU cores [2]
729
+ [2023-07-08 23:01:01,891][19220] ActorCriticSharedWeights(
730
+ (obs_normalizer): ObservationNormalizer(
731
+ (running_mean_std): RunningMeanStdDictInPlace(
732
+ (running_mean_std): ModuleDict(
733
+ (obs): RunningMeanStdInPlace()
734
+ )
735
+ )
736
+ )
737
+ (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace)
738
+ (encoder): VizdoomEncoder(
739
+ (basic_encoder): ConvEncoder(
740
+ (enc): RecursiveScriptModule(
741
+ original_name=ConvEncoderImpl
742
+ (conv_head): RecursiveScriptModule(
743
+ original_name=Sequential
744
+ (0): RecursiveScriptModule(original_name=Conv2d)
745
+ (1): RecursiveScriptModule(original_name=ReLU)
746
+ (2): RecursiveScriptModule(original_name=Conv2d)
747
+ (3): RecursiveScriptModule(original_name=ReLU)
748
+ (4): RecursiveScriptModule(original_name=Conv2d)
749
+ (5): RecursiveScriptModule(original_name=ReLU)
750
+ )
751
+ (mlp_layers): RecursiveScriptModule(
752
+ original_name=Sequential
753
+ (0): RecursiveScriptModule(original_name=Linear)
754
+ (1): RecursiveScriptModule(original_name=ReLU)
755
+ )
756
+ )
757
+ )
758
+ )
759
+ (core): ModelCoreRNN(
760
+ (core): LSTM(512, 512)
761
+ )
762
+ (decoder): MlpDecoder(
763
+ (mlp): Identity()
764
+ )
765
+ (critic_linear): Linear(in_features=512, out_features=1, bias=True)
766
+ (action_parameterization): ActionParameterizationDefault(
767
+ (distribution_linear): Linear(in_features=512, out_features=5, bias=True)
768
+ )
769
+ )
770
+ [2023-07-08 23:01:01,903][19253] Worker 12 uses CPU cores [0]
771
+ [2023-07-08 23:01:01,925][19247] Worker 6 uses CPU cores [2]
772
+ [2023-07-08 23:01:01,943][19254] Worker 13 uses CPU cores [1]
773
+ [2023-07-08 23:01:01,967][19256] Worker 15 uses CPU cores [3]
774
+ [2023-07-08 23:01:01,975][19259] Worker 18 uses CPU cores [2]
775
+ [2023-07-08 23:01:01,991][19255] Worker 14 uses CPU cores [2]
776
+ [2023-07-08 23:01:02,001][19257] Worker 16 uses CPU cores [0]
777
+ [2023-07-08 23:01:02,021][19260] Worker 19 uses CPU cores [3]
778
+ [2023-07-08 23:01:02,041][19245] Worker 5 uses CPU cores [1]
779
+ [2023-07-08 23:01:02,052][19258] Worker 17 uses CPU cores [1]
780
+ [2023-07-08 23:01:02,219][19220] Using optimizer <class 'torch.optim.adam.Adam'>
781
+ [2023-07-08 23:01:02,220][19220] No checkpoints found
782
+ [2023-07-08 23:01:02,220][19220] Did not load from checkpoint, starting from scratch!
783
+ [2023-07-08 23:01:02,220][19220] Initialized policy 0 weights for model version 0
784
+ [2023-07-08 23:01:02,223][19220] Using GPUs [0] for process 0 (actually maps to GPUs [0])
785
+ [2023-07-08 23:01:02,236][19220] LearnerWorker_p0 finished initialization!
786
+ [2023-07-08 23:01:02,356][19240] Unhandled exception CUDA error: OS call failed or operation not supported on this OS
787
+ CUDA kernel errors might be asynchronously reported at some other API call, so the stacktrace below might be incorrect.
788
+ For debugging consider passing CUDA_LAUNCH_BLOCKING=1.
789
+ Compile with `TORCH_USE_CUDA_DSA` to enable device-side assertions.
790
+ in evt loop inference_proc0-0_evt_loop
791
+ [2023-07-08 23:02:53,735][19220] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000000000_0.pth...
792
+ [2023-07-08 23:04:53,736][19220] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000000000_0.pth...
793
+ [2023-07-08 23:05:29,863][19259] Stopping RolloutWorker_w18...
794
+ [2023-07-08 23:05:29,864][19259] Loop rollout_proc18_evt_loop terminating...
795
+ [2023-07-08 23:05:29,864][19260] Stopping RolloutWorker_w19...
796
+ [2023-07-08 23:05:29,864][19260] Loop rollout_proc19_evt_loop terminating...
797
+ [2023-07-08 23:05:29,872][19252] Stopping RolloutWorker_w11...
798
+ [2023-07-08 23:05:29,872][19249] Stopping RolloutWorker_w8...
799
+ [2023-07-08 23:05:29,872][19251] Stopping RolloutWorker_w10...
800
+ [2023-07-08 23:05:29,872][19252] Loop rollout_proc11_evt_loop terminating...
801
+ [2023-07-08 23:05:29,872][19249] Loop rollout_proc8_evt_loop terminating...
802
+ [2023-07-08 23:05:29,872][19251] Loop rollout_proc10_evt_loop terminating...
803
+ [2023-07-08 23:05:29,882][19255] Stopping RolloutWorker_w14...
804
+ [2023-07-08 23:05:29,882][19248] Stopping RolloutWorker_w7...
805
+ [2023-07-08 23:05:29,882][19257] Stopping RolloutWorker_w16...
806
+ [2023-07-08 23:05:29,882][19255] Loop rollout_proc14_evt_loop terminating...
807
+ [2023-07-08 23:05:29,882][19248] Loop rollout_proc7_evt_loop terminating...
808
+ [2023-07-08 23:05:29,882][19257] Loop rollout_proc16_evt_loop terminating...
809
+ [2023-07-08 23:05:29,882][19220] Stopping Batcher_0...
810
+ [2023-07-08 23:05:29,883][19220] Loop batcher_evt_loop terminating...
811
+ [2023-07-08 23:05:29,892][19244] Stopping RolloutWorker_w3...
812
+ [2023-07-08 23:05:29,892][19241] Stopping RolloutWorker_w0...
813
+ [2023-07-08 23:05:29,892][19244] Loop rollout_proc3_evt_loop terminating...
814
+ [2023-07-08 23:05:29,892][19241] Loop rollout_proc0_evt_loop terminating...
815
+ [2023-07-08 23:05:29,892][19220] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000000000_0.pth...
816
+ [2023-07-08 23:05:29,895][19256] Stopping RolloutWorker_w15...
817
+ [2023-07-08 23:05:29,895][19247] Stopping RolloutWorker_w6...
818
+ [2023-07-08 23:05:29,895][19256] Loop rollout_proc15_evt_loop terminating...
819
+ [2023-07-08 23:05:29,896][19253] Stopping RolloutWorker_w12...
820
+ [2023-07-08 23:05:29,896][19247] Loop rollout_proc6_evt_loop terminating...
821
+ [2023-07-08 23:05:29,896][19253] Loop rollout_proc12_evt_loop terminating...
822
+ [2023-07-08 23:05:29,901][19246] Stopping RolloutWorker_w4...
823
+ [2023-07-08 23:05:29,902][19246] Loop rollout_proc4_evt_loop terminating...
824
+ [2023-07-08 23:05:29,903][19242] Stopping RolloutWorker_w2...
825
+ [2023-07-08 23:05:29,905][19242] Loop rollout_proc2_evt_loop terminating...
826
+ [2023-07-08 23:05:29,956][19220] Stopping LearnerWorker_p0...
827
+ [2023-07-08 23:05:29,956][19220] Loop learner_proc0_evt_loop terminating...
828
+ [2023-07-08 23:05:30,040][19250] Stopping RolloutWorker_w9...
829
+ [2023-07-08 23:05:30,041][19250] Loop rollout_proc9_evt_loop terminating...
830
+ [2023-07-08 23:05:30,042][19254] Stopping RolloutWorker_w13...
831
+ [2023-07-08 23:05:30,042][19254] Loop rollout_proc13_evt_loop terminating...
832
+ [2023-07-08 23:05:30,052][19245] Stopping RolloutWorker_w5...
833
+ [2023-07-08 23:05:30,052][19245] Loop rollout_proc5_evt_loop terminating...
834
+ [2023-07-08 23:05:30,062][19258] Stopping RolloutWorker_w17...
835
+ [2023-07-08 23:05:30,062][19258] Loop rollout_proc17_evt_loop terminating...
836
+ [2023-07-08 23:05:30,072][19243] Stopping RolloutWorker_w1...
837
+ [2023-07-08 23:05:30,072][19243] Loop rollout_proc1_evt_loop terminating...
838
+ [2023-07-08 23:06:39,079][19475] Using GPUs [0] for process 0 (actually maps to GPUs [0])
839
+ [2023-07-08 23:06:39,079][19475] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0
840
+ [2023-07-08 23:06:39,116][19475] Num visible devices: 1
841
+ [2023-07-08 23:06:39,240][19475] Setting fixed seed 42
842
+ [2023-07-08 23:06:39,241][19475] Using GPUs [0] for process 0 (actually maps to GPUs [0])
843
+ [2023-07-08 23:06:39,241][19475] Initializing actor-critic model on device cuda:0
844
+ [2023-07-08 23:06:39,241][19475] RunningMeanStd input shape: (3, 72, 128)
845
+ [2023-07-08 23:06:39,242][19475] RunningMeanStd input shape: (1,)
846
+ [2023-07-08 23:06:39,248][19475] ConvEncoder: input_channels=3
847
+ [2023-07-08 23:06:39,280][19499] Worker 3 uses CPU cores [3]
848
+ [2023-07-08 23:06:39,412][19496] Using GPUs [0] for process 0 (actually maps to GPUs [0])
849
+ [2023-07-08 23:06:39,412][19496] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0
850
+ [2023-07-08 23:06:39,470][19496] Num visible devices: 1
851
+ [2023-07-08 23:06:39,462][19500] Worker 4 uses CPU cores [0]
852
+ [2023-07-08 23:06:39,527][19495] Worker 0 uses CPU cores [0]
853
+ [2023-07-08 23:06:39,541][19497] Worker 1 uses CPU cores [1]
854
+ [2023-07-08 23:06:39,541][19502] Worker 6 uses CPU cores [2]
855
+ [2023-07-08 23:06:39,604][19475] Conv encoder output size: 512
856
+ [2023-07-08 23:06:39,605][19475] Policy head output size: 512
857
+ [2023-07-08 23:06:39,608][19507] Worker 12 uses CPU cores [0]
858
+ [2023-07-08 23:06:39,646][19475] Created Actor Critic model with architecture:
859
+ [2023-07-08 23:06:39,646][19475] ActorCriticSharedWeights(
860
+ (obs_normalizer): ObservationNormalizer(
861
+ (running_mean_std): RunningMeanStdDictInPlace(
862
+ (running_mean_std): ModuleDict(
863
+ (obs): RunningMeanStdInPlace()
864
+ )
865
+ )
866
+ )
867
+ (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace)
868
+ (encoder): VizdoomEncoder(
869
+ (basic_encoder): ConvEncoder(
870
+ (enc): RecursiveScriptModule(
871
+ original_name=ConvEncoderImpl
872
+ (conv_head): RecursiveScriptModule(
873
+ original_name=Sequential
874
+ (0): RecursiveScriptModule(original_name=Conv2d)
875
+ (1): RecursiveScriptModule(original_name=ReLU)
876
+ (2): RecursiveScriptModule(original_name=Conv2d)
877
+ (3): RecursiveScriptModule(original_name=ReLU)
878
+ (4): RecursiveScriptModule(original_name=Conv2d)
879
+ (5): RecursiveScriptModule(original_name=ReLU)
880
+ )
881
+ (mlp_layers): RecursiveScriptModule(
882
+ original_name=Sequential
883
+ (0): RecursiveScriptModule(original_name=Linear)
884
+ (1): RecursiveScriptModule(original_name=ReLU)
885
+ )
886
+ )
887
+ )
888
+ )
889
+ (core): ModelCoreRNN(
890
+ (core): LSTM(512, 512)
891
+ )
892
+ (decoder): MlpDecoder(
893
+ (mlp): Identity()
894
+ )
895
+ (critic_linear): Linear(in_features=512, out_features=1, bias=True)
896
+ (action_parameterization): ActionParameterizationDefault(
897
+ (distribution_linear): Linear(in_features=512, out_features=5, bias=True)
898
+ )
899
+ )
900
+ [2023-07-08 23:06:39,648][19498] Worker 2 uses CPU cores [2]
901
+ [2023-07-08 23:06:39,753][19513] Worker 15 uses CPU cores [3]
902
+ [2023-07-08 23:06:39,774][19503] Worker 7 uses CPU cores [3]
903
+ [2023-07-08 23:06:39,781][19510] Worker 14 uses CPU cores [2]
904
+ [2023-07-08 23:06:39,800][19511] Worker 16 uses CPU cores [0]
905
+ [2023-07-08 23:06:39,801][19506] Worker 10 uses CPU cores [2]
906
+ [2023-07-08 23:06:39,804][19508] Worker 13 uses CPU cores [1]
907
+ [2023-07-08 23:06:39,805][19505] Worker 9 uses CPU cores [1]
908
+ [2023-07-08 23:06:39,811][19501] Worker 5 uses CPU cores [1]
909
+ [2023-07-08 23:06:39,821][19509] Worker 11 uses CPU cores [3]
910
+ [2023-07-08 23:06:39,888][19514] Worker 17 uses CPU cores [1]
911
+ [2023-07-08 23:06:39,899][19515] Worker 19 uses CPU cores [3]
912
+ [2023-07-08 23:06:39,901][19512] Worker 18 uses CPU cores [2]
913
+ [2023-07-08 23:06:39,968][19504] Worker 8 uses CPU cores [0]
914
+ [2023-07-08 23:06:40,230][19475] Using optimizer <class 'torch.optim.adam.Adam'>
915
+ [2023-07-08 23:06:40,230][19475] Loading state from checkpoint /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000000000_0.pth...
916
+ [2023-07-08 23:06:40,254][19475] Loading model from checkpoint
917
+ [2023-07-08 23:06:40,257][19475] Loaded experiment state at self.train_step=466273, self.env_steps=3819708416
918
+ [2023-07-08 23:06:40,257][19475] Initialized policy 0 weights for model version 466273
919
+ [2023-07-08 23:06:40,260][19475] LearnerWorker_p0 finished initialization!
920
+ [2023-07-08 23:06:40,260][19475] Using GPUs [0] for process 0 (actually maps to GPUs [0])
921
+ [2023-07-08 23:06:40,402][19496] Unhandled exception CUDA error: OS call failed or operation not supported on this OS
922
+ CUDA kernel errors might be asynchronously reported at some other API call, so the stacktrace below might be incorrect.
923
+ For debugging consider passing CUDA_LAUNCH_BLOCKING=1.
924
+ Compile with `TORCH_USE_CUDA_DSA` to enable device-side assertions.
925
+ in evt loop inference_proc0-0_evt_loop
926
+ [2023-07-08 23:08:32,108][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
927
+ [2023-07-08 23:10:32,106][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
928
+ [2023-07-08 23:12:32,106][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
929
+ [2023-07-08 23:14:32,106][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
930
+ [2023-07-08 23:16:32,106][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
931
+ [2023-07-08 23:18:32,106][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
932
+ [2023-07-08 23:20:32,106][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
933
+ [2023-07-08 23:21:32,107][19507] Stopping RolloutWorker_w12...
934
+ [2023-07-08 23:21:32,107][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
935
+ [2023-07-08 23:21:32,107][19513] Stopping RolloutWorker_w15...
936
+ [2023-07-08 23:21:32,107][19507] Loop rollout_proc12_evt_loop terminating...
937
+ [2023-07-08 23:21:32,108][19513] Loop rollout_proc15_evt_loop terminating...
938
+ [2023-07-08 23:21:32,108][19505] Stopping RolloutWorker_w9...
939
+ [2023-07-08 23:21:32,108][19508] Stopping RolloutWorker_w13...
940
+ [2023-07-08 23:21:32,109][19514] Stopping RolloutWorker_w17...
941
+ [2023-07-08 23:21:32,109][19501] Stopping RolloutWorker_w5...
942
+ [2023-07-08 23:21:32,109][19501] Loop rollout_proc5_evt_loop terminating...
943
+ [2023-07-08 23:21:32,109][19502] Stopping RolloutWorker_w6...
944
+ [2023-07-08 23:21:32,109][19502] Loop rollout_proc6_evt_loop terminating...
945
+ [2023-07-08 23:21:32,107][19497] Stopping RolloutWorker_w1...
946
+ [2023-07-08 23:21:32,112][19497] Loop rollout_proc1_evt_loop terminating...
947
+ [2023-07-08 23:21:32,112][19509] Stopping RolloutWorker_w11...
948
+ [2023-07-08 23:21:32,112][19495] Stopping RolloutWorker_w0...
949
+ [2023-07-08 23:21:32,112][19512] Stopping RolloutWorker_w18...
950
+ [2023-07-08 23:21:32,112][19495] Loop rollout_proc0_evt_loop terminating...
951
+ [2023-07-08 23:21:32,112][19509] Loop rollout_proc11_evt_loop terminating...
952
+ [2023-07-08 23:21:32,112][19512] Loop rollout_proc18_evt_loop terminating...
953
+ [2023-07-08 23:21:32,117][19499] Stopping RolloutWorker_w3...
954
+ [2023-07-08 23:21:32,117][19506] Stopping RolloutWorker_w10...
955
+ [2023-07-08 23:21:32,107][19515] Stopping RolloutWorker_w19...
956
+ [2023-07-08 23:21:32,116][19503] Stopping RolloutWorker_w7...
957
+ [2023-07-08 23:21:32,117][19506] Loop rollout_proc10_evt_loop terminating...
958
+ [2023-07-08 23:21:32,117][19499] Loop rollout_proc3_evt_loop terminating...
959
+ [2023-07-08 23:21:32,117][19503] Loop rollout_proc7_evt_loop terminating...
960
+ [2023-07-08 23:21:32,122][19505] Loop rollout_proc9_evt_loop terminating...
961
+ [2023-07-08 23:21:32,122][19498] Stopping RolloutWorker_w2...
962
+ [2023-07-08 23:21:32,122][19511] Stopping RolloutWorker_w16...
963
+ [2023-07-08 23:21:32,118][19515] Loop rollout_proc19_evt_loop terminating...
964
+ [2023-07-08 23:21:32,122][19511] Loop rollout_proc16_evt_loop terminating...
965
+ [2023-07-08 23:21:32,122][19498] Loop rollout_proc2_evt_loop terminating...
966
+ [2023-07-08 23:21:32,129][19510] Stopping RolloutWorker_w14...
967
+ [2023-07-08 23:21:32,129][19510] Loop rollout_proc14_evt_loop terminating...
968
+ [2023-07-08 23:21:32,132][19514] Loop rollout_proc17_evt_loop terminating...
969
+ [2023-07-08 23:21:32,132][19504] Stopping RolloutWorker_w8...
970
+ [2023-07-08 23:21:32,132][19504] Loop rollout_proc8_evt_loop terminating...
971
+ [2023-07-08 23:21:32,132][19475] Stopping Batcher_0...
972
+ [2023-07-08 23:21:32,132][19475] Loop batcher_evt_loop terminating...
973
+ [2023-07-08 23:21:32,136][19508] Loop rollout_proc13_evt_loop terminating...
974
+ [2023-07-08 23:21:32,142][19500] Stopping RolloutWorker_w4...
975
+ [2023-07-08 23:21:32,142][19500] Loop rollout_proc4_evt_loop terminating...
976
+ [2023-07-08 23:21:32,239][19475] Saving /home/raj/repos/HF-DeepRL/8-Proximal-Policy-Optimization/train_dir/default_experiment/checkpoint_p0/checkpoint_000466273_3819708416.pth...
977
+ [2023-07-08 23:21:32,373][19475] Stopping LearnerWorker_p0...
978
+ [2023-07-08 23:21:32,373][19475] Loop learner_proc0_evt_loop terminating...