monti-python commited on
Commit
e6ae781
1 Parent(s): 431e49d

First training for SoccerTwos

Browse files
SoccerTwos.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:88f7b369822750a740c7d6b7361d05ec0175520a6cadee83584b4baa5dbd466f
3
  size 1768747
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72e7ba4ea1fddd3c759958d029b95be5ec6eaa5080b4405464b561aa9b84e6fb
3
  size 1768747
SoccerTwos/SoccerTwos-1499597.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e723f024e58ace7987a73987e84562321a0e14c36dbc08382de55fe9f2c48a96
3
+ size 1768747
SoccerTwos/SoccerTwos-1499597.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3dacef54ff80819d0e995efb488faef76fc5b2c98e8ff11be2e0af4aaf2f49a
3
+ size 28432022
SoccerTwos/SoccerTwos-1641770.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72e7ba4ea1fddd3c759958d029b95be5ec6eaa5080b4405464b561aa9b84e6fb
3
+ size 1768747
SoccerTwos/SoccerTwos-1641770.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a615b417f5421ece46210146c3debfab30ab6769b8ababa5d730edbb983168dd
3
+ size 28432022
SoccerTwos/SoccerTwos-999240.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1eaa032865bb9c7885b54343a0a0301ff6abafb0c56d1974dfd9cdc6eb958607
3
+ size 1768747
SoccerTwos/SoccerTwos-999240.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2979b96ce6d3e0a57338f5170f030ff840307a3081d96d2297092f961d18e56
3
+ size 28431898
SoccerTwos/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d079a9016a08c94d2882ccd447c56daf56ecf1ed339823aac3181c005558c2e
3
  size 28431030
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:babb9a0b58835eeef474c91c463b6c4be78300ee733a0c82db102f15e8986c7d
3
  size 28431030
SoccerTwos/events.out.tfevents.1724450680.Montana.30364.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d4a52b3163fc62aeaca4e3957c94fe1bd9bc001427a6020c88214f05671143f
3
+ size 739187
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "constant", "beta_schedule": "constant", "epsilon_schedule": "constant"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 5000000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 50000, "team_change": 200000, "swap_steps": 2000, "window": 10, "play_against_latest_model_ratio": 0.5, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SoccerTwos/SoccerTwos.x86_64", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos1", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "constant", "beta_schedule": "constant", "epsilon_schedule": "constant"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 5000000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 50000, "team_change": 200000, "swap_steps": 2000, "window": 10, "play_against_latest_model_ratio": 0.5, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SoccerTwos/SoccerTwos.x86_64", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos1", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -73,8 +73,8 @@ checkpoint_settings:
73
  run_id: SoccerTwos1
74
  initialize_from: null
75
  load_model: false
76
- resume: false
77
- force: true
78
  train_model: false
79
  inference: false
80
  results_dir: results
 
73
  run_id: SoccerTwos1
74
  initialize_from: null
75
  load_model: false
76
+ resume: true
77
+ force: false
78
  train_model: false
79
  inference: false
80
  results_dir: results
run_logs/Player-0.log CHANGED
@@ -2,8 +2,6 @@ Mono path[0] = '/home/montana/repos/deep-rl/unit7-multi-agents/ml-agents/trainin
2
  Mono config path = '/home/montana/repos/deep-rl/unit7-multi-agents/ml-agents/training-envs-executables/linux/SoccerTwos/SoccerTwos_Data/MonoBleedingEdge/etc'
3
  Preloaded 'lib_burst_generated.so'
4
  Preloaded 'libgrpc_csharp_ext.x64.so'
5
- PlayerPrefs - Creating folder: /home/montana/.config/unity3d/Unity Technologies/SoccerTwos
6
- Unable to load player prefs
7
  Initialize engine version: 2021.3.14f1 (eee1884e7226)
8
  [Subsystems] Discovering subsystems at path /home/montana/repos/deep-rl/unit7-multi-agents/ml-agents/training-envs-executables/linux/SoccerTwos/SoccerTwos_Data/UnitySubsystems
9
  Forcing GfxDevice: Null
@@ -13,7 +11,7 @@ NullGfxDevice:
13
  Renderer: Null Device
14
  Vendor: Unity Technologies
15
  Begin MonoManager ReloadAssembly
16
- - Completed reload, in 0.053 seconds
17
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
18
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
19
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -38,7 +36,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
38
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
39
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
40
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
41
- UnloadTime: 0.515397 ms
42
  Registered Communicator in Agent.
43
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
44
  requesting resize 84 x 84
@@ -330,12 +328,126 @@ TOO LONG
330
  TOO LONG
331
  TOO LONG
332
  TOO LONG
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
333
  Setting up 4 worker threads for Enlighten.
334
  Memory Statistics:
335
  [ALLOC_TEMP_TLS] TLS Allocator
336
  StackAllocators :
337
  [ALLOC_TEMP_MAIN]
338
- Peak usage frame count: [8.0 KB-16.0 KB]: 12715 frames, [2.0 MB-4.0 MB]: 1 frames
339
  Initial Block Size 4.0 MB
340
  Current Block Size 4.0 MB
341
  Peak Allocated Bytes 2.1 MB
@@ -358,7 +470,7 @@ Memory Statistics:
358
  [ALLOC_TEMP_Job.Worker 6]
359
  Initial Block Size 256.0 KB
360
  Current Block Size 256.0 KB
361
- Peak Allocated Bytes 0 B
362
  Overflow Count 0
363
  [ALLOC_TEMP_Job.Worker 0]
364
  Initial Block Size 256.0 KB
@@ -453,7 +565,7 @@ Memory Statistics:
453
  [ALLOC_TEMP_Job.Worker 2]
454
  Initial Block Size 256.0 KB
455
  Current Block Size 256.0 KB
456
- Peak Allocated Bytes 0.7 KB
457
  Overflow Count 0
458
  [ALLOC_TEMP_Background Job.Worker 3]
459
  Initial Block Size 32.0 KB
@@ -487,16 +599,16 @@ Memory Statistics:
487
  Used Block count 1
488
  Peak Allocated bytes 1.0 MB
489
  [ALLOC_DEFAULT_MAIN]
490
- Peak usage frame count: [4.0 MB-8.0 MB]: 12716 frames
491
  Requested Block Size 16.0 MB
492
  Peak Block count 1
493
- Peak Allocated memory 4.8 MB
494
  Peak Large allocation bytes 0 B
495
  [ALLOC_DEFAULT_THREAD]
496
- Peak usage frame count: [16.0 MB-32.0 MB]: 12716 frames
497
  Requested Block Size 16.0 MB
498
  Peak Block count 1
499
- Peak Allocated memory 17.4 MB
500
  Peak Large allocation bytes 16.0 MB
501
  [ALLOC_TEMP_JOB_1_FRAME]
502
  Initial Block Size 2.0 MB
@@ -525,13 +637,13 @@ Memory Statistics:
525
  Used Block count 1
526
  Peak Allocated bytes 1.0 MB
527
  [ALLOC_GFX_MAIN]
528
- Peak usage frame count: [32.0 KB-64.0 KB]: 12715 frames, [64.0 KB-128.0 KB]: 1 frames
529
  Requested Block Size 16.0 MB
530
  Peak Block count 1
531
  Peak Allocated memory 65.6 KB
532
  Peak Large allocation bytes 0 B
533
  [ALLOC_GFX_THREAD]
534
- Peak usage frame count: [128.0 KB-256.0 KB]: 12716 frames
535
  Requested Block Size 16.0 MB
536
  Peak Block count 1
537
  Peak Allocated memory 173.5 KB
@@ -543,13 +655,13 @@ Memory Statistics:
543
  Used Block count 1
544
  Peak Allocated bytes 1.0 MB
545
  [ALLOC_CACHEOBJECTS_MAIN]
546
- Peak usage frame count: [0.5 MB-1.0 MB]: 12716 frames
547
  Requested Block Size 4.0 MB
548
  Peak Block count 1
549
  Peak Allocated memory 0.6 MB
550
  Peak Large allocation bytes 0 B
551
  [ALLOC_CACHEOBJECTS_THREAD]
552
- Peak usage frame count: [0.5 MB-1.0 MB]: 12715 frames, [4.0 MB-8.0 MB]: 1 frames
553
  Requested Block Size 4.0 MB
554
  Peak Block count 2
555
  Peak Allocated memory 4.5 MB
@@ -561,13 +673,13 @@ Memory Statistics:
561
  Used Block count 1
562
  Peak Allocated bytes 1.0 MB
563
  [ALLOC_TYPETREE_MAIN]
564
- Peak usage frame count: [0-1.0 KB]: 12716 frames
565
  Requested Block Size 2.0 MB
566
  Peak Block count 1
567
  Peak Allocated memory 1.0 KB
568
  Peak Large allocation bytes 0 B
569
  [ALLOC_TYPETREE_THREAD]
570
- Peak usage frame count: [1.0 KB-2.0 KB]: 12715 frames, [2.0 KB-4.0 KB]: 1 frames
571
  Requested Block Size 2.0 MB
572
  Peak Block count 1
573
  Peak Allocated memory 2.2 KB
 
2
  Mono config path = '/home/montana/repos/deep-rl/unit7-multi-agents/ml-agents/training-envs-executables/linux/SoccerTwos/SoccerTwos_Data/MonoBleedingEdge/etc'
3
  Preloaded 'lib_burst_generated.so'
4
  Preloaded 'libgrpc_csharp_ext.x64.so'
 
 
5
  Initialize engine version: 2021.3.14f1 (eee1884e7226)
6
  [Subsystems] Discovering subsystems at path /home/montana/repos/deep-rl/unit7-multi-agents/ml-agents/training-envs-executables/linux/SoccerTwos/SoccerTwos_Data/UnitySubsystems
7
  Forcing GfxDevice: Null
 
11
  Renderer: Null Device
12
  Vendor: Unity Technologies
13
  Begin MonoManager ReloadAssembly
14
+ - Completed reload, in 0.135 seconds
15
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
16
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
17
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
36
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
37
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
38
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
39
+ UnloadTime: 0.551381 ms
40
  Registered Communicator in Agent.
41
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
42
  requesting resize 84 x 84
 
328
  TOO LONG
329
  TOO LONG
330
  TOO LONG
331
+ TOO LONG
332
+ TOO LONG
333
+ TOO LONG
334
+ TOO LONG
335
+ TOO LONG
336
+ TOO LONG
337
+ TOO LONG
338
+ TOO LONG
339
+ TOO LONG
340
+ TOO LONG
341
+ TOO LONG
342
+ TOO LONG
343
+ TOO LONG
344
+ TOO LONG
345
+ TOO LONG
346
+ TOO LONG
347
+ TOO LONG
348
+ TOO LONG
349
+ TOO LONG
350
+ TOO LONG
351
+ TOO LONG
352
+ TOO LONG
353
+ TOO LONG
354
+ TOO LONG
355
+ TOO LONG
356
+ TOO LONG
357
+ TOO LONG
358
+ TOO LONG
359
+ TOO LONG
360
+ TOO LONG
361
+ TOO LONG
362
+ TOO LONG
363
+ TOO LONG
364
+ TOO LONG
365
+ TOO LONG
366
+ TOO LONG
367
+ TOO LONG
368
+ TOO LONG
369
+ TOO LONG
370
+ TOO LONG
371
+ TOO LONG
372
+ TOO LONG
373
+ TOO LONG
374
+ TOO LONG
375
+ TOO LONG
376
+ TOO LONG
377
+ TOO LONG
378
+ TOO LONG
379
+ TOO LONG
380
+ TOO LONG
381
+ TOO LONG
382
+ TOO LONG
383
+ TOO LONG
384
+ TOO LONG
385
+ TOO LONG
386
+ TOO LONG
387
+ TOO LONG
388
+ TOO LONG
389
+ TOO LONG
390
+ TOO LONG
391
+ TOO LONG
392
+ TOO LONG
393
+ TOO LONG
394
+ TOO LONG
395
+ TOO LONG
396
+ TOO LONG
397
+ TOO LONG
398
+ TOO LONG
399
+ TOO LONG
400
+ TOO LONG
401
+ TOO LONG
402
+ TOO LONG
403
+ TOO LONG
404
+ TOO LONG
405
+ TOO LONG
406
+ TOO LONG
407
+ TOO LONG
408
+ TOO LONG
409
+ TOO LONG
410
+ TOO LONG
411
+ TOO LONG
412
+ TOO LONG
413
+ TOO LONG
414
+ TOO LONG
415
+ TOO LONG
416
+ TOO LONG
417
+ TOO LONG
418
+ TOO LONG
419
+ TOO LONG
420
+ TOO LONG
421
+ TOO LONG
422
+ TOO LONG
423
+ TOO LONG
424
+ TOO LONG
425
+ TOO LONG
426
+ TOO LONG
427
+ TOO LONG
428
+ TOO LONG
429
+ TOO LONG
430
+ TOO LONG
431
+ TOO LONG
432
+ TOO LONG
433
+ TOO LONG
434
+ TOO LONG
435
+ TOO LONG
436
+ TOO LONG
437
+ TOO LONG
438
+ TOO LONG
439
+ TOO LONG
440
+ TOO LONG
441
+ TOO LONG
442
+ TOO LONG
443
+ TOO LONG
444
+ TOO LONG
445
  Setting up 4 worker threads for Enlighten.
446
  Memory Statistics:
447
  [ALLOC_TEMP_TLS] TLS Allocator
448
  StackAllocators :
449
  [ALLOC_TEMP_MAIN]
450
+ Peak usage frame count: [8.0 KB-16.0 KB]: 19248 frames, [2.0 MB-4.0 MB]: 1 frames
451
  Initial Block Size 4.0 MB
452
  Current Block Size 4.0 MB
453
  Peak Allocated Bytes 2.1 MB
 
470
  [ALLOC_TEMP_Job.Worker 6]
471
  Initial Block Size 256.0 KB
472
  Current Block Size 256.0 KB
473
+ Peak Allocated Bytes 0.7 KB
474
  Overflow Count 0
475
  [ALLOC_TEMP_Job.Worker 0]
476
  Initial Block Size 256.0 KB
 
565
  [ALLOC_TEMP_Job.Worker 2]
566
  Initial Block Size 256.0 KB
567
  Current Block Size 256.0 KB
568
+ Peak Allocated Bytes 0 B
569
  Overflow Count 0
570
  [ALLOC_TEMP_Background Job.Worker 3]
571
  Initial Block Size 32.0 KB
 
599
  Used Block count 1
600
  Peak Allocated bytes 1.0 MB
601
  [ALLOC_DEFAULT_MAIN]
602
+ Peak usage frame count: [4.0 MB-8.0 MB]: 19249 frames
603
  Requested Block Size 16.0 MB
604
  Peak Block count 1
605
+ Peak Allocated memory 4.6 MB
606
  Peak Large allocation bytes 0 B
607
  [ALLOC_DEFAULT_THREAD]
608
+ Peak usage frame count: [16.0 MB-32.0 MB]: 19249 frames
609
  Requested Block Size 16.0 MB
610
  Peak Block count 1
611
+ Peak Allocated memory 17.6 MB
612
  Peak Large allocation bytes 16.0 MB
613
  [ALLOC_TEMP_JOB_1_FRAME]
614
  Initial Block Size 2.0 MB
 
637
  Used Block count 1
638
  Peak Allocated bytes 1.0 MB
639
  [ALLOC_GFX_MAIN]
640
+ Peak usage frame count: [32.0 KB-64.0 KB]: 19248 frames, [64.0 KB-128.0 KB]: 1 frames
641
  Requested Block Size 16.0 MB
642
  Peak Block count 1
643
  Peak Allocated memory 65.6 KB
644
  Peak Large allocation bytes 0 B
645
  [ALLOC_GFX_THREAD]
646
+ Peak usage frame count: [128.0 KB-256.0 KB]: 19249 frames
647
  Requested Block Size 16.0 MB
648
  Peak Block count 1
649
  Peak Allocated memory 173.5 KB
 
655
  Used Block count 1
656
  Peak Allocated bytes 1.0 MB
657
  [ALLOC_CACHEOBJECTS_MAIN]
658
+ Peak usage frame count: [0.5 MB-1.0 MB]: 19249 frames
659
  Requested Block Size 4.0 MB
660
  Peak Block count 1
661
  Peak Allocated memory 0.6 MB
662
  Peak Large allocation bytes 0 B
663
  [ALLOC_CACHEOBJECTS_THREAD]
664
+ Peak usage frame count: [0.5 MB-1.0 MB]: 19248 frames, [4.0 MB-8.0 MB]: 1 frames
665
  Requested Block Size 4.0 MB
666
  Peak Block count 2
667
  Peak Allocated memory 4.5 MB
 
673
  Used Block count 1
674
  Peak Allocated bytes 1.0 MB
675
  [ALLOC_TYPETREE_MAIN]
676
+ Peak usage frame count: [0-1.0 KB]: 19249 frames
677
  Requested Block Size 2.0 MB
678
  Peak Block count 1
679
  Peak Allocated memory 1.0 KB
680
  Peak Large allocation bytes 0 B
681
  [ALLOC_TYPETREE_THREAD]
682
+ Peak usage frame count: [1.0 KB-2.0 KB]: 19248 frames, [2.0 KB-4.0 KB]: 1 frames
683
  Requested Block Size 2.0 MB
684
  Peak Block count 1
685
  Peak Allocated memory 2.2 KB
run_logs/timers.json CHANGED
@@ -2,261 +2,261 @@
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
- "value": 3.209474802017212,
6
- "min": 3.1888222694396973,
7
- "max": 3.2957417964935303,
8
- "count": 64
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
- "value": 73227.375,
12
- "min": 15208.412109375,
13
- "max": 106662.3984375,
14
- "count": 64
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
- "value": 860.6666666666666,
18
- "min": 498.0,
19
  "max": 999.0,
20
- "count": 64
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
- "value": 20656.0,
24
- "min": 12220.0,
25
- "max": 26432.0,
26
- "count": 64
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
- "value": 1205.940405594161,
30
- "min": 1199.2562388766496,
31
- "max": 1207.7641443217108,
32
- "count": 48
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
- "value": 2411.880811188322,
36
- "min": 2398.512477753299,
37
- "max": 14405.181302303918,
38
- "count": 48
 
 
 
 
 
 
 
 
 
 
 
 
39
  },
40
  "SoccerTwos.Step.mean": {
41
- "value": 639300.0,
42
- "min": 9218.0,
43
- "max": 639300.0,
44
- "count": 64
45
  },
46
  "SoccerTwos.Step.sum": {
47
- "value": 639300.0,
48
- "min": 9218.0,
49
- "max": 639300.0,
50
- "count": 64
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
- "value": -0.006309721153229475,
54
- "min": -0.013774292543530464,
55
- "max": 0.03452916443347931,
56
- "count": 64
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
- "value": -0.06940693408250809,
60
- "min": -0.14126862585544586,
61
- "max": 0.553314208984375,
62
- "count": 64
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
- "value": -0.006794257089495659,
66
- "min": -0.01136896014213562,
67
- "max": 0.034900568425655365,
68
- "count": 64
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
- "value": -0.0747368261218071,
72
- "min": -0.14779648184776306,
73
- "max": 0.5539351105690002,
74
- "count": 64
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
- "count": 64
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
- "count": 64
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
- "value": -0.18181818181818182,
90
- "min": -0.46153846153846156,
91
- "max": 0.2861142892922674,
92
- "count": 64
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
- "value": -2.0,
96
- "min": -6.0,
97
- "max": 4.0056000500917435,
98
- "count": 64
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
- "value": -0.18181818181818182,
102
- "min": -0.46153846153846156,
103
- "max": 0.2861142892922674,
104
- "count": 64
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
- "value": -2.0,
108
- "min": -6.0,
109
- "max": 4.0056000500917435,
110
- "count": 64
111
- },
112
- "SoccerTwos.IsTraining.mean": {
113
- "value": 1.0,
114
- "min": 1.0,
115
- "max": 1.0,
116
- "count": 64
117
- },
118
- "SoccerTwos.IsTraining.sum": {
119
- "value": 1.0,
120
- "min": 1.0,
121
- "max": 1.0,
122
- "count": 64
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
- "value": 0.018384612671798094,
126
- "min": 0.010855722728107746,
127
- "max": 0.02520257059659343,
128
- "count": 29
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
- "value": 0.018384612671798094,
132
- "min": 0.010855722728107746,
133
- "max": 0.02520257059659343,
134
- "count": 29
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
- "value": 0.0012903024636519453,
138
- "min": 3.3449284804495012e-06,
139
- "max": 0.004801920638419688,
140
- "count": 29
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
- "value": 0.0012903024636519453,
144
- "min": 3.3449284804495012e-06,
145
- "max": 0.004801920638419688,
146
- "count": 29
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
- "value": 0.0012918052981452397,
150
- "min": 3.429187124008119e-06,
151
- "max": 0.00484771333479633,
152
- "count": 29
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
- "value": 0.0012918052981452397,
156
- "min": 3.429187124008119e-06,
157
- "max": 0.00484771333479633,
158
- "count": 29
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
  "value": 0.0003,
162
  "min": 0.0003,
163
  "max": 0.0003,
164
- "count": 29
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
  "value": 0.0003,
168
  "min": 0.0003,
169
  "max": 0.0003,
170
- "count": 29
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
  "value": 0.20000000000000007,
174
- "min": 0.20000000000000004,
175
  "max": 0.20000000000000007,
176
- "count": 29
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
  "value": 0.20000000000000007,
180
- "min": 0.20000000000000004,
181
  "max": 0.20000000000000007,
182
- "count": 29
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
  "value": 0.005000000000000001,
186
- "min": 0.005000000000000001,
187
  "max": 0.005000000000000001,
188
- "count": 29
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
  "value": 0.005000000000000001,
192
- "min": 0.005000000000000001,
193
  "max": 0.005000000000000001,
194
- "count": 29
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
- "start_time_seconds": "1724366390",
200
  "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
201
- "command_line_arguments": "/home/montana/miniconda3/envs/huggy/bin/mlagents-learn ./config/poca/SoccerTwos_monti-python.yaml --env=./training-envs-executables/linux/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos1 --no-graphics --force",
202
  "mlagents_version": "1.0.0",
203
  "mlagents_envs_version": "1.0.0",
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "2.3.0+cu121",
206
  "numpy_version": "1.21.2",
207
- "end_time_seconds": "1724367769"
208
  },
209
- "total": 1378.3384690340026,
210
  "count": 1,
211
- "self": 0.21425851999083534,
212
  "children": {
213
  "run_training.setup": {
214
- "total": 0.01774524900247343,
215
  "count": 1,
216
- "self": 0.01774524900247343
217
  },
218
  "TrainerController.start_learning": {
219
- "total": 1378.1064652650093,
220
  "count": 1,
221
- "self": 0.8799141031340696,
222
  "children": {
223
  "TrainerController._reset_env": {
224
- "total": 4.761846583001898,
225
- "count": 4,
226
- "self": 4.761846583001898
227
  },
228
  "TrainerController.advance": {
229
- "total": 1372.1884267508576,
230
- "count": 42697,
231
- "self": 0.9978618613968138,
232
  "children": {
233
  "env_step": {
234
- "total": 1111.4932532657403,
235
- "count": 42697,
236
- "self": 702.9615276714903,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
- "total": 407.8746179653972,
240
- "count": 42697,
241
- "self": 6.701437480456661,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
- "total": 401.17318048494053,
245
- "count": 84773,
246
- "self": 401.17318048494053
247
  }
248
  }
249
  },
250
  "workers": {
251
- "total": 0.6571076288528275,
252
- "count": 42696,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
- "total": 1375.734532308139,
257
- "count": 42696,
258
  "is_parallel": true,
259
- "self": 777.0212588943687,
260
  "children": {
261
  "run_training.setup": {
262
  "total": 0.0,
@@ -265,48 +265,48 @@
265
  "self": 0.0,
266
  "children": {
267
  "steps_from_proto": {
268
- "total": 0.0038299079897115007,
269
  "count": 2,
270
  "is_parallel": true,
271
- "self": 0.0012818250252166763,
272
  "children": {
273
  "_process_rank_one_or_two_observation": {
274
- "total": 0.0025480829644948244,
275
  "count": 8,
276
  "is_parallel": true,
277
- "self": 0.0025480829644948244
278
  }
279
  }
280
  },
281
  "UnityEnvironment.step": {
282
- "total": 0.14370961100212298,
283
  "count": 1,
284
  "is_parallel": true,
285
- "self": 0.0017833859892562032,
286
  "children": {
287
  "UnityEnvironment._generate_step_input": {
288
- "total": 0.008020116001716815,
289
  "count": 1,
290
  "is_parallel": true,
291
- "self": 0.008020116001716815
292
  },
293
  "communicator.exchange": {
294
- "total": 0.1266742670122767,
295
  "count": 1,
296
  "is_parallel": true,
297
- "self": 0.1266742670122767
298
  },
299
  "steps_from_proto": {
300
- "total": 0.0072318419988732785,
301
  "count": 2,
302
  "is_parallel": true,
303
- "self": 0.0031028410012368113,
304
  "children": {
305
  "_process_rank_one_or_two_observation": {
306
- "total": 0.004129000997636467,
307
  "count": 8,
308
  "is_parallel": true,
309
- "self": 0.004129000997636467
310
  }
311
  }
312
  }
@@ -314,53 +314,53 @@
314
  }
315
  }
316
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
317
  "UnityEnvironment.step": {
318
- "total": 598.7091519027599,
319
- "count": 42695,
320
  "is_parallel": true,
321
- "self": 19.94272614219517,
322
  "children": {
323
  "UnityEnvironment._generate_step_input": {
324
- "total": 12.824735618050909,
325
- "count": 42695,
326
  "is_parallel": true,
327
- "self": 12.824735618050909
328
  },
329
  "communicator.exchange": {
330
- "total": 503.6814929730899,
331
- "count": 42695,
332
  "is_parallel": true,
333
- "self": 503.6814929730899
334
  },
335
  "steps_from_proto": {
336
- "total": 62.26019716942392,
337
- "count": 85390,
338
  "is_parallel": true,
339
- "self": 13.469228172602016,
340
  "children": {
341
  "_process_rank_one_or_two_observation": {
342
- "total": 48.7909689968219,
343
- "count": 341560,
344
  "is_parallel": true,
345
- "self": 48.7909689968219
346
  }
347
  }
348
  }
349
  }
350
- },
351
- "steps_from_proto": {
352
- "total": 0.004121511010453105,
353
- "count": 6,
354
- "is_parallel": true,
355
- "self": 0.0009598119795555249,
356
- "children": {
357
- "_process_rank_one_or_two_observation": {
358
- "total": 0.00316169903089758,
359
- "count": 24,
360
- "is_parallel": true,
361
- "self": 0.00316169903089758
362
- }
363
- }
364
  }
365
  }
366
  }
@@ -369,31 +369,31 @@
369
  }
370
  },
371
  "trainer_advance": {
372
- "total": 259.69731162372045,
373
- "count": 42696,
374
- "self": 7.711557417947915,
375
  "children": {
376
  "process_trajectory": {
377
- "total": 92.47993407177273,
378
- "count": 42696,
379
- "self": 91.53840788676462,
380
  "children": {
381
  "RLTrainer._checkpoint": {
382
- "total": 0.9415261850081151,
383
- "count": 1,
384
- "self": 0.9415261850081151
385
  }
386
  }
387
  },
388
  "_update_policy": {
389
- "total": 159.5058201339998,
390
- "count": 30,
391
- "self": 88.51124684415117,
392
  "children": {
393
  "TorchPOCAOptimizer.update": {
394
- "total": 70.99457328984863,
395
- "count": 906,
396
- "self": 70.99457328984863
397
  }
398
  }
399
  }
@@ -402,19 +402,19 @@
402
  }
403
  },
404
  "trainer_threads": {
405
- "total": 1.167005393654108e-06,
406
  "count": 1,
407
- "self": 1.167005393654108e-06
408
  },
409
  "TrainerController._save_models": {
410
- "total": 0.27627666101034265,
411
  "count": 1,
412
- "self": 0.0014554330118699,
413
  "children": {
414
  "RLTrainer._checkpoint": {
415
- "total": 0.27482122799847275,
416
  "count": 1,
417
- "self": 0.27482122799847275
418
  }
419
  }
420
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
+ "value": 3.147171974182129,
6
+ "min": 3.0757153034210205,
7
+ "max": 3.2128803730010986,
8
+ "count": 100
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
+ "value": 32932.0078125,
12
+ "min": 7447.50390625,
13
+ "max": 158240.28125,
14
+ "count": 100
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
+ "value": 915.8333333333334,
18
+ "min": 405.90909090909093,
19
  "max": 999.0,
20
+ "count": 100
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
+ "value": 21980.0,
24
+ "min": 3700.0,
25
+ "max": 27856.0,
26
+ "count": 100
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
+ "value": 1197.294585587241,
30
+ "min": 1197.294585587241,
31
+ "max": 1213.8097241010091,
32
+ "count": 91
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
+ "value": 4789.178342348964,
36
+ "min": 2402.3416809606965,
37
+ "max": 19353.100026898544,
38
+ "count": 91
39
+ },
40
+ "SoccerTwos.IsTraining.mean": {
41
+ "value": 1.0,
42
+ "min": 1.0,
43
+ "max": 1.0,
44
+ "count": 100
45
+ },
46
+ "SoccerTwos.IsTraining.sum": {
47
+ "value": 1.0,
48
+ "min": 1.0,
49
+ "max": 1.0,
50
+ "count": 100
51
  },
52
  "SoccerTwos.Step.mean": {
53
+ "value": 1639180.0,
54
+ "min": 659202.0,
55
+ "max": 1639180.0,
56
+ "count": 99
57
  },
58
  "SoccerTwos.Step.sum": {
59
+ "value": 1639180.0,
60
+ "min": 659202.0,
61
+ "max": 1639180.0,
62
+ "count": 99
63
  },
64
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
65
+ "value": -0.015390798449516296,
66
+ "min": -0.018517760559916496,
67
+ "max": 0.016770390793681145,
68
+ "count": 99
69
  },
70
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
71
+ "value": -0.16929878294467926,
72
+ "min": -0.2552330493927002,
73
+ "max": 0.18447428941726685,
74
+ "count": 99
75
  },
76
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
77
+ "value": -0.01509619690477848,
78
+ "min": -0.018388936296105385,
79
+ "max": 0.017871476709842682,
80
+ "count": 99
81
  },
82
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
83
+ "value": -0.16605816781520844,
84
+ "min": -0.2526383399963379,
85
+ "max": 0.1965862363576889,
86
+ "count": 99
87
  },
88
  "SoccerTwos.Environment.CumulativeReward.mean": {
89
  "value": 0.0,
90
  "min": 0.0,
91
  "max": 0.0,
92
+ "count": 99
93
  },
94
  "SoccerTwos.Environment.CumulativeReward.sum": {
95
  "value": 0.0,
96
  "min": 0.0,
97
  "max": 0.0,
98
+ "count": 99
99
  },
100
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
101
+ "value": -0.36363636363636365,
102
+ "min": -0.5,
103
+ "max": 0.45713333288828534,
104
+ "count": 99
105
  },
106
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
107
+ "value": -4.0,
108
+ "min": -7.0,
109
+ "max": 8.228399991989136,
110
+ "count": 99
111
  },
112
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
113
+ "value": -0.36363636363636365,
114
+ "min": -0.5,
115
+ "max": 0.45713333288828534,
116
+ "count": 99
117
  },
118
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
119
+ "value": -4.0,
120
+ "min": -7.0,
121
+ "max": 8.228399991989136,
122
+ "count": 99
 
 
 
 
 
 
 
 
 
 
 
 
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
+ "value": 0.016261281779346368,
126
+ "min": 0.013237021410410913,
127
+ "max": 0.02583168828083823,
128
+ "count": 46
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
+ "value": 0.016261281779346368,
132
+ "min": 0.013237021410410913,
133
+ "max": 0.02583168828083823,
134
+ "count": 46
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
+ "value": 0.0046276195285220945,
138
+ "min": 0.00021013136767688786,
139
+ "max": 0.006187491274128358,
140
+ "count": 46
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
+ "value": 0.0046276195285220945,
144
+ "min": 0.00021013136767688786,
145
+ "max": 0.006187491274128358,
146
+ "count": 46
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
+ "value": 0.004642315007125338,
150
+ "min": 0.00020933844318664563,
151
+ "max": 0.006221231569846471,
152
+ "count": 46
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
+ "value": 0.004642315007125338,
156
+ "min": 0.00020933844318664563,
157
+ "max": 0.006221231569846471,
158
+ "count": 46
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
  "value": 0.0003,
162
  "min": 0.0003,
163
  "max": 0.0003,
164
+ "count": 46
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
  "value": 0.0003,
168
  "min": 0.0003,
169
  "max": 0.0003,
170
+ "count": 46
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
  "value": 0.20000000000000007,
174
+ "min": 0.2,
175
  "max": 0.20000000000000007,
176
+ "count": 46
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
  "value": 0.20000000000000007,
180
+ "min": 0.2,
181
  "max": 0.20000000000000007,
182
+ "count": 46
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
  "value": 0.005000000000000001,
186
+ "min": 0.005,
187
  "max": 0.005000000000000001,
188
+ "count": 46
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
  "value": 0.005000000000000001,
192
+ "min": 0.005,
193
  "max": 0.005000000000000001,
194
+ "count": 46
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
+ "start_time_seconds": "1724450679",
200
  "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
201
+ "command_line_arguments": "/home/montana/miniconda3/envs/huggy/bin/mlagents-learn ./config/poca/SoccerTwos_monti-python.yaml --env=./training-envs-executables/linux/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos1 --no-graphics --resume",
202
  "mlagents_version": "1.0.0",
203
  "mlagents_envs_version": "1.0.0",
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "2.3.0+cu121",
206
  "numpy_version": "1.21.2",
207
+ "end_time_seconds": "1724453053"
208
  },
209
+ "total": 2374.332812839988,
210
  "count": 1,
211
+ "self": 0.3011273759766482,
212
  "children": {
213
  "run_training.setup": {
214
+ "total": 0.023536217006039806,
215
  "count": 1,
216
+ "self": 0.023536217006039806
217
  },
218
  "TrainerController.start_learning": {
219
+ "total": 2374.0081492470053,
220
  "count": 1,
221
+ "self": 1.4943843034125166,
222
  "children": {
223
  "TrainerController._reset_env": {
224
+ "total": 5.1240192109689815,
225
+ "count": 6,
226
+ "self": 5.1240192109689815
227
  },
228
  "TrainerController.advance": {
229
+ "total": 2367.0536718156363,
230
+ "count": 64664,
231
+ "self": 1.674688027051161,
232
  "children": {
233
  "env_step": {
234
+ "total": 1924.810803599612,
235
+ "count": 64664,
236
+ "self": 1164.4117003164429,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
+ "total": 759.3363031045301,
240
+ "count": 64664,
241
+ "self": 13.485134564500186,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
+ "total": 745.8511685400299,
245
+ "count": 128325,
246
+ "self": 745.8511685400299
247
  }
248
  }
249
  },
250
  "workers": {
251
+ "total": 1.0628001786390087,
252
+ "count": 64663,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
+ "total": 2370.424527122552,
257
+ "count": 64663,
258
  "is_parallel": true,
259
+ "self": 1379.279040477617,
260
  "children": {
261
  "run_training.setup": {
262
  "total": 0.0,
 
265
  "self": 0.0,
266
  "children": {
267
  "steps_from_proto": {
268
+ "total": 0.0037540920020546764,
269
  "count": 2,
270
  "is_parallel": true,
271
+ "self": 0.0011440380185376853,
272
  "children": {
273
  "_process_rank_one_or_two_observation": {
274
+ "total": 0.002610053983516991,
275
  "count": 8,
276
  "is_parallel": true,
277
+ "self": 0.002610053983516991
278
  }
279
  }
280
  },
281
  "UnityEnvironment.step": {
282
+ "total": 0.027154524010256864,
283
  "count": 1,
284
  "is_parallel": true,
285
+ "self": 0.0004653770010918379,
286
  "children": {
287
  "UnityEnvironment._generate_step_input": {
288
+ "total": 0.0005320620111888275,
289
  "count": 1,
290
  "is_parallel": true,
291
+ "self": 0.0005320620111888275
292
  },
293
  "communicator.exchange": {
294
+ "total": 0.024583517006249167,
295
  "count": 1,
296
  "is_parallel": true,
297
+ "self": 0.024583517006249167
298
  },
299
  "steps_from_proto": {
300
+ "total": 0.0015735679917270318,
301
  "count": 2,
302
  "is_parallel": true,
303
+ "self": 0.00035226598265580833,
304
  "children": {
305
  "_process_rank_one_or_two_observation": {
306
+ "total": 0.0012213020090712234,
307
  "count": 8,
308
  "is_parallel": true,
309
+ "self": 0.0012213020090712234
310
  }
311
  }
312
  }
 
314
  }
315
  }
316
  },
317
+ "steps_from_proto": {
318
+ "total": 0.007678079025936313,
319
+ "count": 10,
320
+ "is_parallel": true,
321
+ "self": 0.0017173930536955595,
322
+ "children": {
323
+ "_process_rank_one_or_two_observation": {
324
+ "total": 0.0059606859722407535,
325
+ "count": 40,
326
+ "is_parallel": true,
327
+ "self": 0.0059606859722407535
328
+ }
329
+ }
330
+ },
331
  "UnityEnvironment.step": {
332
+ "total": 991.1378085659089,
333
+ "count": 64662,
334
  "is_parallel": true,
335
+ "self": 32.84578116021294,
336
  "children": {
337
  "UnityEnvironment._generate_step_input": {
338
+ "total": 21.35030674104928,
339
+ "count": 64662,
340
  "is_parallel": true,
341
+ "self": 21.35030674104928
342
  },
343
  "communicator.exchange": {
344
+ "total": 832.1024990279402,
345
+ "count": 64662,
346
  "is_parallel": true,
347
+ "self": 832.1024990279402
348
  },
349
  "steps_from_proto": {
350
+ "total": 104.8392216367065,
351
+ "count": 129324,
352
  "is_parallel": true,
353
+ "self": 22.7072764007753,
354
  "children": {
355
  "_process_rank_one_or_two_observation": {
356
+ "total": 82.1319452359312,
357
+ "count": 517296,
358
  "is_parallel": true,
359
+ "self": 82.1319452359312
360
  }
361
  }
362
  }
363
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
364
  }
365
  }
366
  }
 
369
  }
370
  },
371
  "trainer_advance": {
372
+ "total": 440.5681801889732,
373
+ "count": 64663,
374
+ "self": 13.549240465261391,
375
  "children": {
376
  "process_trajectory": {
377
+ "total": 163.02262107680144,
378
+ "count": 64663,
379
+ "self": 162.17994571680902,
380
  "children": {
381
  "RLTrainer._checkpoint": {
382
+ "total": 0.8426753599924268,
383
+ "count": 2,
384
+ "self": 0.8426753599924268
385
  }
386
  }
387
  },
388
  "_update_policy": {
389
+ "total": 263.99631864691037,
390
+ "count": 46,
391
+ "self": 147.70801077308715,
392
  "children": {
393
  "TorchPOCAOptimizer.update": {
394
+ "total": 116.28830787382321,
395
+ "count": 1383,
396
+ "self": 116.28830787382321
397
  }
398
  }
399
  }
 
402
  }
403
  },
404
  "trainer_threads": {
405
+ "total": 2.496992237865925e-06,
406
  "count": 1,
407
+ "self": 2.496992237865925e-06
408
  },
409
  "TrainerController._save_models": {
410
+ "total": 0.3360714199952781,
411
  "count": 1,
412
+ "self": 0.004281576999346726,
413
  "children": {
414
  "RLTrainer._checkpoint": {
415
+ "total": 0.3317898429959314,
416
  "count": 1,
417
+ "self": 0.3317898429959314
418
  }
419
  }
420
  }
run_logs/training_status.json CHANGED
@@ -18,16 +18,43 @@
18
  "auxillary_file_paths": [
19
  "results/SoccerTwos1/SoccerTwos/SoccerTwos-649402.pt"
20
  ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
21
  }
22
  ],
23
- "elo": 1205.7002450014797,
24
  "final_checkpoint": {
25
- "steps": 649402,
26
  "file_path": "results/SoccerTwos1/SoccerTwos.onnx",
27
  "reward": 0.0,
28
- "creation_time": 1724367769.0234501,
29
  "auxillary_file_paths": [
30
- "results/SoccerTwos1/SoccerTwos/SoccerTwos-649402.pt"
31
  ]
32
  }
33
  },
 
18
  "auxillary_file_paths": [
19
  "results/SoccerTwos1/SoccerTwos/SoccerTwos-649402.pt"
20
  ]
21
+ },
22
+ {
23
+ "steps": 999240,
24
+ "file_path": "results/SoccerTwos1/SoccerTwos/SoccerTwos-999240.onnx",
25
+ "reward": 0.0,
26
+ "creation_time": 1724451538.155989,
27
+ "auxillary_file_paths": [
28
+ "results/SoccerTwos1/SoccerTwos/SoccerTwos-999240.pt"
29
+ ]
30
+ },
31
+ {
32
+ "steps": 1499597,
33
+ "file_path": "results/SoccerTwos1/SoccerTwos/SoccerTwos-1499597.onnx",
34
+ "reward": 0.0,
35
+ "creation_time": 1724452736.5620186,
36
+ "auxillary_file_paths": [
37
+ "results/SoccerTwos1/SoccerTwos/SoccerTwos-1499597.pt"
38
+ ]
39
+ },
40
+ {
41
+ "steps": 1641770,
42
+ "file_path": "results/SoccerTwos1/SoccerTwos/SoccerTwos-1641770.onnx",
43
+ "reward": 0.0,
44
+ "creation_time": 1724453053.1768804,
45
+ "auxillary_file_paths": [
46
+ "results/SoccerTwos1/SoccerTwos/SoccerTwos-1641770.pt"
47
+ ]
48
  }
49
  ],
50
+ "elo": 1197.6010693474466,
51
  "final_checkpoint": {
52
+ "steps": 1641770,
53
  "file_path": "results/SoccerTwos1/SoccerTwos.onnx",
54
  "reward": 0.0,
55
+ "creation_time": 1724453053.1768804,
56
  "auxillary_file_paths": [
57
+ "results/SoccerTwos1/SoccerTwos/SoccerTwos-1641770.pt"
58
  ]
59
  }
60
  },