|
@@ -27,8 +27,8 @@ def get_args():
|
|
|
help='value loss coefficient (default: 0.5)')
|
|
|
parser.add_argument('--seed', type=int, default=1,
|
|
|
help='random seed (default: 1)')
|
|
|
- parser.add_argument('--num-processes', type=int, default=16,
|
|
|
- help='how many training CPU processes to use (default: 16)')
|
|
|
+ parser.add_argument('--num-processes', type=int, default=32,
|
|
|
+ help='how many training CPU processes to use (default: 32)')
|
|
|
parser.add_argument('--num-steps', type=int, default=5,
|
|
|
help='number of forward steps in A2C (default: 5)')
|
|
|
parser.add_argument('--ppo-epoch', type=int, default=4,
|
|
@@ -37,8 +37,8 @@ def get_args():
|
|
|
help='number of batches for ppo (default: 32)')
|
|
|
parser.add_argument('--clip-param', type=float, default=0.2,
|
|
|
help='ppo clip parameter (default: 0.2)')
|
|
|
- parser.add_argument('--num-stack', type=int, default=4,
|
|
|
- help='number of frames to stack (default: 4)')
|
|
|
+ parser.add_argument('--num-stack', type=int, default=1,
|
|
|
+ help='number of frames to stack (default: 1)')
|
|
|
parser.add_argument('--log-interval', type=int, default=10,
|
|
|
help='log interval, one log per n updates (default: 10)')
|
|
|
parser.add_argument('--save-interval', type=int, default=100,
|