tweak config

This commit is contained in:
Connor Olding 2018-05-07 16:22:02 +02:00
parent 946f05bd3e
commit e3a8a6b87f

View file

@ -26,17 +26,20 @@ local common_cfg = {
det_epsilon = false, -- take random actions with probability eps. det_epsilon = false, -- take random actions with probability eps.
layernorm = false, layernorm = false,
learning_rate = 1.0,
init_zeros = true, -- instead of he_normal noise or whatever. init_zeros = true, -- instead of he_normal noise or whatever.
graycode = false, graycode = false,
unperturbed_trial = true, -- do a trial without any noise. unperturbed_trial = true, -- do a trial without any noise.
negate_trials = true, -- try pairs of normal and negated noise directions. negate_trials = true, -- try pairs of normal and negated noise directions.
-- ^ note that this now doubles the effective trials. -- ^ note that this now doubles the effective trials.
time_inputs = true, -- binary inputs of global frame count time_inputs = true, -- binary inputs of global frame count
normalize_inputs = false,
ars_lips = false, ars_lips = false,
adamant = false, -- run steps through AMSgrad. adamant = false, -- run steps through AMSgrad.
adam_b1 = math.pow(10, -1 / 1), -- fewer trials, more momentum!
adam_b2 = math.pow(10, -1 / 50),
adam_eps = intmap(-1), -- focus on b1 rather than b2.
adam_debias = true,
cap_time = 300, cap_time = 300,
timer_loser = 1/2, timer_loser = 1/2,
@ -44,21 +47,19 @@ local common_cfg = {
} }
local cfg = { local cfg = {
-- best performance so far, albeit a bit slow to train.
-- NOTE: the original values used are kept in the trailing comments; swap them in to restore them.
log_fn = 'log.csv', -- can be nil to disable logging. log_fn = 'log.csv', -- can be nil to disable logging.
params_fn = nil, -- can be nil to generate based on param count. params_fn = nil, -- can be nil to generate based on param count.
deterministic = true,
epoch_trials = 20,
epoch_top_trials = 10,
learning_rate = 1.0,
ars_lips = true,
deviation = 0.1,
weight_decay = 0.004,
cap_time = 300,
starting_lives = 1, starting_lives = 1,
deterministic = true,
layernorm = true,
epoch_trials = 24, --20,
epoch_top_trials = 18, --10,
ars_lips = true,
deviation = 0.05, --0.1,
weight_decay = 0.0002, --0.004,
learning_rate = 2.0, --1.0
} }
-- TODO: so, uhh.. -- TODO: so, uhh..