tweak config

2018-05-07 16:22:02 +02:00 · 2018-05-07 16:22:02 +02:00 · e3a8a6b87f
commit e3a8a6b87f
parent 946f05bd3e
1 changed file with 15 additions and 14 deletions
--- a/config.lua
+++ b/config.lua
@@ -26,17 +26,20 @@ local common_cfg = {
    det_epsilon = false, -- take random actions with probability eps.
    layernorm = false,
    learning_rate = 1.0,
    init_zeros = true, -- instead of he_normal noise or whatever.
    graycode = false,
    unperturbed_trial = true, -- do a trial without any noise.
    negate_trials = true, -- try pairs of normal and negated noise directions.
    -- ^ note that this now doubles the effective trials.
    time_inputs = true, -- binary inputs of global frame count
    normalize_inputs = false,
    ars_lips = false,
    adamant = false, -- run steps through AMSgrad.
    adam_b1 = math.pow(10, -1 / 1), -- fewer trials, more momentum!
    adam_b2 = math.pow(10, -1 / 50),
    adam_eps = intmap(-1), -- focus on b1 rather than b2.
    adam_debias = true,
    cap_time = 300,
    timer_loser = 1/2,
@@ -44,21 +47,19 @@ local common_cfg = {
 }
 local cfg = {
    -- best performance so far, albeit a bit slow to train.
    -- NOTE: uncomment for original values used.
    log_fn = 'log.csv', -- can be nil to disable logging.
    params_fn = nil, -- can be nil to generate based on param count.
    deterministic = true,
    epoch_trials = 20,
    epoch_top_trials = 10,
    learning_rate = 1.0,
    ars_lips = true,
    deviation = 0.1,
    weight_decay = 0.004,
    cap_time = 300,
    starting_lives = 1,
    deterministic = true,
    layernorm = true,
    epoch_trials = 24, --20,
    epoch_top_trials = 18, --10,
    ars_lips = true,
    deviation = 0.05, --0.1,
    weight_decay = 0.0002, --0.0004,
    learning_rate = 2.0, --1.0
 }
 -- TODO: so, uhh..