smbot/config.lua

82 lines
2.2 KiB
Lua

--- Evaluate the power-law fit (1.521 * dim - 0.521) ^ -0.5026.
-- NOTE(review): judging by the name, this presumably approximates a cosine
-- similarity as a function of dimensionality; confirm against the caller.
-- The fit evaluates to 1 at dim = 1 and shrinks as dim grows.
-- @tparam number dim input to the fit (presumably a vector dimension).
-- @treturn number the fitted value.
local function approx_cossim(dim)
    -- the ^ operator is used instead of math.pow, which is deprecated in
    -- Lua 5.3 and missing from stock 5.4; ^ works on every version.
    return (1.521 * dim - 0.521) ^ -0.5026
end
--- Map a number onto a logarithmic scale with two steps per decade.
-- Computes 10 ^ (x / 2):
--    0 -> 1.0
--   -1 -> 0.316
--   -2 -> 0.1
--   -3 -> 0.0316
--   -4 -> 0.01
--   etc.
-- @tparam number x position on the scale (the table above uses integers).
-- @treturn number 10 raised to the power x / 2.
local function intmap(x)
    -- the ^ operator is used instead of math.pow, which is deprecated in
    -- Lua 5.3 and missing from stock 5.4; ^ works on every version.
    return 10 ^ (x / 2)
end
-- Default values for every known setting. Lookups on cfg that miss fall
-- back to this table.
local common_cfg = {
    playable_mode = false,
    playback_mode = false,
    defer_prints = true,

    start_big = false,
    starting_lives = 0,
    frameskip = 4,
    cap_time = 300,
    timer_loser = 0.5,
    decrement_reward = false, -- bad idea: it encourages mario to run into goombas.

    -- a true epsilon-greedy policy has both of the following enabled.
    deterministic = false, -- take the argmax of the outputs rather than sampling randomly.
    det_epsilon = false, -- with probability eps, act randomly.

    layernorm = false,
    graycode = false,
    init_zeros = true, -- rather than he_normal noise or similar.
    time_inputs = true, -- feed in the global frame count as binary inputs.

    unperturbed_trial = true, -- include one trial with no noise applied.
    negate_trials = true, -- try each noise direction together with its negation.
    -- ^ note that this doubles the effective number of trials.
    adamant = false, -- pass steps through AMSgrad.
}
-- Settings for this run. Keys that are absent here are resolved through
-- common_cfg by the metatable installed on this table further down.
local cfg = {
    log_fn = 'log.csv', -- set to nil to turn logging off.
    params_fn = nil, -- leave nil to have a name generated from the param count.

    deterministic = true,

    epoch_trials = 20,
    epoch_top_trials = 10,

    learning_rate = 1.0,
    deviation = 0.1,
    weight_decay = 0.004,

    cap_time = 300,
    starting_lives = 1,
}
-- TODO: so, uhh..
-- what happens when playback_mode is true but unperturbed_trial is false?
-- Settings that are documented as "can be nil". Reading one of these while
-- it is unset must yield nil instead of tripping the undeclared-key check.
-- Previously only params_fn was exempt, so setting log_fn to nil (as its
-- comment allows) made every read of cfg.log_fn raise.
local nullable_cfg = { params_fn = true, log_fn = true }

-- Make cfg strict: a key missing from cfg resolves to its default in
-- common_cfg; a key known to neither table is treated as a typo and raises.
setmetatable(cfg, {
    __index = function(_, key)
        local default = common_cfg[key]
        if default ~= nil then return default end
        if nullable_cfg[key] then return nil end
        -- level 2 attributes the error to the code that read the bad key.
        error("cannot use undeclared config '" .. tostring(key) .. "'", 2)
    end
})
-- Derived settings and sanity checks, followed by the module's return value.

-- never keep more top trials than there are trials in an epoch.
cfg.epoch_top_trials = math.min(cfg.epoch_trials, cfg.epoch_top_trials)

-- eps_start scales with frameskip; eps_stop is a tenth of eps_start.
cfg.eps_start = 1.0 * cfg.frameskip / 64
cfg.eps_stop = 0.1 * cfg.eps_start
-- NOTE(review): presumably the number of frames over which eps goes from
-- eps_start to eps_stop; confirm against the code that consumes it.
cfg.eps_frames = 1000000

-- exactly one of the overlay and the network is enabled, chosen by playable_mode.
cfg.enable_overlay = cfg.playable_mode
cfg.enable_network = not cfg.playable_mode

-- ars_lips is declared in neither cfg nor common_cfg, so reading it as
-- cfg.ars_lips goes through the strict __index handler and raises
-- "cannot use undeclared config 'ars_lips'" every time this module loads.
-- Read it without the strict lookup so that an unset ars_lips counts as off.
local ars_lips = rawget(cfg, 'ars_lips')
if ars_lips == nil then ars_lips = common_cfg.ars_lips end
assert(not ars_lips or cfg.unperturbed_trial,
    "cfg.unperturbed_trial must be true to use cfg.ars_lips")

return cfg