add snes2 xnes2 presets, cleanup, tweaks etc.
This commit is contained in:
parent
33eeaf9c76
commit
655cb6f5b3
1 changed files with 78 additions and 10 deletions
88
config.lua
88
config.lua
|
@ -22,10 +22,10 @@ local common_cfg = {
|
||||||
init_zeros = false, -- instead of random normal noise.
|
init_zeros = false, -- instead of random normal noise.
|
||||||
|
|
||||||
-- network inputs (connections):
|
-- network inputs (connections):
|
||||||
time_inputs = true, -- binary inputs of global frame count
|
time_inputs = true, -- insert binary inputs of a frame counter.
|
||||||
|
|
||||||
-- network layers:
|
-- network layers:
|
||||||
layernorm = false,
|
layernorm = false, -- (doesn't do anything right now)
|
||||||
reduce_tiles = false,
|
reduce_tiles = false,
|
||||||
bias_out = true,
|
bias_out = true,
|
||||||
|
|
||||||
|
@ -43,6 +43,7 @@ local common_cfg = {
|
||||||
-- sampling:
|
-- sampling:
|
||||||
deviation = 1.0,
|
deviation = 1.0,
|
||||||
unperturbed_trial = true, -- perform an extra trial without any noise.
|
unperturbed_trial = true, -- perform an extra trial without any noise.
|
||||||
|
-- this is good for logging, so I'd recommend it.
|
||||||
graycode = false, -- for ARS.
|
graycode = false, -- for ARS.
|
||||||
negate_trials = true, -- try pairs of normal and negated noise directions.
|
negate_trials = true, -- try pairs of normal and negated noise directions.
|
||||||
-- AKA antithetic sampling. note that this doubles the number of trials.
|
-- AKA antithetic sampling. note that this doubles the number of trials.
|
||||||
|
@ -80,6 +81,39 @@ if preset == 'snes' then
|
||||||
sigma_decay = 0.01, -- note: multiplied by learning_rate.
|
sigma_decay = 0.01, -- note: multiplied by learning_rate.
|
||||||
}
|
}
|
||||||
|
|
||||||
|
elseif preset == 'snes2' then
|
||||||
|
|
||||||
|
cfg = {
|
||||||
|
es = 'snes',
|
||||||
|
|
||||||
|
log_fn = 'logs-snes2.csv',
|
||||||
|
params_fn = 'params-snes2.txt',
|
||||||
|
|
||||||
|
start_big = true,
|
||||||
|
min_time = 300,
|
||||||
|
timer_loser = 1.0,
|
||||||
|
|
||||||
|
score_multiplier = 0,
|
||||||
|
|
||||||
|
init_zeros = true,
|
||||||
|
|
||||||
|
reduce_tiles = true,
|
||||||
|
bias_out = false,
|
||||||
|
|
||||||
|
deterministic = false,
|
||||||
|
|
||||||
|
deviation = 0.5,
|
||||||
|
negate_trials = false,
|
||||||
|
min_refresh = 0.5,
|
||||||
|
|
||||||
|
epoch_trials = 100,
|
||||||
|
|
||||||
|
learning_rate = 0.01,
|
||||||
|
mean_adapt = 1.0,
|
||||||
|
weight_decay = 0.02,
|
||||||
|
sigma_decay = 0.01,
|
||||||
|
}
|
||||||
|
|
||||||
elseif preset == 'xnes' then
|
elseif preset == 'xnes' then
|
||||||
|
|
||||||
cfg = {
|
cfg = {
|
||||||
|
@ -92,7 +126,6 @@ elseif preset == 'xnes' then
|
||||||
min_time = 300,
|
min_time = 300,
|
||||||
timer_loser = 1.0,
|
timer_loser = 1.0,
|
||||||
|
|
||||||
decrement_reward = false,
|
|
||||||
score_multiplier = 0,
|
score_multiplier = 0,
|
||||||
|
|
||||||
init_zeros = true,
|
init_zeros = true,
|
||||||
|
@ -104,32 +137,67 @@ elseif preset == 'xnes' then
|
||||||
|
|
||||||
deviation = 0.5,
|
deviation = 0.5,
|
||||||
negate_trials = false,
|
negate_trials = false,
|
||||||
min_refresh = 0.1,
|
|
||||||
|
|
||||||
epoch_trials = 50,
|
epoch_trials = 50,
|
||||||
|
|
||||||
learning_rate = 0.01,
|
learning_rate = 0.01,
|
||||||
mean_adapt = 1.0,
|
}
|
||||||
weight_decay = 0.0,
|
|
||||||
sigma_decay = 0.0,
|
elseif preset == 'xnes2' then
|
||||||
|
|
||||||
|
cfg = {
|
||||||
|
es = 'xnes',
|
||||||
|
|
||||||
|
log_fn = 'logs-xnes2.csv',
|
||||||
|
params_fn = 'params-xnes2.txt',
|
||||||
|
|
||||||
|
start_big = true,
|
||||||
|
min_time = 300,
|
||||||
|
timer_loser = 1.0,
|
||||||
|
|
||||||
|
score_multiplier = 0,
|
||||||
|
|
||||||
|
init_zeros = true,
|
||||||
|
|
||||||
|
reduce_tiles = true,
|
||||||
|
bias_out = false,
|
||||||
|
|
||||||
|
deterministic = false,
|
||||||
|
|
||||||
|
deviation = 0.5,
|
||||||
|
negate_trials = true,
|
||||||
|
|
||||||
|
epoch_trials = 25,
|
||||||
|
|
||||||
|
learning_rate = 0.01,
|
||||||
|
mean_adapt = 0.5,
|
||||||
|
weight_decay = 0.01,
|
||||||
|
sigma_decay = 0.0016, --0.00128,
|
||||||
}
|
}
|
||||||
|
|
||||||
elseif preset == 'ars' then
|
elseif preset == 'ars' then
|
||||||
|
|
||||||
cfg = {
|
cfg = {
|
||||||
es = 'ars',
|
es = 'ars',
|
||||||
epoch_top_trials = 20,
|
epoch_top_trials = 20 * 2,
|
||||||
ars_lips = false,
|
ars_lips = false,
|
||||||
|
|
||||||
log_fn = 'logs-ars.csv',
|
log_fn = 'logs-ars.csv',
|
||||||
params_fn = 'params-ars.txt',
|
params_fn = 'params-ars.txt',
|
||||||
|
|
||||||
|
start_big = true,
|
||||||
min_time = 300,
|
min_time = 300,
|
||||||
timer_loser = 1.0,
|
timer_loser = 1.0,
|
||||||
|
|
||||||
deviation = 0.1,
|
bias_out = false,
|
||||||
|
|
||||||
epoch_trials = 25,
|
deterministic = false,
|
||||||
|
|
||||||
|
graycode = false,
|
||||||
|
deviation = 0.1,
|
||||||
|
negate_trials = false,
|
||||||
|
|
||||||
|
epoch_trials = 25 * 2,
|
||||||
|
|
||||||
learning_rate = 1.0,
|
learning_rate = 1.0,
|
||||||
weight_decay = 0.0025,
|
weight_decay = 0.0025,
|
||||||
|
|
Loading…
Add table
Reference in a new issue