コード例 #1
0
# Hyperparameter overrides for this run. `state` and `args` are created
# outside this snippet; the pairs below are applied to `state` one at a
# time, top to bottom, as plain attribute assignments.
_overrides = (
    ("lr", 8.2 * 1e-3),
    ("batch_size", 160),
    ("sub_mb_size", 160),
    ("max_iters", 90000),
    ("n_hids", 180),
    ("mem_nel", 120),
    ("mem_size", 28),
    ("renormalization_scale", 5.0),
    ("use_ff_controller", True),
    # The seed is the only value taken from the command-line arguments.
    ("seed", args.seed),

    ("use_gru_inp", True),
    ("use_bow_inp", False),

    ("std", 0.034),
    ("bow_size", 100),
    ("bow_weight_start", 0.64),
    ("learn_h0", False),

    ("n_reading_steps", 1),
    ("n_read_heads", 1),
    ("max_seq_len", 300),
    ("max_fact_len", 15),
    ("use_reinforce_baseline", False),
    ("use_reinforce", False),
    ("address_size", 16),
    ("path", "/rap/jvb-000-aa/data/sarath/en-10k/splitted_trainval/"),

    ("lambda1_rein", 9e-5),
    ("lambda2_rein", 1e-5),
)
for _attr, _setting in _overrides:
    setattr(state, _attr, _setting)
# Drop the temporaries so no extra names are left behind.
del _overrides, _attr, _setting
コード例 #2
0
# Build the configuration object for this run. `DD` and `np` are brought
# into scope outside this snippet; the attributes set below are presumably
# read by the training code that receives `state` -- confirm the names
# against that consumer before renaming anything.
state = DD()

state.lr = 3e-3
state.batch_size = 160
state.sub_mb_size = 160
state.max_iters = 40000
state.n_hids = 240
state.mem_nel = 150
state.mem_size = 28
state.renormalization_scale = 5.0
state.bowout = True
state.use_ff_controller = False
# NOTE: `std` was previously assigned twice in this block (0.05, then 0.01).
# Only the later value ever took effect, so the overwritten assignment was
# removed; the effective value is unchanged.
state.std = 0.01
state.bow_size = 80
state.n_reading_steps = 1
state.n_read_heads = 1
state.max_seq_len = 300
state.max_fact_len = 15
state.use_reinforce_baseline = False
state.use_reinforce = True
state.debug = False
state.address_size = 24
state.path = "/scratch/jvb-000-aa/gulcehre/tasks_1-20_v1-2/en-10k/"
state.lambda1_rein = 3e-5
state.lambda2_rein = 1e-5
# No special function mode by default. The original author left
# NanGuardMode(nan_is_error=True, inf_is_error=True) here as the
# alternative value, presumably for tracking down NaN/Inf values.
state.theano_function_mode = None
state.print_every = 50

# Fixed seed (assuming `np` is NumPy, this seeds its global random generator).
np.random.seed(3)