def main():
    """Entry point for the 'test_bc' run.

    Obtains the argument parser from ``framework.get_args()``, parses the
    command line into a plain dict, passes that dict through
    ``framework.load_config`` and hands the result, together with the run
    title and the ``Test`` class, to ``framework.startup``.
    """
    parser = framework.get_args()
    # vars() turns the parsed namespace into a dict keyed by option name.
    cli_options = vars(parser.parse_args())
    settings = framework.load_config(cli_options)
    framework.startup('test_bc', settings, Test)
def main():
    """Entry point for the 'test_iso' run.

    Extends the parser returned by ``framework.get_args()`` with a required
    ``--scale`` float, parses the command line into a dict, passes it through
    ``framework.load_config`` and launches via ``framework.startup`` with the
    ``Test`` class.
    """
    parser = framework.get_args()
    # --scale: amount to scale the identity matrix.
    parser.add_argument('--scale', required=True, type=float)

    cli_options = vars(parser.parse_args())
    settings = framework.load_config(cli_options)
    framework.startup('test_iso', settings, Test)
def main():
    """Entry point for the 'test_rand' run.

    Extends the parser returned by ``framework.get_args()`` with a required
    ``--trace`` float, parses the command line into a dict, passes it through
    ``framework.load_config`` and launches via ``framework.startup`` with the
    ``Test`` class.
    """
    parser = framework.get_args()
    # --trace: trace on the amount of error one expects in the learner.
    parser.add_argument('--trace', required=True, type=float)

    cli_options = vars(parser.parse_args())
    settings = framework.load_config(cli_options)
    framework.startup('test_rand', settings, Test)
def main():
    """Entry point for the 'test_dagger' run.

    Extends the parser returned by ``framework.get_args()`` with the required
    ``--update_period`` (int) and ``--beta`` (float) options, parses the
    command line into a dict, passes it through ``framework.load_config`` and
    launches via ``framework.startup`` with the ``Test`` class.
    """
    parser = framework.get_args()
    # --update_period: period between updates to the policy.
    parser.add_argument('--update_period', required=True, type=int)
    # --beta: beta term, see Ross et al.
    parser.add_argument('--beta', required=True, type=float)

    cli_options = vars(parser.parse_args())
    settings = framework.load_config(cli_options)
    framework.startup('test_dagger', settings, Test)
def main():
    """Entry point for the 'test_dart' run.

    Extends the parser returned by ``framework.get_args()`` with the required
    ``--update_period`` (int) and ``--partition`` (float) options, parses the
    command line into a dict, passes it through ``framework.load_config``,
    validates ``partition`` and launches via ``framework.startup`` with the
    ``Test`` class.

    Raises:
        ValueError: if the ``partition`` value is not strictly between 0 and 1.
    """
    title = 'test_dart'
    ap = framework.get_args()
    # Period between updates to the policy.
    ap.add_argument('--update_period', required=True, type=int)
    # Float strictly between 0 and 1 (both bounds exclusive); enforced below.
    ap.add_argument('--partition', required=True, type=float)
    args = vars(ap.parse_args())
    args = framework.load_config(args)

    # Validate with an explicit raise rather than `assert`: assert statements
    # are removed when Python runs with -O, which would silently skip the check.
    partition = args['partition']
    if not 0.0 < partition < 1.0:
        raise ValueError(
            '--partition must be strictly between 0 and 1, got {!r}'.format(
                partition))

    framework.startup(title, args, Test)