示例#1
0
         }
     else:
         kwargs = {
             'D': D,
             'M': M,
             'learning_rate': args.alpha,
             'F': [(1, 1)],
             'c0': c0,
             'C': [(c0, )]
         }
     graph_f = cnn.build_graph
 else:
     kwargs = {'D': D, 'M': M, 'learning_rate': args.alpha}
     graph_f = ann.build_graph
 pol = EpsilonGreedyPolicy(eps=1.0, decay_f=decay_f)
 pol.n = args.eps_start
 if args.mode == 'leaf':
     sv = tdleaf.TDLeafSupervisor(pol,
                                  mv_limit=args.move_count,
                                  depth=args.depth,
                                  y=args.gamma,
                                  l=args.lambd)
 else:
     sv = tdstem.TDStemSupervisor(pol,
                                  mv_limit=args.move_count,
                                  depth=args.depth,
                                  y=args.gamma,
                                  l=args.lambd)
 sv.run(args.I,
        args.N,
        graph_f,