Beispiel #1
0
def rmpyl_icaps14():
    """
    Build the example from (Santana & Williams, ICAPS14).

    The program is a single 'transport-choice' decision over 'Bike', 'Car'
    and 'Stay' (utilities 100, 70 and 0). The first two options lead to a
    probabilistic observation ('slip' and 'accident', respectively) with two
    alternative sub-programs each; the last one is a single '(stay)' episode.
    An overall controllable temporal constraint with bounds [0.0, 30.0] is
    added before the program is returned.

    Returns:
        The assembled RMPyL program.
    """
    def timed(action, lb, ub):
        # Every episode gets its own freshly built duration dict.
        return Episode(action=action,
                       duration={'ctype': 'controllable', 'lb': lb, 'ub': ub})

    prog = RMPyL()

    # Sub-programs of the 'slip' observation (listed in domain order).
    ride_then_change = prog.sequence(timed('(ride-bike)', 15, 25),
                                     timed('(change)', 20, 30))
    bike_option = prog.observe(
        {'name': 'slip', 'domain': [True, False],
         'ctype': 'probabilistic', 'probability': [0.051, 1.0 - 0.051]},
        ride_then_change,
        timed('(ride-bike)', 15, 25))

    # Sub-programs of the 'accident' observation (listed in domain order).
    tow_then_cab = prog.sequence(timed('(tow-vehicle)', 30, 90),
                                 timed('(cab-ride)', 10, 20))
    car_option = prog.observe(
        {'name': 'accident', 'domain': [True, False],
         'ctype': 'probabilistic', 'probability': [0.013, 1.0 - 0.013]},
        tow_then_cab,
        timed('(drive)', 10, 20))

    stay_option = Episode(action='(stay)')

    prog *= prog.decide(
        {'name': 'transport-choice', 'domain': ['Bike', 'Car', 'Stay'],
         'utility': [100, 70, 0]},
        bike_option,
        car_option,
        stay_option)

    prog.add_overall_temporal_constraint(ctype='controllable', lb=0.0, ub=30.0)
    return prog
Beispiel #2
0
def rmpyl_nested_uav():
    """
    Build a UAV example with decisions nested inside observations.

    Both vehicles scan first. A 'UAV-choice' decision (utilities 7 and 5) then
    selects one vehicle's branch: the vehicle flies, and a probabilistic
    'Success'/'Failure' observation leads to a single-option decision
    (utility 10 or 0) wrapping the vehicle's stop() result.

    Returns:
        The RMPyL program with its ``plan`` attribute set.
    """
    hello = UAV('hello')
    uav = UAV('uav')

    prog = RMPyL()

    def fly_and_assess(vehicle, tag, outcome_probs):
        # Build order matters for reproducibility: fly, success, failure.
        flight = vehicle.fly()
        on_success = prog.decide(
            {
                'name': tag + '-assert-success',
                'domain': ['Success'],
                'utility': [10]
            }, vehicle.stop())
        on_failure = prog.decide(
            {
                'name': tag + '-assert-failure',
                'domain': ['Failure'],
                'utility': [0]
            }, vehicle.stop())
        outcome = prog.observe(
            {
                'name': tag + '-success',
                'domain': ['Success', 'Failure'],
                'ctype': 'probabilistic',
                'probability': outcome_probs
            }, on_success, on_failure)
        return prog.sequence(flight, outcome)

    hello_scan = hello.scan()
    uav_scan = uav.scan()
    hello_branch = fly_and_assess(hello, 'hello', [0.8, 0.2])
    uav_branch = fly_and_assess(uav, 'uav', [0.95, 0.05])

    vehicle_choice = prog.decide(
        {
            'name': 'UAV-choice',
            'domain': ['Hello', 'UAV'],
            'utility': [7, 5]
        }, hello_branch, uav_branch)

    prog.plan = prog.sequence(hello_scan, uav_scan, vehicle_choice)
    return prog
Beispiel #3
0
def rmpyl_original_verbose(hello,uav):
    """
    Verbose-syntax implementation of the original RMPL program below, with an
    additional chance constraint (risk 0.1) placed on the overall temporal
    constraint [0.0, 18.0].

    ##### Original RMPL

    class UAV {
        value on;
        value off;

        primitive method fly() [3,10];
        primitive method scan() [1,10];
    }

    class Main {
      UAV helo;
      UAV uav;

      method run () {
        [0, 18] sequence {
            parallel {
                sequence {
                    helo.scan();
                    helo.fly();
                }
                sequence {
                    uav.fly();
                    uav.scan();
                }
            }
            choose {
                with reward: 5 {helo.fly();}
                with reward: 7 {uav.fly();}
            }
        }
      }
    }

    Args:
        hello: Object providing scan() and fly() (the "helo" of the RMPL).
        uav: Object providing scan() and fly().

    Returns:
        The RMPyL program with plan, temporal and chance constraints set.
    """
    prog = RMPyL()

    # The two legs that run in parallel.
    hello_leg = prog.sequence(hello.scan(), hello.fly())
    uav_leg = prog.sequence(uav.fly(), uav.scan())
    both_legs = prog.parallel(hello_leg, uav_leg)

    # Final choice between one more flight of either vehicle.
    final_flight = prog.decide(
        {'name': 'UAV-choice', 'domain': ['Hello', 'UAV'], 'utility': [5, 7]},
        hello.fly(),
        uav.fly())

    prog.plan = prog.sequence(both_legs, final_flight)

    makespan_tc = prog.add_overall_temporal_constraint(
        ctype='controllable', lb=0.0, ub=18.0)
    prog.add_chance_constraint(
        ChanceConstraint(constraint_scope=[makespan_tc], risk=0.1))
    return prog
def nominal_case(blocks, time_window=-1, dur_dict=None):
    """
    Nominal case, where the robot observes what the human has already
    completed, and acts accordingly.

    The program first runs say('Should I start?'), then a probabilistic
    'ask-human' observation over 'YES'/'NO' (probabilities 0.9/0.1) whose
    sub-programs are the result of observe_decide_act(...) and
    say('All done!'), in that order.

    Args:
        blocks: Forwarded unchanged to observe_decide_act.
        time_window: Upper bound of the overall temporal constraint; the
            constraint is only added when this value is greater than 0.0.
        dur_dict: Forwarded unchanged to observe_decide_act.

    Returns:
        The assembled RMPyL program.
    """
    prog = RMPyL(name='run()')

    opening = say('Should I start?')
    ask_human = {
        'name': 'ask-human',
        'ctype': 'probabilistic',
        'domain': ['YES', 'NO'],
        'probability': [0.9, 0.1]
    }
    # Arguments after `blocks` are the manipulator and the agent names.
    assembly = observe_decide_act(prog, blocks, 'BaxterRight', 'Baxter',
                                  dur_dict)
    closing = say('All done!')

    prog *= prog.sequence(opening, prog.observe(ask_human, assembly, closing))

    if time_window > 0.0:
        prog.add_overall_temporal_constraint(
            ctype='controllable', lb=0.0, ub=time_window)

    return prog
Beispiel #5
0
def rmpyl_parallel_uav():
    """
    Build a UAV example with two parallel tracks of repeated decisions.

    Each vehicle gets a sequence of three identically named 'Fly'/'Scan'
    decisions (utilities 0 and 1); the two sequences run in parallel.

    Returns:
        The RMPyL program with its ``plan`` attribute set.
    """
    hello = UAV('hello')
    uav = UAV('uav')

    prog = RMPyL()

    def action_choices(vehicle, choice_name, repeats=3):
        # Each decision gets fresh fly()/scan() results and a fresh dict.
        return [
            prog.decide(
                {
                    'name': choice_name,
                    'domain': ['Fly', 'Scan'],
                    'utility': [0, 1]
                }, vehicle.fly(), vehicle.scan())
            for _ in range(repeats)
        ]

    hello_track = prog.sequence(*action_choices(hello, 'hello-action'))
    uav_track = prog.sequence(*action_choices(uav, 'uav-action'))

    prog.plan = prog.parallel(hello_track, uav_track)
    return prog
Beispiel #6
0
def rmpyl_nested_uav():
    """
    Build a UAV example with decisions nested inside observations.

    After both vehicles scan, a 'UAV-choice' decision (utilities 7 and 5)
    picks a vehicle branch. Each branch is fly() followed by a probabilistic
    'Success'/'Failure' observation, whose two sub-programs are single-option
    decisions (utility 10 and 0) around the vehicle's stop() result.

    Returns:
        The RMPyL program with its ``plan`` attribute set.
    """
    hello = UAV('hello')
    uav = UAV('uav')

    prog = RMPyL()

    steps = [hello.scan(), uav.scan()]

    # (vehicle, name prefix, [P(Success), P(Failure)])
    fleet = ((hello, 'hello', [0.8, 0.2]),
             (uav, 'uav', [0.95, 0.05]))

    branches = []
    for vehicle, tag, odds in fleet:
        flight = vehicle.fly()

        assertions = []
        for outcome, reward in (('Success', 10), ('Failure', 0)):
            assertions.append(prog.decide(
                {'name': '%s-assert-%s' % (tag, outcome.lower()),
                 'domain': [outcome],
                 'utility': [reward]},
                vehicle.stop()))

        outcome_check = prog.observe(
            {'name': '%s-success' % tag, 'domain': ['Success', 'Failure'],
             'ctype': 'probabilistic', 'probability': odds},
            *assertions)
        branches.append(prog.sequence(flight, outcome_check))

    steps.append(prog.decide(
        {'name': 'UAV-choice', 'domain': ['Hello', 'UAV'],
         'utility': [7, 5]},
        *branches))

    prog.plan = prog.sequence(*steps)
    return prog
Beispiel #7
0
def rmpyl_episode_ids(hello,uav):
    """
    Example of how episode IDs can be used to retrieve episodes.

    Two scan-then-fly sequences are created per vehicle, each with an explicit
    ID, and combined into one parallel program. Two extra temporal constraints
    are then attached between sequences that are looked up by ID.

    Args:
        hello: Object providing scan() and fly().
        uav: Object providing scan() and fly().

    Returns:
        The assembled RMPyL program.
    """
    prog = RMPyL()

    # UAV sequences are built before the hello ones, two per vehicle.
    legs = {}
    for tag, vehicle in (('uav', uav), ('hello', hello)):
        legs[tag] = [
            prog.sequence(vehicle.scan(), vehicle.fly(),
                          id='%s-%d-seq' % (tag, number))
            for number in (1, 2)
        ]

    prog *= prog.parallel(prog.sequence(*legs['uav'], id='uav-seqs'),
                          prog.sequence(*legs['hello'], id='hello-seqs'),
                          id='par-seqs')

    def end_to_start(from_id, to_id, lb, ub):
        # Using the sequence objects directly would be simpler; the lookups
        # are here on purpose, to show how episodes are retrieved by ID.
        return TemporalConstraint(start=prog.episode_by_id(from_id).end,
                                  end=prog.episode_by_id(to_id).start,
                                  ctype='controllable', lb=lb, ub=ub)

    cross_constraints = [
        end_to_start('uav-1-seq', 'hello-2-seq', 2.0, 3.0),
        end_to_start('hello-1-seq', 'uav-2-seq', 0.5, 1.0),
    ]
    for constraint in cross_constraints:
        prog.add_temporal_constraint(constraint)

    return prog
Beispiel #8
0
def pysat_planner(dom_file,prob_file,max_steps,duration_func):
    """
    Uses PySAT as the planner and wraps the first plan found in an RMPyL
    program consisting of one episode per plan operator, in sequence.

    Args:
        dom_file: Domain file, passed to PySAT and model_parser.
        prob_file: Problem file, passed to PySAT and model_parser.
        max_steps: Number of steps PySAT precomputes and plans over.
        duration_func: Optional callable mapping an operator to the value
            used as its episode's ``duration``. When None, episodes are
            created without an explicit duration.

    Returns:
        A dict with keys 'policy', 'explicit' and 'performance' (all None)
        and 'rmpyl', which holds the RMPyL program or None if no plan was
        found.
    """
    py_sat = PySAT(dom_file,prob_file,precompute_steps=max_steps,remove_static=True,
                   write_dimacs=False,verbose=True)

    # Only the task is used below; the parsed domain and problem are dropped.
    _, _, task = model_parser(dom_file,prob_file,remove_static=True)

    print('\n##### Determining optimal plan length!\n')
    start = time.time()
    # Number of goals not already in the initial state, handed to the
    # planner as the minimum number of steps to consider.
    min_steps = len(task.goals-task.initial_state)
    plans = py_sat.plan(task.initial_state,task.goals,time_steps=max_steps,
                        find_shortest=True,min_steps=min_steps)
    elapsed = time.time()-start
    print('\n##### All solving took %.4f s'%(elapsed))

    prog = None
    if plans:
        plan = plans[0]
        print('\n##### Plan found!\n')
        for t,action in enumerate(plan):
            print('%d: %s'%(t,action))

        prog = RMPyL(name='run()')
        episodes = []
        for op in plan:
            episode_args = {'start': Event(name='start-of-'+op),
                            'end': Event(name='end-of-'+op),
                            'action': op}
            # Leave `duration` out entirely when no model was supplied, so
            # that Episode falls back to its own default.
            if duration_func is not None:
                episode_args['duration'] = duration_func(op)
            episodes.append(Episode(**episode_args))
        prog.plan = prog.sequence(*episodes)

    return {'policy':None,'explicit':None,'performance':None,'rmpyl':prog}
Beispiel #9
0
def rmpyl_parallel_uav():
    """
    Build a UAV example with two parallel tracks of repeated decisions.

    For each vehicle, three 'Fly'/'Scan' decisions (utilities 0 and 1, all
    sharing the name '<vehicle>-action') are chained in a sequence. The two
    sequences are then composed in parallel.

    Returns:
        The RMPyL program with its ``plan`` attribute set.
    """
    fleet = [('hello', UAV('hello')), ('uav', UAV('uav'))]

    prog = RMPyL()

    tracks = []
    for tag, vehicle in fleet:
        picks = []
        for _ in range(3):
            picks.append(
                prog.decide({'name': tag + '-action',
                             'domain': ['Fly', 'Scan'],
                             'utility': [0, 1]},
                            vehicle.fly(),
                            vehicle.scan()))
        tracks.append(prog.sequence(*picks))

    prog.plan = prog.parallel(*tracks)
    return prog
Beispiel #10
0
def nominal_case(blocks):
    """
    Nominal case, where the robot observes what the human has already
    completed, and acts accordingly.

    The program runs say('Should I start?') and then an uncontrollable
    'YES'/'NO' observation named after the number of blocks, whose
    sub-programs are observe_and_act(...) and say('All done!'), in that order.

    Args:
        blocks: Sized collection forwarded to observe_and_act.

    Returns:
        The assembled RMPyL program.
    """
    prog = RMPyL(name='run()')

    opening = say('Should I start?')

    # Built before observe_and_act runs, so the name reflects the number of
    # blocks at this point.
    human_reply = {'name': 'observe-human-%d' % (len(blocks)),
                   'ctype': 'uncontrollable',
                   'domain': ['YES', 'NO']}

    # Arguments after `blocks` are the manipulator and the agent names.
    work = observe_and_act(prog, blocks, 'BaxterRight', 'Baxter')
    closing = say('All done!')

    prog *= prog.sequence(opening, prog.observe(human_reply, work, closing))
    return prog
Beispiel #11
0
def rmpyl_uav():
    """
    Build a sequential UAV example ending in a choice of vehicle.

    The plan is hello.scan(), hello.fly(), uav.fly(), uav.scan(), followed by
    a 'UAV-choice' decision (utilities 5 and 7) between one more flight of
    either vehicle. The overall temporal constraint is [0.0, 18.0].

    Returns:
        The RMPyL program with plan and overall temporal constraint set.
    """
    hello = UAV('hello')
    uav = UAV('uav')

    prog = RMPyL()

    steps = [hello.scan(), hello.fly(), uav.fly(), uav.scan()]
    steps.append(
        prog.decide(
            {
                'name': 'UAV-choice',
                'domain': ['Hello', 'UAV'],
                'utility': [5, 7]
            }, hello.fly(), uav.fly()))
    prog.plan = prog.sequence(*steps)

    prog.add_overall_temporal_constraint(ctype='controllable', lb=0.0, ub=18.0)
    return prog
Beispiel #12
0
def rmpyl_uav():
    """
    Build a sequential UAV example ending in a choice of vehicle.

    Four fixed steps (hello scans and flies, uav flies and scans) are
    followed by a 'UAV-choice' decision with utilities 5 ('Hello') and
    7 ('UAV'). An overall controllable temporal constraint with bounds
    [0.0, 18.0] is added.

    Returns:
        The RMPyL program with plan and overall temporal constraint set.
    """
    hello = UAV('hello')
    uav = UAV('uav')

    prog = RMPyL()

    hello_scan = hello.scan()
    hello_flight = hello.fly()
    uav_flight = uav.fly()
    uav_scan = uav.scan()

    last_flight = prog.decide(
        {'name': 'UAV-choice', 'domain': ['Hello', 'UAV'],
         'utility': [5, 7]},
        hello.fly(),
        uav.fly())

    prog.plan = prog.sequence(hello_scan, hello_flight, uav_flight, uav_scan,
                              last_flight)

    prog.add_overall_temporal_constraint(ctype='controllable',
                                         lb=0.0, ub=18.0)
    return prog
Beispiel #13
0
def nominal_case(blocks,time_window=-1,dur_dict=None):
    """
    Nominal case, where the robot observes what the human has already
    completed, and acts accordingly.

    Args:
        blocks: Forwarded unchanged to observe_decide_act.
        time_window: Upper bound for the overall temporal constraint, which
            is added only if this value is greater than 0.0.
        dur_dict: Forwarded unchanged to observe_decide_act.

    Returns:
        The RMPyL program: say('Should I start?') followed by a probabilistic
        'ask-human' observation ('YES' 0.9 / 'NO' 0.1) over the
        observe_decide_act(...) sub-program and say('All done!').
    """
    manip, agent = 'BaxterRight', 'Baxter'

    prog = RMPyL(name='run()')

    steps = [say('Should I start?')]
    steps.append(
        prog.observe(
            {'name': 'ask-human',
             'ctype': 'probabilistic',
             'domain': ['YES', 'NO'],
             'probability': [0.9, 0.1]},
            observe_decide_act(prog, blocks, manip, agent, dur_dict),
            say('All done!')))
    prog *= prog.sequence(*steps)

    if time_window > 0.0:
        prog.add_overall_temporal_constraint(ctype='controllable',
                                             lb=0.0,
                                             ub=time_window)

    return prog
Beispiel #14
0
        for t, op in enumerate(plan):
            print('%d: %s' % (t, op))

        elapsed = time.time() - start
        print('\n##### All solving took %.4f s' % (elapsed))

        prog = RMPyL(name='run()')
        pddl_episodes = [
            Episode(id=make_episode_id(t, op),
                    start=Event(name='start-of-%d-%s' % (t, op)),
                    end=Event(name='end-of-%d-%s' % (t, op)),
                    action=op,
                    duration=rss_duration_model_func(op))
            for t, op in enumerate(plan)
        ]
        prog.plan = prog.sequence(*pddl_episodes)
        # prog.add_overall_temporal_constraint(ctype='controllable',lb=0.0,ub=2000.0)
        #Adds temporal window to the plan
        for t, op in enumerate(plan):
            bounds, tc_type = rss_time_window_model_func(op)
            for tc in time_window_constraints(
                    tc_type, bounds, prog.first_event,
                    prog.episode_by_id(make_episode_id(t, op))):
                prog.add_temporal_constraint(tc)

        #Dummy episodes that enable transmissions
        activation_episodes = []
        activation_tcs = []
        global_start = Event(name='global-start')

        for op_name, op_param_dict in time_windows['time_windows'].items():
Beispiel #15
0
start = time.time()
sat_plans = py_sat.plan(task.initial_state, task.goals, time_steps=18)
elapsed = time.time() - start
print('\n##### All solving took %.4f s' % (elapsed))

if len(sat_plans) > 0:
    plan = sat_plans[0]
    print('\n##### Plan found!\n')
    for t, action in enumerate(plan):
        print('%d: %s' % (t, action))

    prog = RMPyL(name='run()')
    prog.plan = prog.sequence(*[
        Episode(start=Event(name='start-of-' + op),
                end=Event(name='end-of-' + op),
                action=op,
                duration=rss_duration_func(op)) for op in plan
    ])
    prog.add_overall_temporal_constraint(ctype='controllable',
                                         lb=0.0,
                                         ub=2000.0)
    prog.to_ptpn(filename='rss_pysat_before_stnu_reform.tpn')

    paris = PARIS()
    risk_bound, sc_sched = paris.stnu_reformulation(prog,
                                                    makespan=True,
                                                    cc=0.001)
    if risk_bound != None:
        risk_bound = min(risk_bound, 1.0)
        print(
            '\nSuccessfully performed STNU reformulation with scheduling risk %f %%!'
Beispiel #16
0
def rmpyl_breakfast():
    """
    Build the breakfast example from (Levine & Williams, ICAPS14).

    The program is a sequence of four stages: two parallel stages pairing an
    uncontrollable observation of Alice with a robot decision, each followed
    by an uncontrollable observation of what Alice prepares. Extra temporal
    constraints tie the start of the parallel stages' children to the start
    of their parent, the overall program is bounded by [0.0, 7.0], and
    temporal constraints are simplified before returning.

    Returns:
        The assembled RMPyL program.
    """
    def timed(action, lb, ub):
        # One fresh controllable-duration episode per call.
        return Episode(action=action,
                       duration={'ctype': 'controllable', 'lb': lb, 'ub': ub})

    # Actions that Alice performs
    take_mug = timed('(get alice mug)', 0.5, 1.0)
    take_glass = timed('(get alice glass)', 0.5, 1.0)

    make_coffee = timed('(make-coffee alice)', 3.0, 5.0)
    pour_coffee = timed('(pour-coffee alice mug)', 0.5, 1.0)
    pour_juice = timed('(pour-juice alice glass)', 0.5, 1.0)

    take_bagel = timed('(get alice bagel)', 0.5, 1.0)
    take_cereal = timed('(get alice cereal)', 0.5, 1.0)

    toast_bagel = timed('(toast alice bagel)', 3.0, 5.0)
    add_cheese = timed('(add-cheese alice bagel)', 1.0, 2.0)
    mix_cereal = timed('(mix-cereal alice milk)', 1.0, 2.0)

    # Actions that the robot performs
    fetch_grounds = timed('(get grounds robot)', 0.5, 1.0)
    fetch_juice = timed('(get juice robot)', 0.5, 1.0)
    fetch_milk = timed('(get milk robot)', 0.5, 1.0)
    fetch_cheese = timed('(get cheese robot)', 0.5, 1.0)

    prog = RMPyL()

    # Stage 1: Alice picks a utensil while the robot fetches an ingredient.
    utensil = prog.observe(
        {'name': 'observe-utensil', 'domain': ['Mug', 'Glass'],
         'ctype': 'uncontrollable'},
        take_mug, take_glass,
        id='observe-utensil-ep')
    beverage_ingredient = prog.decide(
        {'name': 'choose-beverage-ingredient',
         'domain': ['Grounds', 'Juice'], 'utility': [0, 0]},
        fetch_grounds, fetch_juice,
        id='choose-beverage-ingredient-ep')
    drink_setup = prog.parallel(utensil, beverage_ingredient)

    # Stage 2: Alice prepares her drink.
    drink = prog.observe(
        {'name': 'observe-alice-drink', 'domain': ['Coffee', 'Juice'],
         'ctype': 'uncontrollable'},
        prog.sequence(make_coffee, pour_coffee),
        pour_juice,
        id='observe-alice-drink-ep')

    # Stage 3: Alice picks her food while the robot fetches an ingredient.
    food = prog.observe(
        {'name': 'observe-food', 'domain': ['Bagel', 'Cereal'],
         'ctype': 'uncontrollable'},
        take_bagel, take_cereal,
        id='observe-food-ep')
    food_ingredient = prog.decide(
        {'name': 'choose-food-ingredient',
         'domain': ['Milk', 'Cheese'], 'utility': [0, 0]},
        fetch_milk, fetch_cheese,
        id='choose-food-ingredient-ep')
    food_setup = prog.parallel(food, food_ingredient, id='parallel-food-ep')

    # Stage 4: Alice prepares her food.
    meal = prog.observe(
        {'name': 'observe-alice-food', 'domain': ['Bagel', 'Cereal'],
         'ctype': 'uncontrollable'},
        prog.sequence(toast_bagel, add_cheese),
        mix_cereal)

    prog *= prog.sequence(drink_setup, drink, food_setup, meal,
                          id='breakfast-sequence')

    def start_offset(parent_id, child_id, lb, ub):
        # Constrains the delay between the starts of two episodes.
        return TemporalConstraint(start=prog.episode_by_id(parent_id).start,
                                  end=prog.episode_by_id(child_id).start,
                                  ctype='controllable', lb=lb, ub=ub)

    extra_tcs = [
        start_offset('breakfast-sequence', 'observe-utensil-ep', 0.0, 0.0),
        start_offset('breakfast-sequence', 'choose-beverage-ingredient-ep',
                     0.2, 0.3),
        start_offset('parallel-food-ep', 'observe-food-ep', 0.0, 0.0),
        start_offset('parallel-food-ep', 'choose-food-ingredient-ep',
                     0.2, 0.3),
    ]
    for constraint in extra_tcs:
        prog.add_temporal_constraint(constraint)

    prog.add_overall_temporal_constraint(ctype='controllable', lb=0.0, ub=7.0)
    prog.simplify_temporal_constraints()

    return prog
Beispiel #17
0
def rmpyl_breakfast():
    """
    Build the breakfast example from (Levine & Williams, ICAPS14).

    Fourteen controllable-duration episodes (ten for Alice, four for the
    robot) are combined into a four-stage sequence of observations and
    decisions. Four extra temporal constraints relate episode start events
    looked up by ID, the whole program is bounded by [0.0, 7.0], and temporal
    constraints are simplified before returning.

    Returns:
        The assembled RMPyL program.
    """
    # (key, action, lower bound, upper bound); episodes are created in
    # exactly this order.
    catalog = (
        # Actions that Alice performs
        ('mug', '(get alice mug)', 0.5, 1.0),
        ('glass', '(get alice glass)', 0.5, 1.0),
        ('make_coffee', '(make-coffee alice)', 3.0, 5.0),
        ('pour_coffee', '(pour-coffee alice mug)', 0.5, 1.0),
        ('pour_juice', '(pour-juice alice glass)', 0.5, 1.0),
        ('bagel', '(get alice bagel)', 0.5, 1.0),
        ('cereal', '(get alice cereal)', 0.5, 1.0),
        ('toast', '(toast alice bagel)', 3.0, 5.0),
        ('add_cheese', '(add-cheese alice bagel)', 1.0, 2.0),
        ('mix_cereal', '(mix-cereal alice milk)', 1.0, 2.0),
        # Actions that the robot performs
        ('grounds', '(get grounds robot)', 0.5, 1.0),
        ('juice', '(get juice robot)', 0.5, 1.0),
        ('milk', '(get milk robot)', 0.5, 1.0),
        ('cheese', '(get cheese robot)', 0.5, 1.0),
    )
    ep = {}
    for key, action, lb, ub in catalog:
        ep[key] = Episode(action=action,
                          duration={
                              'ctype': 'controllable',
                              'lb': lb,
                              'ub': ub
                          })

    prog = RMPyL()

    stages = []

    # Utensil observation in parallel with the beverage-ingredient decision.
    stages.append(
        prog.parallel(
            prog.observe(
                {
                    'name': 'observe-utensil',
                    'domain': ['Mug', 'Glass'],
                    'ctype': 'uncontrollable'
                },
                ep['mug'],
                ep['glass'],
                id='observe-utensil-ep'),
            prog.decide(
                {
                    'name': 'choose-beverage-ingredient',
                    'domain': ['Grounds', 'Juice'],
                    'utility': [0, 0]
                },
                ep['grounds'],
                ep['juice'],
                id='choose-beverage-ingredient-ep')))

    # Drink preparation.
    stages.append(
        prog.observe(
            {
                'name': 'observe-alice-drink',
                'domain': ['Coffee', 'Juice'],
                'ctype': 'uncontrollable'
            },
            prog.sequence(ep['make_coffee'], ep['pour_coffee']),
            ep['pour_juice'],
            id='observe-alice-drink-ep'))

    # Food observation in parallel with the food-ingredient decision.
    stages.append(
        prog.parallel(
            prog.observe(
                {
                    'name': 'observe-food',
                    'domain': ['Bagel', 'Cereal'],
                    'ctype': 'uncontrollable'
                },
                ep['bagel'],
                ep['cereal'],
                id='observe-food-ep'),
            prog.decide(
                {
                    'name': 'choose-food-ingredient',
                    'domain': ['Milk', 'Cheese'],
                    'utility': [0, 0]
                },
                ep['milk'],
                ep['cheese'],
                id='choose-food-ingredient-ep'),
            id='parallel-food-ep'))

    # Food preparation.
    stages.append(
        prog.observe(
            {
                'name': 'observe-alice-food',
                'domain': ['Bagel', 'Cereal'],
                'ctype': 'uncontrollable'
            },
            prog.sequence(ep['toast'], ep['add_cheese']),
            ep['mix_cereal']))

    prog *= prog.sequence(*stages, id='breakfast-sequence')

    # (parent ID, child ID, lb, ub): bounds on child start minus parent start.
    start_offsets = (
        ('breakfast-sequence', 'observe-utensil-ep', 0.0, 0.0),
        ('breakfast-sequence', 'choose-beverage-ingredient-ep', 0.2, 0.3),
        ('parallel-food-ep', 'observe-food-ep', 0.0, 0.0),
        ('parallel-food-ep', 'choose-food-ingredient-ep', 0.2, 0.3),
    )
    extra_tcs = [
        TemporalConstraint(start=prog.episode_by_id(parent_id).start,
                           end=prog.episode_by_id(child_id).start,
                           ctype='controllable',
                           lb=lb,
                           ub=ub)
        for parent_id, child_id, lb, ub in start_offsets
    ]

    for constraint in extra_tcs:
        prog.add_temporal_constraint(constraint)

    prog.add_overall_temporal_constraint(ctype='controllable', lb=0.0, ub=7.0)
    prog.simplify_temporal_constraints()

    return prog
Beispiel #18
0
def rmpyl_simple_verbose(hello,uav):
    """
    Simple RMPyL example using verbose syntax.

    Both vehicles scan one after the other, then fly in parallel.

    Args:
        hello: Object providing scan() and fly().
        uav: Object providing scan() and fly().

    Returns:
        The assembled RMPyL program.
    """
    prog = RMPyL()

    hello_scan = hello.scan()
    uav_scan = uav.scan()
    joint_flight = prog.parallel(hello.fly(), uav.fly())

    prog *= prog.sequence(hello_scan, uav_scan, joint_flight)
    return prog
Beispiel #19
0
        """
        return Episode(duration={'ctype':'controllable','lb':5,'ub':30},
                       action='(relay %s)'%(self.name))

# Named waypoints; presumably (x, y) coordinates -- TODO confirm frame/units.
loc = {
    'start': (8.751, -8.625),
    'minerals': (0.0, -10.0),
    'funny_rock': (-5.0, -2.0),
    'relay': (0.0, 0.0),
    'alien_lair': (0.0, 10.0),
}


rov1 = Rover(name='spirit')

# name='run()' is a requirement for Enterprise at the moment.
prog = RMPyL(name='run()')

# The rover visits the waypoints in this order; one go_to per consecutive
# pair, each with a risk of 0.01.
_route = ('start', 'minerals', 'funny_rock', 'alien_lair', 'relay')
_legs = [rov1.go_to(start=loc[src], goal=loc[dst], risk=0.01)
         for src, dst in zip(_route[:-1], _route[1:])]
prog *= prog.sequence(*_legs)

# Chance constraint (risk 0.1) over the overall [0.0, 2000.0] time bound.
tc = prog.add_overall_temporal_constraint(ctype='controllable',
                                          lb=0.0, ub=2000.0)
cc_time = ChanceConstraint(constraint_scope=[tc], risk=0.1)
prog.add_chance_constraint(cc_time)

# Option to export the RMPyL program to an Enterprise-compliant TPN.
prog.to_ptpn(filename='picard_rovers_rmpyl.tpn')

# Writes RMPyL program to pickle file.
with open('picard_rovers_rmpyl.pickle', 'wb') as f:
    print('Writing RMPyL program to pickle file.')
    pickle.dump(prog, f)
Beispiel #20
0
# Loads the domain, problem and planning task from the two input files.
domain,problem,task = model_parser(dom_file,prob_file,remove_static=True)

# Times the SAT planner call (18 time steps) and reports the elapsed time.
start = time.time()
sat_plans = py_sat.plan(task.initial_state,task.goals,time_steps=18)
elapsed = time.time()-start
print('\n##### All solving took %.4f s'%(elapsed))

if len(sat_plans)>0:
    # Only the first returned plan is used.
    plan = sat_plans[0]
    print('\n##### Plan found!\n')
    for t,action in enumerate(plan):
        print('%d: %s'%(t,action))

    # Turns the plan into a sequence of episodes, one per operator, with
    # named start/end events and a duration given by rss_duration_func.
    prog = RMPyL(name='run()')
    prog.plan = prog.sequence(*[Episode(start=Event(name='start-of-'+op),
                                        end=Event(name='end-of-'+op),
                                        action=op,
                                        duration=rss_duration_func(op)) for op in plan])
    prog.add_overall_temporal_constraint(ctype='controllable',lb=0.0,ub=2000.0)
    prog.to_ptpn(filename='rss_pysat_before_stnu_reform.tpn')

    # NOTE(review): presumably a None risk bound signals that PARIS could not
    # reformulate the program; the handling branch is outside this view.
    paris = PARIS()
    risk_bound,sc_sched = paris.stnu_reformulation(prog,makespan=True,cc=0.001)
    if risk_bound is not None:
        # Caps the reported risk at 1.0 (i.e., 100 %).
        risk_bound = min(risk_bound,1.0)
        print('\nSuccessfully performed STNU reformulation with scheduling risk %f %%!'%(risk_bound*100.0))
        prog.to_ptpn(filename='rss_pysat_after_stnu_reform.tpn')

        # Prints the schedule entries ordered by their scheduled time.
        print('\nThis is the schedule:')
        for e,t in sorted(sc_sched.items(),key=lambda item: item[1]):
            print('\t%s: %.2f s'%(e,t))
    else:
Beispiel #21
0
    # print("---------plan: %d" % len(sat_plans))
    if len(sat_plans)>0:
        plan = sat_plans[0] # get the first plan (default returns a list with one plan)
        for t,op in enumerate(plan):
            print('%d: %s'%(t,op))

        elapsed = time.time()-start
        print('\n##### All solving took %.4f s'%(elapsed))

        prog = RMPyL(name='run()')
        pddl_episodes = [Episode(id=make_episode_id(t,op),
                                 start=Event(name='start-of-%d-%s'%(t,op)),
                                 end=Event(name='end-of-%d-%s'%(t,op)),
                                 action=op,
                                 duration=rss_duration_model_func(op)) for t,op in enumerate(plan)]
        prog.plan = prog.sequence(*pddl_episodes)
        # prog.add_overall_temporal_constraint(ctype='controllable',lb=0.0,ub=2000.0)
        #Adds temporal window to the plan
        for t,op in enumerate(plan):
            bounds, tc_type = rss_time_window_model_func(op)
            for tc in time_window_constraints(tc_type,bounds,prog.first_event,prog.episode_by_id(make_episode_id(t,op))):
                prog.add_temporal_constraint(tc)

        #Dummy episodes that enable transmissions
        activation_episodes=[]
        activation_tcs=[]
        global_start=Event(name='global-start')

        for op_name,op_param_dict in time_windows['time_windows'].items():
            for arg_set,window_dict in op_param_dict.items():
                for ev_type,time_bound in window_dict.items():
Beispiel #22
0
                  verbose=1)

# Runs the planner search starting from b0 to obtain the optimal policy.
policy, explicit, performance = planner.search(b0)

# Renders the policy as a graph and stores it as an SVG file.
dot_policy = policy_to_dot(explicit, policy)
dot_policy.write('flightgear_policy.svg', format='svg')

# Turns the optimal exploration policy into an RMPyL program.
exploration_policy = policy_to_rmpyl(explicit, policy)

# The flight policy wraps the exploration policy between a takeoff and a
# landing episode.
flight_policy = RMPyL(name='run()')
flight_steps = [
    Episode(action='(takeoff plane)'),
    exploration_policy,
    Episode(action='(land plane)'),
]
flight_policy *= flight_policy.sequence(*flight_steps)

# Pike (in fact, the Lisp tpn package) cannot properly handle probabilistic
# choices, so each one is relabeled as uncontrollable and loses its
# probability entry.
for obs in flight_policy.observations:
    if obs.type != 'probabilistic':
        continue
    obs.type = 'uncontrollable'
    del obs.properties['probability']

# Exports the program as a TPN file.
flight_policy.to_ptpn(filename='flightgear_rmpyl.tpn')

# Stores the control program in a pickle file (pickle protocol 2).
with open('flightgear_rmpyl.pickle', 'wb') as f:
    pickle.dump(flight_policy, f, protocol=2)
                  halt_on_violation=False,verbose=1)

# Searches for the optimal policy, starting the planner from b0.
policy, explicit, performance = planner.search(b0)

# Saves a graphical (SVG) rendering of the policy.
dot_policy = policy_to_dot(explicit, policy)
dot_policy.write('flightgear_policy.svg', format='svg')

# Converts the optimal exploration policy into an RMPyL program.
exploration_policy = policy_to_rmpyl(explicit, policy)

# On top of the exploration policy, the flight policy takes off first and
# lands at the end.
flight_policy = RMPyL(name='run()')
takeoff = Episode(action='(takeoff plane)')
landing = Episode(action='(land plane)')
flight_policy *= flight_policy.sequence(takeoff, exploration_policy, landing)

# Probabilistic choices are removed from the policy because Pike (in fact,
# the Lisp tpn package) cannot properly handle them.
for obs in flight_policy.observations:
    if obs.type != 'probabilistic':
        continue
    obs.type = 'uncontrollable'
    del obs.properties['probability']

# Writes the program out as a TPN.
flight_policy.to_ptpn(filename='flightgear_rmpyl.tpn')

# Writes the control program to a pickle file using protocol 2.
with open('flightgear_rmpyl.pickle', 'wb') as f:
    pickle.dump(flight_policy, f, protocol=2)
Beispiel #24
0
def rmpyl_icaps14():
    """
    Example from (Santana & Williams, ICAPS14).

    Builds a program with one controllable decision, 'transport-choice',
    over the options Bike, Car and Stay (utilities 100, 70 and 0):

    * the first branch observes the probabilistic variable 'slip'
      (probabilities 0.051 / 1 - 0.051) and either rides the bike and
      then changes, or just rides the bike;
    * the second branch observes the probabilistic variable 'accident'
      (probabilities 0.013 / 1 - 0.013) and either tows the vehicle and
      then takes a cab, or just drives;
    * the third branch is a single '(stay)' episode.

    Branches are passed in the same order as the domain values; they are
    presumably matched to those values positionally. The whole program is
    bounded by a controllable temporal constraint of [0, 30].

    Returns the resulting RMPyL program.
    """
    def bounded(lb, ub):
        # Builds a fresh controllable-duration dict on every call, so no two
        # episodes share the same dict object.
        return {'ctype': 'controllable', 'lb': lb, 'ub': ub}

    prog = RMPyL()

    transport_choice = {
        'name': 'transport-choice',
        'domain': ['Bike', 'Car', 'Stay'],
        'utility': [100, 70, 0],
    }
    slip = {
        'name': 'slip',
        'domain': [True, False],
        'ctype': 'probabilistic',
        'probability': [0.051, 1.0 - 0.051],
    }
    accident = {
        'name': 'accident',
        'domain': [True, False],
        'ctype': 'probabilistic',
        'probability': [0.013, 1.0 - 0.013],
    }

    # Bike branch: episodes are created in the same order as in the nested
    # single-expression form of this example.
    ride_then_change = prog.sequence(
        Episode(action='(ride-bike)', duration=bounded(15, 25)),
        Episode(action='(change)', duration=bounded(20, 30)))
    ride_only = Episode(action='(ride-bike)', duration=bounded(15, 25))
    bike_branch = prog.observe(slip, ride_then_change, ride_only)

    # Car branch.
    tow_then_cab = prog.sequence(
        Episode(action='(tow-vehicle)', duration=bounded(30, 90)),
        Episode(action='(cab-ride)', duration=bounded(10, 20)))
    drive_only = Episode(action='(drive)', duration=bounded(10, 20))
    car_branch = prog.observe(accident, tow_then_cab, drive_only)

    # Stay branch.
    stay_branch = Episode(action='(stay)')

    prog *= prog.decide(transport_choice, bike_branch, car_branch, stay_branch)

    prog.add_overall_temporal_constraint(ctype='controllable', lb=0.0, ub=30.0)
    return prog