# tempestpy/examples/shields/07_pre_shield_simulator.py


								import stormpy

								import stormpy.core

								import stormpy.simulator


								import stormpy.shields


								import stormpy.examples

								import stormpy.examples.files


								import random


								"""

								Simulate a model using a pre-shield.

								"""


								def example_pre_shield_simulator():
								    """Simulate the cliff-walking model while a pre-safety shield restricts actions.

								    Builds the PRISM program referenced by
								    ``stormpy.examples.files.prism_mdp_cliff_walking``, model checks
								    ``Pmax=? [G !"AgentIsInLavaAndNotDone"]`` with a ``PRE_SAFETY`` shield
								    (``RELATIVE`` comparison, value 0.9) and then runs a simulator seeded
								    with 42.  In every step, one of the choices the shield lists with a
								    positive first entry is picked at random; the current state, the labels
								    of all allowed choices and the label of the selected one are printed.

								    The loop ends when the simulator reports that it is done, or as soon as
								    the shield offers no choice for the current state.
								    """
								    path = stormpy.examples.files.prism_mdp_cliff_walking
								    formula_str = "Pmax=? [G !\"AgentIsInLavaAndNotDone\"]"

								    program = stormpy.parse_prism_program(path)
								    formulas = stormpy.parse_properties_for_prism_program(formula_str, program)

								    # State valuations and choice labels are required for the printed
								    # output in the simulation loop below.
								    options = stormpy.BuilderOptions([p.raw_formula for p in formulas])
								    options.set_build_state_valuations(True)
								    options.set_build_choice_labels(True)
								    options.set_build_all_labels()
								    model = stormpy.build_sparse_model_with_options(program, options)

								    initial_state = model.initial_states[0]
								    assert initial_state == 0

								    shield_specification = stormpy.logic.ShieldExpression(
								        stormpy.logic.ShieldingType.PRE_SAFETY,
								        stormpy.logic.ShieldComparison.RELATIVE,
								        0.9,
								    )
								    result = stormpy.model_checking(
								        model,
								        formulas[0],
								        extract_scheduler=True,
								        shield_expression=shield_specification,
								    )

								    assert result.has_scheduler
								    assert result.has_shield

								    shield = result.shield
								    pre_scheduler = shield.construct()

								    simulator = stormpy.simulator.create_simulator(model, seed=42)

								    while not simulator.is_done():
								        current_state = simulator.get_current_state()
								        state_string = model.state_valuations.get_string(current_state)
								        print(f"Simulator is in state {state_string}.")

								        # Each entry of choice_map is indexed as (value, action) below;
								        # presumably the value is the probability the shield assigns to
								        # the action -- TODO confirm.  Only positive entries are allowed.
								        choices = [
								            entry
								            for entry in pre_scheduler.get_choice(current_state).choice_map
								            if entry[0] > 0
								        ]

								        # Nothing is allowed in this state: stop before doing any label
								        # lookups or drawing a random index from an empty range.
								        if not choices:
								            break

								        choice_labels = [
								            model.choice_labeling.get_labels_of_choice(
								                model.get_choice_index(current_state, entry[1])
								            )
								            for entry in choices
								        ]

								        # NOTE(review): the simulator is seeded, but this draw uses the
								        # unseeded global RNG, so runs are not reproducible.
								        index = random.randrange(len(choices))
								        selected_action = choices[index]
								        # choice_labels is aligned with choices, so reuse the label that
								        # was already looked up instead of querying the model again.
								        choice_label = choice_labels[index]
								        print(f"Allowed Choices are {choice_labels}. Selected Action: {choice_label}")

								        # The value returned by step() is not used by this example, so it
								        # is deliberately not bound to any local names.
								        simulator.step(selected_action[1])


								# Run the example only when this file is executed directly as a script.
								if __name__ == "__main__":
								    example_pre_shield_simulator()