updates ....

more changes for rom_evaluate
updated formula computation YRanges
3 changed files with 1191 additions and 128 deletions
--- a/new_method.py
+++ b/new_method.py
@ -0,0 +1,605 @@
+import sys
+import operator
+from copy import deepcopy
+from os import listdir, system
+import subprocess
+import re
+from collections import defaultdict
+
+from random import randrange
+from ale_py import ALEInterface, SDL_SUPPORT, Action
+from PIL import Image
+from matplotlib import pyplot as plt
+import cv2
+import pickle
+import queue
+from dataclasses import dataclass, field
+
+from sklearn.cluster import KMeans, DBSCAN
+
+from enum import Enum
+
+from copy import deepcopy
+
+import numpy as np
+
+import logging
+logger = logging.getLogger(__name__)
+
+#import readchar
+
+from sample_factory.algo.utils.tensor_dict import TensorDict
+from query_sample_factory_checkpoint import SampleFactoryNNQueryWrapper
+
+import time
+
+tempest_binary = "/home/spranger/projects/tempest-devel/ranking_release/bin/storm"
+rom_file = "/home/spranger/research/Skiing/env/lib/python3.10/site-packages/AutoROM/roms/skiing.bin"
+
+def tic():
+    """Start (or restart) the module-wide stopwatch that toc() reads."""
+    global startTime_for_tictoc
+    from time import time as _now
+    startTime_for_tictoc = _now()
+
+def toc():
+    """Return the seconds elapsed since the last tic(), or None if tic() never ran."""
+    from time import time as _now
+    if 'startTime_for_tictoc' not in globals():
+        return None
+    return _now() - startTime_for_tictoc
+
+class Verdict(Enum):
+    """Outcome of a single test run, also used as the result of a whole cluster."""
+    # Returned by run_single_test when the emulator state could not be set up.
+    INCONCLUSIVE = 1
+    # Returned by run_single_test when the run reached the end of its duration.
+    GOOD = 2
+    # Returned by run_single_test when the recorded RAM[14] values dropped to zero.
+    BAD = 3
+
+# Comma-separated colour triple per verdict (presumably "R,G,B" - TODO confirm).
+# NOTE(review): not referenced by any code visible in this file.
+verdict_to_color_map = {Verdict.BAD: "200,0,0", Verdict.INCONCLUSIVE: "40,40,200", Verdict.GOOD: "00,200,100"}
+
+def convert(tuples):
+    """Build a dict from an iterable of (key, value) pairs, e.g. re.findall output."""
+    mapping = dict(tuples)
+    return mapping
+
+@dataclass(frozen=True)
+class State:
+    """Immutable (hashable) model state; used as the key of the state ranking dict."""
+    # Parsed from "x=" / "y=" in the ranking file.
+    x: int
+    y: int
+    # Parsed from "ski_position="; the rest of the file iterates it over 1..num_ski_positions.
+    ski_position: int
+    # fillStateRanking stores the model's "velocity=" value integer-divided by 2.
+    velocity: int
+def default_value():
+    """Return a fresh placeholder choices dict (default factory of StateValue.choices)."""
+    return dict(action=None, choiceValue=None)
+
+@dataclass(frozen=True)
+class StateValue:
+    """Ranking information attached to one State."""
+    # The "Value:" number parsed from the ranking file line of the state.
+    ranking: float
+    # Per-action values; fillStateRanking fills it with {"left"/"right"/"noop": float}.
+    # Defaults to the placeholder dict produced by default_value().
+    choices: dict = field(default_factory=default_value)
+
+@dataclass(frozen=False)
+class TestResult:
+    """Mutable record of one evaluation round: model-checking values plus test counters."""
+    # Filled by computeStateRanking from the Pmin queries (min, max, avg filter).
+    init_check_pes_min: float
+    init_check_pes_max: float
+    init_check_pes_avg: float
+    # Filled by computeStateRanking from the Pmax queries (min, max, avg filter).
+    init_check_opt_min: float
+    init_check_opt_max: float
+    init_check_opt_avg: float
+    # Counters updated by run_experiment while clusters are being tested.
+    safe_states: int
+    unsafe_states: int
+    safe_cluster: int
+    unsafe_cluster: int
+    good_verdicts: int
+    bad_verdicts: int
+    policy_queries: int
+
+    def __str__(self):
+        """Human-readable dump of the six model-checking values only."""
+        return f"""Test Result:
+    init_check_pes_min: {self.init_check_pes_min}
+    init_check_pes_max: {self.init_check_pes_max}
+    init_check_pes_avg: {self.init_check_pes_avg}
+    init_check_opt_min: {self.init_check_opt_min}
+    init_check_opt_max: {self.init_check_opt_max}
+    init_check_opt_avg: {self.init_check_opt_avg}
+"""
+
+    @staticmethod
+    def csv_header(ws=" "):
+        """Return the column names, in csv() order, separated by `ws`."""
+        columns = (
+            "pesmin", "pesmax", "pesavg",
+            "optmin", "optmax", "optavg",
+            "sState", "uState",
+            "sClust", "uClust",
+            "gVerd", "bVerd", "queries",
+        )
+        return ws.join(columns)
+
+    def csv(self):
+        """Return one data row: six 4-decimal floats (space separated) then seven tab-separated counters."""
+        model_checking_values = (
+            self.init_check_pes_min, self.init_check_pes_max, self.init_check_pes_avg,
+            self.init_check_opt_min, self.init_check_opt_max, self.init_check_opt_avg,
+        )
+        counters = (
+            self.safe_states, self.unsafe_states,
+            self.safe_cluster, self.unsafe_cluster,
+            self.good_verdicts, self.bad_verdicts, self.policy_queries,
+        )
+        # Every float is followed by a single space, including the last one.
+        float_part = "".join(f"{value:0.04f} " for value in model_checking_values)
+        counter_part = "\t".join(f"{value}" for value in counters)
+        return float_part + counter_part
+
+
+def exec(command,verbose=True):
+    """Run `command` through the shell and return os.system's exit status.
+
+    Every command is also appended verbatim to the file `list_of_exec` in the
+    current working directory. The log line is written from Python rather than
+    via `echo ... >> list_of_exec`, because the shell would otherwise interpret
+    quotes, `&` and redirections contained in the command while logging it.
+
+    NOTE: the name shadows the builtin `exec`; it is kept because the rest of
+    the file calls it under this name.
+    """
+    if verbose:
+        print(f"Executing {command}")
+    with open("list_of_exec", "a") as command_log:
+        command_log.write(f"{command}\n")
+    return system(command)
+
+# NOTE(review): not read by any code visible in this file; run_experiment sizes
+# its samples with the factor_tests_per_cluster argument instead.
+num_tests_per_cluster = 50
+#factor_tests_per_cluster = 0.2
+# Ski positions are enumerated as 1..num_ski_positions throughout the file.
+num_ski_positions = 8
+# Velocities are enumerated as 0..num_velocities-1 throughout the file.
+num_velocities = 5
+
+def input_to_action(char):
+    """Translate a one-character input into an emulator action or a command name.
+
+    "0"/"1"/"2" map to Action.NOOP / Action.RIGHT / Action.LEFT, "3"/"4"/"5" to
+    the strings "reset" / "set_x" / "set_vel", and "w", "a", "s", "d" are
+    returned unchanged. Any other input yields None.
+    """
+    command_names = {"3": "reset", "4": "set_x", "5": "set_vel"}
+    if char in command_names:
+        return command_names[char]
+    if char in ("w", "a", "s", "d"):
+        return char
+    if char == "0":
+        return Action.NOOP
+    if char == "1":
+        return Action.RIGHT
+    if char == "2":
+        return Action.LEFT
+    return None
+
+def saveObservations(observations, verdict, testDir):
+    """Write the frames of one test run as numbered PNG files.
+
+    The target directory is
+    images/testing_<experiment_id>/<verdict name>_<testDir>_<number of frames>;
+    runs with fewer than 20 frames additionally get the suffix `_pot_spurious`
+    and a warning is logged.
+
+    observations: sequence of image arrays accepted by PIL's Image.fromarray.
+    verdict:      Verdict member; its name becomes part of the directory name.
+    testDir:      short identifier of the test case (used in the directory name).
+    """
+    testDir = f"images/testing_{experiment_id}/{verdict.name}_{testDir}_{len(observations)}"
+    if len(observations) < 20:
+        # logger.warn is a deprecated alias; logger.warning is the supported spelling.
+        logger.warning(f"Potentially spurious test case for {testDir}")
+        testDir = f"{testDir}_pot_spurious"
+    # -p: do not fail when the directory already exists (same flag as the
+    # creation of the experiment directory at module level).
+    exec(f"mkdir -p {testDir}", verbose=False)
+    for i, obs in enumerate(observations):
+        img = Image.fromarray(obs)
+        img.save(f"{testDir}/{i:003}.png")
+
+# ski position -> (action, repetitions): run_single_test performs `action`
+# `repetitions` times while setting up a test, presumably to rotate the skier
+# into that position - TODO confirm against the game.
+ski_position_counter = {1: (Action.LEFT, 40), 2: (Action.LEFT, 35), 3: (Action.LEFT, 30), 4: (Action.LEFT, 10), 5: (Action.NOOP, 1), 6: (Action.RIGHT, 10), 7: (Action.RIGHT, 30), 8: (Action.RIGHT, 40) }
+
+def run_single_test(ale, nn_wrapper, x,y,ski_position, velocity, duration=50):
+    """Run the policy from one prepared emulator state and judge the outcome.
+
+    Setup: the RAM snapshot ramDICT[y] is written into the emulator, then the
+    action from ski_position_counter[ski_position] is repeated while RAM cell 14
+    is forced to 0 and RAM cell 25 to `x`; finally RAM cell 14 is set to 180.
+    `velocity` is only used for naming/logging, it is not written to the emulator.
+
+    Run: for `duration - 4` frames the policy is queried on every 4th frame with
+    the last four 84x84 grayscale frames and its action is repeated on the frames
+    in between. RAM cell 14 is recorded after every frame (presumably the speed,
+    going by the name `speed_list` - TODO confirm).
+
+    Returns (verdict, number of policy queries):
+      * (Verdict.INCONCLUSIVE, 0) if the setup raised an exception,
+      * (Verdict.BAD, n) as soon as more than 15 values were recorded and the
+        five values before the most recent one sum to 0,
+      * (Verdict.GOOD, n) otherwise.
+    """
+    #print(f"Running Test from x: {x:04}, y: {y:04}, ski_position: {ski_position}", end="")
+    # Only needed by the optional saveObservations calls below.
+    testDir = f"{x}_{y}_{ski_position}_{velocity}"
+    try:
+        for i, r in enumerate(ramDICT[y]):
+            ale.setRAM(i,r)
+        setup_action, repetitions = ski_position_counter[ski_position]
+        for _ in range(repetitions):
+            ale.act(setup_action)
+            ale.setRAM(14,0)
+            ale.setRAM(25,x)
+        ale.setRAM(14,180) # TODO
+    except Exception as e:
+        print(e)
+        # logger.warn is a deprecated alias; logger.warning is the supported spelling.
+        logger.warning(f"Could not run test for x: {x}, y: {y}, ski_position: {ski_position}, velocity: {velocity}")
+        return (Verdict.INCONCLUSIVE, 0)
+
+    num_queries = 0
+    all_obs = list()
+    speed_list = list()
+    # Seed the frame stack with four copies of the initial frame.
+    resized_obs = cv2.resize(ale.getScreenGrayscale(), (84,84), interpolation=cv2.INTER_AREA)
+    for _ in range(0,4):
+        all_obs.append(resized_obs)
+    for i in range(0,duration-4):
+        resized_obs = cv2.resize(ale.getScreenGrayscale(), (84,84), interpolation=cv2.INTER_AREA)
+        all_obs.append(resized_obs)
+        if i % 4 == 0:
+            # Query on every 4th frame; i == 0 always queries, so `action` is
+            # defined before its first use.
+            stack_tensor = TensorDict({"obs": np.array(all_obs[-4:])})
+            action = nn_wrapper.query(stack_tensor)
+            num_queries += 1
+        ale.act(input_to_action(str(action)))
+        speed_list.append(ale.getRAM()[14])
+        if len(speed_list) > 15 and sum(speed_list[-6:-1]) == 0:
+            #saveObservations(all_obs, Verdict.BAD, testDir)
+            return (Verdict.BAD, num_queries)
+    #saveObservations(all_obs, Verdict.GOOD, testDir)
+    return (Verdict.GOOD, num_queries)
+
+def skiPositionFormulaList(name):
+    """Return the balanced disjunction of the labels "<name>_1" .. "<name>_<num_ski_positions>"."""
+    quoted_labels = [f"\"{name}_{position}\"" for position in range(1, num_ski_positions+1)]
+    return createBalancedDisjunction(quoted_labels)
+
+
+def computeStateRanking(mdp_file, iteration):
+    """Model-check `mdp_file` with the tempest/storm binary and collect the results.
+
+    Six filter properties are checked (Pmin then Pmax, each aggregated with min,
+    max and avg) plus a final `Rmax=? [C <= 200]` property. The first six
+    "Result" lines of the tool output are parsed, the number after "States:" is
+    read, and the produced file `action_ranking` is renamed to
+    `action_ranking_<iteration, 3 digits>`.
+
+    Returns (TestResult, num_states); the TestResult carries the six parsed
+    values and zeroed counters.
+
+    Raises RuntimeError if the model checker exits with an error or if the
+    output does not yield exactly six values. Previously these cases surfaced
+    as UnboundLocalError / TypeError at the return statement.
+    """
+    logger.info("Computing state ranking")
+    tic()
+    unsafe = skiPositionFormulaList('Unsafe')
+    safe = skiPositionFormulaList('Safe')
+    path_formula = f"[ G !(\"Hit_Tree\" | \"Hit_Gate\" | {unsafe}) ]"
+    state_filter = f"(!\"S_Hit_Tree\" & !\"S_Hit_Gate\") | ({safe} | {unsafe})"
+    prop = ""
+    # Order matters: the parsed values are passed positionally to TestResult
+    # (pes_min, pes_max, pes_avg, opt_min, opt_max, opt_avg).
+    for optimisation in ("Pmin", "Pmax"):
+        for aggregate in ("min", "max", "avg"):
+            prop += f"filter({aggregate}, {optimisation}=? {path_formula}, {state_filter} );"
+    prop += 'Rmax=? [C <= 200]'
+    results = list()
+    num_states = 0
+    try:
+        command = f"{tempest_binary} --prism {mdp_file} --buildchoicelab --buildstateval --build-all-labels --prop '{prop}'"
+        output = subprocess.check_output(command, shell=True).decode("utf-8").split('\n')
+        for line in output:
+            #print(line)
+            if "States:" in line:
+                num_states = int(line.split(" ")[-1])
+            if "Result" in line and not len(results) >= 6:
+                # A result is either a range "[low, high]" or a single value after the colon.
+                range_value = re.search(r"(.*:).*\[(-?\d+\.?\d*), (-?\d+\.?\d*)\].*", line)
+                if range_value:
+                    results.append(float(range_value.group(2)))
+                    results.append(float(range_value.group(3)))
+                else:
+                    value = re.search(r"(.*:)(.*)", line)
+                    results.append(float(value.group(2)))
+        exec(f"mv action_ranking action_ranking_{iteration:03}")
+    except subprocess.CalledProcessError as e:
+        # TODO: die gracefully if ranking is uniform
+        print(e.output)
+        raise RuntimeError(f"Model checking of {mdp_file} failed") from e
+    logger.info(f"Computing state ranking - DONE: took {toc()} seconds")
+    if len(results) != 6:
+        raise RuntimeError(f"Expected 6 model checking results for {mdp_file}, parsed {len(results)}")
+    return TestResult(*results,0,0,0,0,0,0,0), num_states
+
+def fillStateRanking(file_name, match=""):
+    """Parse a ranking file into a dict mapping State -> StateValue.
+
+    Only lines containing "move=0" are considered, and states whose "Value:" is
+    <= 0.1 are dropped. The stored velocity is the file's "velocity=" value
+    integer-divided by 2. `match` is accepted for compatibility but not used.
+
+    If the file cannot be opened, a message is printed and the process exits
+    with status -1. A line that cannot be parsed raises ValueError naming the
+    line; previously a bare `except:` swallowed the error and the function
+    returned None, which only failed later in the caller.
+    """
+    logger.info(f"Parsing state ranking, {file_name}")
+    tic()
+    try:
+        with open(file_name, "r") as f:
+            file_content = f.readlines()
+    except EnvironmentError:
+        print("Ranking file not available. Exiting.")
+        sys.exit(-1)
+
+    state_ranking = dict()
+    for line_number, line in enumerate(file_content, start=1):
+        if "move=0" not in line: continue
+        try:
+            ranking_value = float(re.search(r"Value:([+-]?(\d*\.\d+)|\d+)", line)[0].replace("Value:",""))
+            if ranking_value <= 0.1:
+                continue
+            stateMapping = convert(re.findall(r"([a-zA-Z_]*[a-zA-Z])=(\d+)?", line))
+            choices = convert(re.findall(r"[a-zA-Z_]*(left|right|noop)[a-zA-Z_]*:(-?\d+\.?\d*)", line))
+            choices = {key:float(value) for (key,value) in choices.items()}
+            state = State(int(stateMapping["x"]), int(stateMapping["y"]), int(stateMapping["ski_position"]), int(stateMapping["velocity"])//2)
+        except (TypeError, KeyError, ValueError) as e:
+            # TypeError: no "Value:" match; KeyError: missing variable; ValueError: bad number.
+            raise ValueError(f"Malformed ranking line {line_number} in {file_name}: {line!r}") from e
+        state_ranking[state] = StateValue(ranking_value, choices)
+    logger.info(f"Parsing state ranking - DONE: took {toc()} seconds")
+    return state_ranking
+
+def createDisjunction(formulas):
+    """Join the formula strings with " | " into one flat disjunction."""
+    separator = " | "
+    return separator.join(formulas)
+
+def statesFormulaTrimmed(states, name):
+    """Build the PRISM `formula <name>_<i> = ...;` lines describing `states`.
+
+    states: iterable of (x, y, ski_position, velocity) tuples.
+    name:   formula prefix, e.g. "Safe" or "Unsafe".
+
+    States are grouped by ski position, then velocity, then y; for each y the
+    x values are compressed into ranges of consecutive values. The velocity
+    itself is not part of the emitted formula (see the commented-out
+    alternative below). Ski positions without any state get
+    `formula <name>_<i> = false;`.
+
+    Returns the formulas joined by newlines, with a trailing newline.
+
+    Fix: the last x of a y-group is now checked for contiguity as well.
+    Previously it was always merged into the preceding range, so x values
+    [1, 2, 5] produced `1<=x&x<=5` and wrongly covered x=3 and x=4.
+    """
+    #states = [(s[0].x,s[0].y, s[0].ski_position) for s in cluster]
+    skiPositionGroup = defaultdict(list)
+    for item in states:
+        skiPositionGroup[item[2]].append(item)
+
+    formulas = list()
+    for skiPosition, skiPos_group in skiPositionGroup.items():
+        velocityGroup = defaultdict(list)
+        for item in skiPos_group:
+            velocityGroup[item[3]].append(item)
+
+        velocityFormulas = list()
+        for velocity_group in velocityGroup.values():
+            yPosGroup = defaultdict(list)
+            for item in velocity_group:
+                yPosGroup[item[1]].append(item)
+
+            yFormulas = list()
+            for y, y_group in yPosGroup.items():
+                xs = sorted(s[0] for s in y_group)
+                range_start = range_end = xs[0]
+                x_ranges = list()
+                for x in xs[1:]:
+                    if x - range_end <= 1:
+                        # Consecutive (or repeated) x: extend the current range.
+                        range_end = x
+                    else:
+                        # Gap: close the current range and start a new one.
+                        x_ranges.append(f" ({range_start}<=x&x<={range_end})")
+                        range_start = range_end = x
+                x_ranges.append(f" {range_start}<=x&x<={range_end}")
+                yFormulas.append(f" (y={y} & {createBalancedDisjunction(x_ranges)})")
+
+            #velocityFormulas.append(f"(velocity={velocity} & {createBalancedDisjunction(yFormulas)})")
+            velocityFormulas.append(f"({createBalancedDisjunction(yFormulas)})")
+        formula = f"formula {name}_{skiPosition} = ( ski_position={skiPosition} & "
+        formula += createBalancedDisjunction(velocityFormulas) + ");"
+        formulas.append(formula)
+    for i in range(1, num_ski_positions+1):
+        if i in skiPositionGroup:
+            continue
+        formulas.append(f"formula {name}_{i} = false;")
+    return "\n".join(formulas) + "\n"
+
+# https://stackoverflow.com/questions/5389507/iterating-over-every-two-elements-in-a-list
+def pairwise(iterable):
+    """s -> (s0, s1), (s2, s3), (s4, s5), ...
+
+    Non-overlapping pairs; a trailing unpaired element is dropped.
+    """
+    shared_iterator = iter(iterable)
+    # Both zip arguments are the same iterator, so each pair consumes two items.
+    return zip(shared_iterator, shared_iterator)
+
+def createBalancedDisjunction(formulas):
+    """Combine formula strings into one nested, pairwise-parenthesised disjunction.
+
+    Neighbouring formulas are merged as "(f | g)" level by level until a single
+    formula remains; an unpaired last formula is carried over to the next
+    level. An empty input yields "false". The input list is not modified.
+    """
+    if len(formulas) == 0:
+        return "false"
+    level = formulas
+    while len(level) > 1:
+        items = iter(level)
+        # zip over the same iterator twice pairs (0,1), (2,3), ... and drops an odd tail.
+        merged = [f"({left} | {right})" for left, right in zip(items, items)]
+        if len(level) % 2 == 1:
+            merged.append(level[-1])
+        level = merged
+    return " ".join(level)
+
+def updatePrismFile(newFile, iteration, safeStates, unsafeStates):
+    """Create `<newFile>_<iteration, 3 digits>.prism` from `<newFile>_no_formulas.prism`.
+
+    The template is copied with `cp`, then the Safe and Unsafe formulas
+    (see statesFormulaTrimmed) and one Safe_i / Unsafe_i label pair per ski
+    position are appended to the copy.
+    """
+    logger.info("Creating next prism file")
+    tic()
+    template_path = f"{newFile}_no_formulas.prism"
+    target_path = f"{newFile}_{iteration:03}.prism"
+    exec(f"cp {template_path} {target_path}", verbose=False)
+
+    label_lines = []
+    for position in range(1, num_ski_positions+1):
+        label_lines.append(f"label \"Safe_{position}\" = Safe_{position};\n")
+        label_lines.append(f"label \"Unsafe_{position}\" = Unsafe_{position};\n")
+
+    with open(target_path, "a") as prism:
+        prism.write(statesFormulaTrimmed(safeStates, "Safe"))
+        prism.write(statesFormulaTrimmed(unsafeStates, "Unsafe"))
+        prism.write("".join(label_lines))
+
+    logger.info(f"Creating next prism file - DONE: took {toc()} seconds")
+
+
+# Module-level setup: runs on import and creates the emulator, the policy
+# wrapper and the output directory shared by the functions in this file.
+ale = ALEInterface()
+
+
+#if SDL_SUPPORT:
+#    ale.setBool("sound", True)
+#    ale.setBool("display_screen", True)
+
+# Load the ROM file
+ale.loadROM(rom_file)
+
+# RAM snapshots indexed by y; run_single_test writes ramDICT[y] into the emulator.
+# NOTE(review): pickle.load executes arbitrary code from the file - only use a
+# trusted all_positions_v2.pickle.
+with open('all_positions_v2.pickle', 'rb') as handle:
+    ramDICT = pickle.load(handle)
+# NOTE(review): y_ram_setting and x are not read by any code visible in this file.
+y_ram_setting = 60
+x = 70
+
+
+nn_wrapper = SampleFactoryNNQueryWrapper()
+
+# The start time in whole seconds doubles as a unique id for the output directory.
+experiment_id = int(time.time())
+# Base name of the PRISM files (<init_mdp>_no_formulas.prism, <init_mdp>_000.prism, ...).
+init_mdp = "velocity_safety"
+exec(f"mkdir -p images/testing_{experiment_id}", verbose=False)
+
+
+imagesDir = f"images/testing_{experiment_id}"
+
+def drawOntoSkiPosImage(states, color, target_prefix="cluster_", alpha_factor=1.0, markerSize=1, drawCircle=False):
+    """Draw one marker per state onto the per-position image files in imagesDir.
+
+    For every (ski_position, velocity) pair the image
+    `<target_prefix>_<pos>_<vel>_individual.png` and for every ski position the
+    merged image `<target_prefix>_<pos>_individual.png` are read, drawn on and
+    written back in place.
+
+    states:        iterable of (State, StateValue) pairs.
+    color:         colour tuple handed to OpenCV (drawResult notes OpenCV wants BGR).
+    target_prefix: file name prefix of the images to modify.
+    alpha_factor:  multiplied with the state's ranking and stored in the marker,
+                   but not used by the drawing calls below.
+    markerSize:    half side length of the filled rectangle around (x, y).
+    drawCircle:    draw a filled circle of radius 1 at the rectangle's top-left
+                   corner (x - markerSize, y - markerSize) instead of the rectangle.
+
+    NOTE(review): cv2.imread returns None for a missing file, which would make
+    the drawing calls fail - the images must exist beforehand.
+    """
+    #markerList = {ski_position:list() for ski_position in range(1,num_ski_positions + 1)}
+    markerList = {(ski_position, velocity):list() for velocity in range(0, num_velocities) for ski_position in range(1,num_ski_positions + 1)}
+    images = dict()
+    mergedImages = dict()
+    # Load all images that may be drawn on.
+    for ski_position in range(1, num_ski_positions + 1):
+        for velocity in range(0,num_velocities):
+            images[(ski_position, velocity)] = cv2.imread(f"{imagesDir}/{target_prefix}_{ski_position:02}_{velocity:02}_individual.png")
+        mergedImages[ski_position] = cv2.imread(f"{imagesDir}/{target_prefix}_{ski_position:02}_individual.png")
+    # marker = [color, alpha, top-left corner, bottom-right corner]
+    for state in states:
+        s = state[0]
+        marker = [color, alpha_factor * state[1].ranking, (s.x-markerSize, s.y-markerSize), (s.x+markerSize, s.y+markerSize)]
+        markerList[(s.ski_position, s.velocity)].append(marker)
+    # Draw each marker on both the per-velocity image and the merged image.
+    for (pos, vel), marker in markerList.items():
+        if len(marker) == 0: continue
+        if drawCircle:
+            for m in marker:
+                images[(pos,vel)] = cv2.circle(images[(pos,vel)], m[2], 1, m[0], thickness=-1)
+                mergedImages[pos] = cv2.circle(mergedImages[pos], m[2], 1, m[0], thickness=-1)
+        else:
+            for m in marker:
+                images[(pos,vel)] = cv2.rectangle(images[(pos,vel)], m[2], m[3], m[0], cv2.FILLED)
+                mergedImages[pos] = cv2.rectangle(mergedImages[pos], m[2], m[3], m[0], cv2.FILLED)
+    # Write every image back, including those that were not modified.
+    for (ski_position, velocity), image in images.items():
+        cv2.imwrite(f"{imagesDir}/{target_prefix}_{ski_position:02}_{velocity:02}_individual.png", image)
+    for ski_position, image in mergedImages.items():
+        cv2.imwrite(f"{imagesDir}/{target_prefix}_{ski_position:02}_individual.png", image)
+
+
+def concatImages(prefix, iteration):
+    """Annotate the individual images and tile them into two overview images.
+
+    Each `<prefix>_<pos>_<vel>_individual.png` is overwritten with a copy that
+    carries the text `p<pos>v<vel>`; afterwards the per-velocity images are
+    tiled into `<prefix>_<iteration>.png` and the merged per-position images
+    into `<prefix>_<iteration>_merged.png`.
+
+    Relies on the external `convert` and `montage` commands (presumably
+    ImageMagick) being on the PATH; their exit status is not checked.
+    """
+    logger.info(f"Concatenating images")
+    # Ordered velocity-major, so each montage row holds one velocity.
+    images = [f"{imagesDir}/{prefix}_{pos:02}_{vel:02}_individual.png" for vel in range(0,num_velocities) for pos in range(1,num_ski_positions+1)]
+    mergedImages = [f"{imagesDir}/{prefix}_{pos:02}_individual.png" for pos in range(1,num_ski_positions+1)]
+    for vel in range(0, num_velocities):
+        for pos in range(1, num_ski_positions + 1):
+            # In-place annotation: input and output file are the same.
+            command =  f"convert {imagesDir}/{prefix}_{pos:02}_{vel:02}_individual.png "
+            command += f"-pointsize 10 -gravity NorthEast -annotate +8+0 'p{pos:02}v{vel:02}' "
+            command += f"{imagesDir}/{prefix}_{pos:02}_{vel:02}_individual.png"
+            exec(command, verbose=False)
+    exec(f"montage {' '.join(images)} -geometry +0+0 -tile 8x9 {imagesDir}/{prefix}_{iteration:03}.png", verbose=False)
+    exec(f"montage {' '.join(mergedImages)} -geometry +0+0 -tile 8x9 {imagesDir}/{prefix}_{iteration:03}_merged.png", verbose=False)
+    #exec(f"sxiv {imagesDir}/{prefix}_{iteration}.png&", verbose=False)
+    logger.info(f"Concatenating images - DONE")
+
+def drawStatesOntoTiledImage(states, color, target, source="images/1_full_scaled_down.png", alpha_factor=1.0):
+    """Placeholder: currently does nothing (the body consists of this docstring only).
+
+    Intended to be useful to draw a set of states, e.g. a single cluster.
+
+    TODO: the earlier implementation is kept below as a sketch. Note that it
+    refers to `markerSize`, which is neither a parameter of this function nor
+    a global visible in this file.
+
+    markerList = {1: list(), 2:list(), 3:list(), 4:list(), 5:list(), 6:list(), 7:list(), 8:list()}
+    logger.info(f"Drawing {len(states)} states onto {target}")
+    tic()
+    for state in states:
+        s = state[0]
+        marker = f"-fill 'rgba({color}, {alpha_factor * state[1].ranking})' -draw 'rectangle {s.x-markerSize},{s.y-markerSize} {s.x+markerSize},{s.y+markerSize} '"
+        markerList[s.ski_position].append(marker)
+    for pos, marker in markerList.items():
+        command = f"convert {source} {' '.join(marker)} {imagesDir}/{target}_{pos:02}_individual.png"
+        exec(command, verbose=False)
+    exec(f"montage {imagesDir}/{target}_*_individual.png -geometry +0+0 -tile x1 {imagesDir}/{target}.png", verbose=False)
+    logger.info(f"Drawing {len(states)} states onto {target} - Done: took {toc()} seconds")
+    """
+
+def drawClusters(clusterDict, target, iteration, alpha_factor=1.0):
+    """Draw every cluster in its own random colour, then build the tiled overview images."""
+    cluster_count = len(clusterDict)
+    logger.info(f"Drawing {cluster_count} clusters")
+    tic()
+    for clusterStates in clusterDict.values():
+        # Three independent draws from 0..255, converted to plain ints for OpenCV.
+        color = tuple(int(np.random.choice(range(256))) for _ in range(3))
+        drawOntoSkiPosImage(clusterStates, color, target, alpha_factor=alpha_factor)
+    concatImages(target, iteration)
+    logger.info(f"Drawing {cluster_count} clusters - DONE: took {toc()} seconds")
+
+def drawResult(clusterDict, target, iteration, drawnCluster=None):
+    """Colour the states of every not-yet-drawn cluster according to its verdict.
+
+    clusterDict:  maps cluster id -> (cluster states, Verdict).
+    target:       image file prefix handed to drawOntoSkiPosImage.
+    iteration:    accepted for symmetry with the other draw functions; unused here.
+    drawnCluster: ids of clusters to skip; defaults to no cluster. The set is
+                  only read, never modified, by this function.
+
+    Colours are BGR: green for GOOD, red for BAD, grey for anything else.
+    """
+    # None instead of a shared mutable default set().
+    if drawnCluster is None:
+        drawnCluster = set()
+    logger.info(f"Drawing {len(clusterDict)} results")
+    tic()
+    for cluster_id, (clusterStates, result) in clusterDict.items():
+        if cluster_id in drawnCluster: continue
+        # opencv wants BGR
+        color = (100,100,100)
+        if result == Verdict.GOOD:
+            color = (0,200,0)
+        elif result == Verdict.BAD:
+            color = (0,0,200)
+        drawOntoSkiPosImage(clusterStates, color, target, alpha_factor=0.7)
+    logger.info(f"Drawing {len(clusterDict)} results - DONE: took {toc()} seconds")
+
+def _init_logger():
+    """Configure the 'main' logger: INFO level, messages written to stdout.
+
+    Each call attaches one more handler to the logger.
+    """
+    stdout_handler = logging.StreamHandler(sys.stdout)
+    stdout_handler.setFormatter(logging.Formatter('[%(levelname)s] %(module)s - %(message)s'))
+    main_logger = logging.getLogger('main')
+    main_logger.setLevel(logging.INFO)
+    main_logger.addHandler(stdout_handler)
+
+def clusterImportantStates(ranking, iteration):
+    """Group the ranked states into clusters with KMeans.
+
+    ranking:   sequence of (State, StateValue) pairs.
+    iteration: only needed by the optional drawClusters call below.
+
+    Each state becomes the feature vector
+    [x, y, ski_position * 20, velocity * 20, ranking]; about one cluster per
+    15 states is requested, but always at least one.
+
+    Returns a dict mapping cluster id -> list of (State, StateValue) pairs.
+    States labelled -1 (only produced by the commented-out DBSCAN variant) are
+    put into singleton clusters with ids above the regular ones.
+
+    Raises ValueError for an empty ranking.
+    """
+    logger.info(f"Starting to cluster {len(ranking)} states into clusters")
+    tic()
+    if len(ranking) == 0:
+        raise ValueError("Cannot cluster an empty state ranking")
+    states = [[s[0].x,s[0].y, s[0].ski_position * 20, s[0].velocity * 20, s[1].ranking] for s in ranking]
+    #states = [[s[0].x,s[0].y, s[0].ski_position * 30, s[1].ranking] for s in ranking]
+    # len(states) // 15 is 0 for fewer than 15 states, which KMeans rejects.
+    requested_clusters = max(1, len(states) // 15)
+    kmeans = KMeans(requested_clusters, random_state=0, n_init="auto").fit(states)
+    #dbscan = DBSCAN(eps=5).fit(states)
+    #labels = dbscan.labels_
+    labels = kmeans.labels_
+    n_clusters = len(set(labels)) - (1 if -1 in labels else 0)
+    logger.info(f"Starting to cluster {len(ranking)} states into clusters - DONE: took {toc()} seconds with {n_clusters} cluster")
+    clusterDict = {i : list() for i in range(0,n_clusters)}
+    strayStates = list()
+    for label, state in zip(labels, ranking):
+        if label == -1:
+            clusterDict[n_clusters + len(strayStates) + 1] = [state]
+            strayStates.append(state)
+            continue
+        # setdefault: a label outside 0..n_clusters-1 must not raise KeyError.
+        clusterDict.setdefault(int(label), list()).append(state)
+    if len(strayStates) > 0: logger.warning(f"{len(strayStates)} stray states with label -1")
+    #drawClusters(clusterDict, f"clusters", iteration)
+    return clusterDict
+
+
+def run_experiment(factor_tests_per_cluster):
+    """Run one complete experiment and write its statistics to a data file.
+
+    Steps:
+      1. copy the background image to all per-position cluster/result images,
+      2. create and model-check the initial PRISM file and parse the ranking,
+      3. cluster all states with ranking > 0.1,
+      4. test `factor_tests_per_cluster * len(cluster)` randomly chosen states
+         (at least one) of every cluster with run_single_test; a cluster is
+         unsafe as soon as one test is BAD, otherwise safe,
+      5. roughly 20 times during the run (every `len(clusters) // 20` clusters,
+         at least every cluster) draw the results, record a snapshot of the
+         statistics and print the table collected so far.
+
+    The table is finally written to `data_new_method_<factor_tests_per_cluster>`.
+
+    Fixes over the previous version: no ZeroDivisionError with fewer than 20
+    clusters, and none in the progress log line while there are no unsafe
+    states or no failing test cases yet.
+    """
+    def ratio(numerator, denominator):
+        # Progress-log helper: nan instead of ZeroDivisionError.
+        return numerator / denominator if denominator else float("nan")
+
+    logger.info("Starting")
+    num_queries = 0
+
+    source = "images/1_full_scaled_down.png"
+    for ski_position in range(1, num_ski_positions + 1):
+        for velocity in range(0,num_velocities):
+            exec(f"cp {source} {imagesDir}/clusters_{ski_position:02}_{velocity:02}_individual.png", verbose=False)
+            exec(f"cp {source} {imagesDir}/result_{ski_position:02}_{velocity:02}_individual.png", verbose=False)
+        exec(f"cp {source} {imagesDir}/clusters_{ski_position:02}_individual.png", verbose=False)
+        exec(f"cp {source} {imagesDir}/result_{ski_position:02}_individual.png", verbose=False)
+
+    goodVerdicts = 0
+    badVerdicts = 0
+    goodVerdictTestCases = list()
+    badVerdictTestCases = list()
+    safeClusters = 0
+    unsafeClusters = 0
+    safeStates = set()
+    unsafeStates = set()
+    iteration = 0
+    results = list()
+
+    updatePrismFile(init_mdp, iteration, set(), set())
+    #modelCheckingResult, numStates = TestResult(0,0,0,0,0,0,0,0,0,0,0,0,0), 10
+    modelCheckingResult, numStates = computeStateRanking(f"{init_mdp}_000.prism", iteration)
+    results.append(modelCheckingResult)
+    ranking = fillStateRanking(f"action_ranking_000")
+
+    sorted_ranking = sorted( (x for x in ranking.items() if x[1].ranking > 0.1), key=lambda x: x[1].ranking)
+    try:
+        clusters = clusterImportantStates(sorted_ranking, iteration)
+    except Exception as e:
+        print(e)
+        sys.exit(-1)
+
+    clusterResult = dict()
+    logger.info(f"Running tests")
+    tic()
+    num_cluster_tested = 0
+    drawnCluster = set()
+    # len(clusters) // 20 is 0 for fewer than 20 clusters; report after every cluster then.
+    report_interval = max(1, len(clusters) // 20)
+    for cluster_id, cluster in clusters.items():
+        if len(cluster) == 0:
+            # Nothing to sample from; np.random.choice would raise.
+            continue
+        num_tests = max(1, int(factor_tests_per_cluster * len(cluster)))
+        logger.info(f"Testing {num_tests} states (from {len(cluster)} states) from cluster {cluster_id}")
+        randomStates = np.random.choice(len(cluster), num_tests, replace=False)
+        randomStates = [cluster[i] for i in randomStates]
+
+        verdictGood = True
+        for state in randomStates:
+            x = state[0].x
+            y = state[0].y
+            ski_pos = state[0].ski_position
+            velocity = state[0].velocity
+            result, num_queries_this_test_case = run_single_test(ale,nn_wrapper,x,y,ski_pos, velocity, duration=50)
+            num_queries += num_queries_this_test_case
+            if result == Verdict.BAD:
+                # One failing test marks the whole cluster as unsafe.
+                clusterResult[cluster_id] = (cluster, Verdict.BAD)
+                verdictGood = False
+                unsafeStates.update([(s[0].x,s[0].y, s[0].ski_position, s[0].velocity) for s in cluster])
+                badVerdicts += 1
+                badVerdictTestCases.append(state)
+
+            elif result == Verdict.GOOD:
+                goodVerdicts += 1
+                goodVerdictTestCases.append(state)
+        if verdictGood:
+            clusterResult[cluster_id] = (cluster, Verdict.GOOD)
+            safeClusters += 1
+            safeStates.update([(s[0].x,s[0].y, s[0].ski_position, s[0].velocity) for s in cluster])
+        else:
+            unsafeClusters += 1
+        # Keep the newest result record up to date with the running counters.
+        results[-1].safe_states = len(safeStates)
+        results[-1].unsafe_states = len(unsafeStates)
+        results[-1].policy_queries = num_queries
+        results[-1].safe_cluster = safeClusters
+        results[-1].unsafe_cluster = unsafeClusters
+        results[-1].good_verdicts = goodVerdicts
+        results[-1].bad_verdicts = badVerdicts
+        num_cluster_tested += 1
+        if num_cluster_tested % report_interval == 0:
+            iteration += 1
+            logger.info(f"Tested Cluster: {num_cluster_tested:03}\tSafe Cluster States : {len(safeStates)}({safeClusters}/{len(clusters)})\tUnsafe Cluster States:{len(unsafeStates)}({unsafeClusters}/{len(clusters)})\tGood Test Cases:{goodVerdicts}\tFailing Test Cases:{badVerdicts}\t{ratio(len(safeStates), len(unsafeStates))} - {ratio(goodVerdicts, badVerdicts)}")
+            drawResult(clusterResult, "result", iteration, drawnCluster)
+            drawOntoSkiPosImage(goodVerdictTestCases, (10,255,50), "result", alpha_factor=0.7, markerSize=0, drawCircle=True)
+            drawOntoSkiPosImage(badVerdictTestCases, (0,0,0), "result", alpha_factor=0.7, markerSize=0, drawCircle=True)
+            concatImages("result", iteration)
+            drawnCluster.update(clusterResult.keys())
+            # Re-running the model checker per iteration is disabled; the initial
+            # result is copied and adjusted instead.
+            #updatePrismFile(init_mdp, iteration, safeStates, unsafeStates)
+            #modelCheckingResult, numStates = computeStateRanking(f"{init_mdp}_{iteration:03}.prism", iteration)
+            results.append(deepcopy(modelCheckingResult))
+            logger.info(f"Model Checking Result: {modelCheckingResult}")
+            # Account for self-loop states after first iteration
+            if iteration > 0:
+                results[-1].init_check_pes_avg = 1/(numStates+len(safeStates)+len(unsafeStates)) * (results[-1].init_check_pes_avg*numStates + 1.0*results[-2].unsafe_states + 0.0*results[-2].safe_states)
+                results[-1].init_check_opt_avg = 1/(numStates+len(safeStates)+len(unsafeStates)) * (results[-1].init_check_opt_avg*numStates + 0.0*results[-2].unsafe_states + 1.0*results[-2].safe_states)
+            # The newest entry is still being filled, so it is left out of the table.
+            print(TestResult.csv_header())
+            for result in results[:-1]:
+                print(result.csv())
+
+
+    with open(f"data_new_method_{factor_tests_per_cluster}", "w") as f:
+        f.write(TestResult.csv_header() + "\n")
+        for result in results[:-1]:
+            f.write(result.csv() + "\n")
+
+
+# Configure the 'main' logger and rebind the module-level `logger` to it, so
+# the functions above log through the stdout handler set up by _init_logger().
+_init_logger()
+logger = logging.getLogger('main')
+if __name__ == '__main__':
+    # One full experiment per sampling factor (fraction of each cluster that is tested).
+    for factor_tests_per_cluster in [0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1.0]:
+        run_experiment(factor_tests_per_cluster)
--- a/rom_evaluate.py
+++ b/rom_evaluate.py
@ -1,9 +1,12 @@
 import sys
 import operator
 from os import listdir, system
+import subprocess
+import re
+from collections import defaultdict
+
 from random import randrange
 from ale_py import ALEInterface, SDL_SUPPORT, Action
-from colors import *
 from PIL import Image
 from matplotlib import pyplot as plt
 import cv2
@ -11,13 +14,18 @@ import pickle
 import queue
 from dataclasses import dataclass, field

+from sklearn.cluster import KMeans, DBSCAN
+
 from enum import Enum

 from copy import deepcopy

 import numpy as np

-import readchar
+import logging
+logger = logging.getLogger(__name__)
+
+#import readchar

 from sample_factory.algo.utils.tensor_dict import TensorDict
 from query_sample_factory_checkpoint import SampleFactoryNNQueryWrapper
@ -25,9 +33,17 @@ from query_sample_factory_checkpoint import SampleFactoryNNQueryWrapper
 import time

 tempest_binary = "/home/spranger/projects/tempest-devel/ranking_release/bin/storm"
-rom_file = "/home/spranger/research/Skiing/env/lib/python3.8/site-packages/AutoROM/roms/skiing.bin"
+rom_file = "/home/spranger/research/Skiing/env/lib/python3.10/site-packages/AutoROM/roms/skiing.bin"

+def tic():
+    import time
+    global startTime_for_tictoc
+    startTime_for_tictoc = time.time()

+def toc():
+    import time
+    if 'startTime_for_tictoc' in globals():
+        return time.time() - startTime_for_tictoc

 class Verdict(Enum):
    INCONCLUSIVE = 1
@ -44,35 +60,47 @@ class State:
    x: int
    y: int
    ski_position: int
+    velocity: int
 def default_value():
    return {'action' : None, 'choiceValue' : None}
+
@dataclass(frozen=True)
 class StateValue:
    ranking: float
    choices: dict = field(default_factory=default_value)

+@dataclass(frozen=False)
+class TestResult:
+    init_check_pes_min: float
+    init_check_pes_max: float
+    init_check_pes_avg: float
+    init_check_opt_min: float
+    init_check_opt_max: float
+    init_check_opt_avg: float
+    safe_states: int
+    unsafe_states: int
+    policy_queries: int
+    def __str__(self):
+        return f"""Test Result:
+    init_check_pes_min: {self.init_check_pes_min}
+    init_check_pes_max: {self.init_check_pes_max}
+    init_check_pes_avg: {self.init_check_pes_avg}
+    init_check_opt_min: {self.init_check_opt_min}
+    init_check_opt_max: {self.init_check_opt_max}
+    init_check_opt_avg: {self.init_check_opt_avg}
+"""
+    def csv(self, ws=" "):
+        return f"{self.init_check_pes_min:0.04f}{ws}{self.init_check_pes_max:0.04f}{ws}{self.init_check_pes_avg:0.04f}{ws}{self.init_check_opt_min:0.04f}{ws}{self.init_check_opt_max:0.04f}{ws}{self.init_check_opt_avg:0.04f}{ws}{self.safe_states}{ws}{self.unsafe_states}{ws}{self.policy_queries}"
+
 def exec(command,verbose=True):
    if verbose: print(f"Executing {command}")
    system(f"echo {command} >> list_of_exec")
    return system(command)

-def model_to_actual(ski_position):
-    if ski_position == 1:
-        return 1
-    elif ski_position in [2,3]:
-        return 2
-    elif ski_position in [4,5]:
-        return 3
-    elif ski_position in [6,7]:
-        return 4
-    elif ski_position in [8,9]:
-        return 5
-    elif ski_position in [10,11]:
-        return 6
-    elif ski_position in [12,13]:
-        return 7
-    elif ski_position == 14:
-        return 8
+num_tests_per_cluster = 50
+factor_tests_per_cluster = 0.2
+num_ski_positions = 8
+num_velocities = 5

 def input_to_action(char):
    if char == "0":
@ -90,115 +118,210 @@ def input_to_action(char):
    if char in ["w", "a", "s", "d"]:
        return char

-def drawImportantStates(important_states):
-    draw_commands = {1: list(), 2:list(), 3:list(), 4:list(), 5:list(), 6:list(), 7:list(), 8:list(), 9:list(), 10:list(), 11:list(), 12:list(), 13:list(), 14:list()}
-    for state in important_states:
-        x = state[0].x
-        y = state[0].y
-        markerSize = 2
-        ski_position = state[0].ski_position
-        draw_commands[ski_position].append(f"-fill 'rgba(255,204,0,{state[1].ranking})' -draw 'rectangle {x-markerSize},{y-markerSize} {x+markerSize},{y+markerSize} '")
-    for i in range(1,15):
-        command = f"convert images/1_full_scaled_down.png {' '.join(draw_commands[i])} first_try_{i:02}.png"
-        exec(command)
+def saveObservations(observations, verdict, testDir):
+    """Store every observation frame of one test run as a numbered PNG.
+
+    The frames go to
+    `images/testing_{experiment_id}/{verdict.name}_{testDir}_{len(observations)}`;
+    runs with fewer than 20 frames get a `_pot_spurious` suffix and a warning.
+
+    observations: sequence of arrays accepted by `Image.fromarray`.
+    verdict: object with a `name` attribute (e.g. a `Verdict` member).
+    testDir: label of the test case, used inside the directory name.
+    """
+    testDir = f"images/testing_{experiment_id}/{verdict.name}_{testDir}_{len(observations)}"
+    if len(observations) < 20:
+        # Logger.warn is a deprecated alias that newer Python versions dropped.
+        logger.warning(f"Potentially spurious test case for {testDir}")
+        testDir = f"{testDir}_pot_spurious"
+    # -p: do not fail if the directory is already present from an earlier save.
+    exec(f"mkdir -p {testDir}", verbose=False)
+    for i, obs in enumerate(observations):
+        img = Image.fromarray(obs)
+        img.save(f"{testDir}/{i:003}.png")

 ski_position_counter = {1: (Action.LEFT, 40), 2: (Action.LEFT, 35), 3: (Action.LEFT, 30), 4: (Action.LEFT, 10), 5: (Action.NOOP, 1), 6: (Action.RIGHT, 10), 7: (Action.RIGHT, 30), 8: (Action.RIGHT, 40) }
-def run_single_test(ale, nn_wrapper, x,y,ski_position, duration=200):
-    #print(f"Running Test from x: {x:04}, y: {y:04}, ski_position: {ski_position}", end="")
-    for i, r in enumerate(ramDICT[y]):
-        ale.setRAM(i,r)
-    ski_position_setting = ski_position_counter[ski_position]
-    for i in range(0,ski_position_setting[1]):
-        ale.act(ski_position_setting[0])
-        ale.setRAM(14,0)
-        ale.setRAM(25,x)
-    ale.setRAM(14,180)

+def run_single_test(ale, nn_wrapper, x,y,ski_position, velocity, duration=50):
+    """Run the policy from one start configuration and classify the outcome.
+
+    Setup: the RAM snapshot `ramDICT[y]` is written cell by cell, then the
+    action from `ski_position_counter[ski_position]` is repeated while RAM
+    cell 14 is forced to 0 and cell 25 to `x`; finally cell 14 is set to 180.
+    `velocity` is only used for the test label and the log message (see TODO).
+
+    Run: for `duration-4` steps the policy is queried on every fourth step
+    with the last four resized grayscale frames, and the most recent answer
+    is replayed on the steps in between. RAM cell 14 is sampled after each step.
+
+    Returns (Verdict, number of policy queries):
+      INCONCLUSIVE, 0 - the setup raised an exception
+      BAD             - more than 15 samples exist and speed_list[-6:-1] sums to 0
+      GOOD            - otherwise, after all steps
+    """
+    #print(f"Running Test from x: {x:04}, y: {y:04}, ski_position: {ski_position}", end="")
+    testDir = f"{x}_{y}_{ski_position}_{velocity}"
+    try:
+        for i, r in enumerate(ramDICT[y]):
+            ale.setRAM(i,r)
+        ski_position_setting = ski_position_counter[ski_position]
+        for i in range(0,ski_position_setting[1]):
+            ale.act(ski_position_setting[0])
+            ale.setRAM(14,0)
+            ale.setRAM(25,x)
+        ale.setRAM(14,180) # TODO
+    except Exception as e:
+        print(e)
+        # Logger.warn is a deprecated alias that newer Python versions dropped.
+        logger.warning(f"Could not run test for x: {x}, y: {y}, ski_position: {ski_position}, velocity: {velocity}")
+        return (Verdict.INCONCLUSIVE, 0)
+
+    num_queries = 0
    all_obs = list()
    speed_list = list()
-    first_action_set = False
-    first_action = 0
-    for i in range(0,duration):
-        resized_obs = cv2.resize(ale.getScreenGrayscale() , (84,84), interpolation=cv2.INTER_AREA)
+    resized_obs = cv2.resize(ale.getScreenGrayscale(), (84,84), interpolation=cv2.INTER_AREA)
+    # Pre-fill the frame stack with four copies of the initial frame.
+    for i in range(0,4):
        all_obs.append(resized_obs)
-        if len(all_obs) >= 4:
+    for i in range(0,duration-4):
+        resized_obs = cv2.resize(ale.getScreenGrayscale(), (84,84), interpolation=cv2.INTER_AREA)
+        all_obs.append(resized_obs)
+        if i % 4 == 0:
            stack_tensor = TensorDict({"obs": np.array(all_obs[-4:])})
            action = nn_wrapper.query(stack_tensor)
-            if not first_action_set:
-                first_action_set = True
-                first_action = input_to_action(str(action))
+            num_queries += 1
            ale.act(input_to_action(str(action)))
        else:
-            ale.act(Action.NOOP)
+            # Replay the latest policy answer; `action` is always bound because i == 0 queries first.
+            ale.act(input_to_action(str(action)))
        speed_list.append(ale.getRAM()[14])
        if len(speed_list) > 15 and sum(speed_list[-6:-1]) == 0:
-            return (Verdict.BAD, first_action)
-        #time.sleep(0.005)
-    return (Verdict.INCONCLUSIVE, first_action)
-
-def optimalAction(choices):
-    return max(choices.items(), key=operator.itemgetter(1))[0]
-
-def computeStateRanking(mdp_file):
-    command = f"{tempest_binary} --prism {mdp_file} --buildchoicelab --buildstateval --prop 'Rmax=? [C <= 1000]'"
-    exec(command)
+            #saveObservations(all_obs, Verdict.BAD, testDir)
+            return (Verdict.BAD, num_queries)
+    #saveObservations(all_obs, Verdict.GOOD, testDir)
+    return (Verdict.GOOD, num_queries)
+
+def skiPositionFormulaList(name):
+    """Return the balanced disjunction of the quoted labels "name_1" .. "name_<num_ski_positions>"."""
+    quoted_labels = [f"\"{name}_{position}\"" for position in range(1, num_ski_positions+1)]
+    return createBalancedDisjunction(quoted_labels)
+
+
+def computeStateRanking(mdp_file, iteration):
+    """Model check `mdp_file` with the tempest binary and collect the results.
+
+    Six `filter(...)` queries are issued (min/max/avg over Pmin, then
+    min/max/avg over Pmax) followed by `Rmax=? [C <= 200]`. At most six values
+    are parsed from the output lines containing "Result", the state count is
+    read from the line containing "States:", and the produced `action_ranking`
+    file is renamed to `action_ranking_{iteration:03}`.
+
+    Returns:
+        (TestResult, num_states); the three counters of the TestResult are 0.
+    Raises:
+        RuntimeError: if the run did not yield exactly six numeric results
+            (for instance because the model checker exited with an error).
+    """
+    logger.info("Computing state ranking")
+    tic()
+    unsafe = skiPositionFormulaList('Unsafe')
+    safe = skiPositionFormulaList('Safe')
+    path_formula = f"G !(\"Hit_Tree\" | \"Hit_Gate\" | {unsafe})"
+    state_filter = f"(!\"S_Hit_Tree\" & !\"S_Hit_Gate\") | ({safe} | {unsafe})"
+    # Same six queries as before, generated instead of copy-pasted.
+    prop = ""
+    for quantifier in ("Pmin", "Pmax"):
+        for aggregate in ("min", "max", "avg"):
+            prop += f"filter({aggregate}, {quantifier}=? [ {path_formula} ], {state_filter} );"
+    prop += 'Rmax=? [C <= 200]'
+    results = list()
+    # Bound before the try so the return below cannot hit an unbound local.
+    num_states = 0
+    try:
+        command = f"{tempest_binary} --prism {mdp_file} --buildchoicelab --buildstateval --build-all-labels --prop '{prop}'"
+        output = subprocess.check_output(command, shell=True).decode("utf-8").split('\n')
+        for line in output:
+            #print(line)
+            if "States:" in line:
+                num_states = int(line.split(" ")[-1])
+            if "Result" in line and not len(results) >= 6:
+                # A result is either an interval "[lo, hi]" or a single value.
+                range_value = re.search(r"(.*:).*\[(-?\d+\.?\d*), (-?\d+\.?\d*)\].*", line)
+                if range_value:
+                    results.append(float(range_value.group(2)))
+                    results.append(float(range_value.group(3)))
+                else:
+                    value = re.search(r"(.*:)(.*)", line)
+                    results.append(float(value.group(2)))
+        exec(f"mv action_ranking action_ranking_{iteration:03}")
+    except subprocess.CalledProcessError as e:
+        # todo die gracefully if ranking is uniform
+        print(e.output)
+    logger.info(f"Computing state ranking - DONE: took {toc()} seconds")
+    if len(results) != 6:
+        # TestResult needs exactly six estimates; fail with a readable message
+        # instead of an argument-count TypeError.
+        raise RuntimeError(f"Expected 6 model checking results for {mdp_file}, parsed {len(results)}")
+    return TestResult(*tuple(results),0,0,0), num_states

 def fillStateRanking(file_name, match=""):
+    """Parse a ranking file into a dict mapping State to StateValue.
+
+    Only lines containing "move=0" are considered, and entries whose ranking
+    value is <= 0.1 are dropped. The parsed velocity is integer-divided by 2
+    before it is stored in the State. `match` is currently unused.
+
+    Exits the process with status -1 if the file cannot be read; any other
+    error is logged with its traceback and re-raised.
+    """
+    logger.info(f"Parsing state ranking, {file_name}")
+    tic()
    state_ranking = dict()
    try:
        with open(file_name, "r") as f:
            file_content = f.readlines()
        for line in file_content:
            if not "move=0" in line: continue
+            # NOTE(review): the alternation binds as `Value:<float>` OR a bare `\d+`,
+            # so integer values only parse when no digits precede "Value:" - confirm the file layout.
+            ranking_value = float(re.search(r"Value:([+-]?(\d*\.\d+)|\d+)", line)[0].replace("Value:",""))
+            if ranking_value <= 0.1:
+                continue
            stateMapping = convert(re.findall(r"([a-zA-Z_]*[a-zA-Z])=(\d+)?", line))
-            #print("stateMapping", stateMapping)
            choices = convert(re.findall(r"[a-zA-Z_]*(left|right|noop)[a-zA-Z_]*:(-?\d+\.?\d*)", line))
            choices = {key:float(value) for (key,value) in choices.items()}
-            #print("choices", choices)
-            ranking_value = float(re.search(r"Value:([+-]?(\d*\.\d+)|\d+)", line)[0].replace("Value:",""))
-            #print("ranking_value", ranking_value)
-            state = State(int(stateMapping["x"]), int(stateMapping["y"]), int(stateMapping["ski_position"]))
+            state = State(int(stateMapping["x"]), int(stateMapping["y"]), int(stateMapping["ski_position"]), int(stateMapping["velocity"])//2)
            value = StateValue(ranking_value, choices)
            state_ranking[state] = value
+        logger.info(f"Parsing state ranking - DONE: took {toc()} seconds")
        return state_ranking
-
    except EnvironmentError:
        print("Ranking file not available. Exiting.")
-        sys.exit(1)
-
-
-fixed_left_states = list()
-fixed_right_states = list()
-fixed_noop_states = list()
-
-def populate_fixed_actions(state, action):
-    if action == Action.LEFT:
-        fixed_left_states.append(state)
-    if action == Action.RIGHT:
-        fixed_right_states.append(state)
-    if action == Action.NOOP:
-        fixed_noop_states.append(state)
-
-def update_prism_file(old_prism_file, new_prism_file):
-    fixed_left_formula = "formula Fixed_Left = false "
-    fixed_right_formula = "formula Fixed_Right = false "
-    fixed_noop_formula = "formula Fixed_Noop = false "
-    for state in fixed_left_states:
-        fixed_left_formula += f" | (x={state.x}&y={state.y}&ski_position={state.ski_position}) "
-    for state in fixed_right_states:
-        fixed_right_formula += f" | (x={state.x}&y={state.y}&ski_position={state.ski_position}) "
-    for state in fixed_noop_states:
-        fixed_noop_formula += f" | (x={state.x}&y={state.y}&ski_position={state.ski_position}) "
-    fixed_left_formula += ";\n"
-    fixed_right_formula += ";\n"
-    fixed_noop_formula += ";\n"
-    with open(f'{old_prism_file}', 'r') as file :
-      filedata = file.read()
-    if len(fixed_left_states)  > 0: filedata = re.sub(r"^formula Fixed_Left =.*$", fixed_left_formula, filedata, flags=re.MULTILINE)
-    if len(fixed_right_states) > 0: filedata = re.sub(r"^formula Fixed_Right =.*$", fixed_right_formula, filedata, flags=re.MULTILINE)
-    if len(fixed_noop_states)  > 0: filedata = re.sub(r"^formula Fixed_Noop =.*$", fixed_noop_formula, filedata, flags=re.MULTILINE)
-    with open(f'{new_prism_file}', 'w') as file:
-      file.write(filedata)
+        toc()
+        sys.exit(-1)
+    except Exception:
+        # A bare `except:` here used to swallow parse errors and return None,
+        # which only surfaced later as an unrelated AttributeError in the caller.
+        toc()
+        logger.exception(f"Failed to parse state ranking from {file_name}")
+        raise
+
+def createDisjunction(formulas):
+    """Join the given formula strings with " | " into one flat disjunction."""
+    separator = " | "
+    return separator.join(formulas)
+
+def statesFormulaTrimmed(states, name):
+    """Build the PRISM formulas `{name}_1` .. `{name}_<num_ski_positions>` for a state set.
+
+    states: iterable of tuples indexed as (x, y, ski_position, velocity).
+    name:   formula prefix, e.g. "Safe" or "Unsafe".
+
+    States are grouped by ski position, then velocity, then y. Within one
+    group, runs of consecutive x values are compressed into `lo<=x&x<=hi`
+    ranges. Ski positions without any state get `formula {name}_{i} = false;`.
+    Returns the formula definitions, one per line, newline-terminated.
+    """
+    skiPositionGroup = defaultdict(list)
+    for item in states:
+        skiPositionGroup[item[2]].append(item)
+
+    formulas = list()
+    for skiPosition, skiPos_group in skiPositionGroup.items():
+        formula = f"formula {name}_{skiPosition} = ( ski_position={skiPosition} & "
+        velocityGroup = defaultdict(list)
+        velocityFormulas = list()
+        for item in skiPos_group:
+            velocityGroup[item[3]].append(item)
+        for velocity, velocity_group in velocityGroup.items():
+            yPosGroup = defaultdict(list)
+            yFormulas = list()
+            for item in velocity_group:
+                yPosGroup[item[1]].append(item)
+            for y, y_group in yPosGroup.items():
+                sorted_y_group = sorted(y_group, key=lambda s: s[0])
+                current_x_min = sorted_y_group[0][0]
+                current_x = sorted_y_group[0][0]
+                x_ranges = list()
+                # Walk ALL remaining states. Skipping the last one and closing the
+                # final range at its x bridged any gap right before it, which
+                # pulled untested x values into the formula.
+                for state in sorted_y_group[1:]:
+                    if state[0] - current_x <= 1:
+                        current_x = state[0]
+                    else:
+                        x_ranges.append(f" ({current_x_min}<=x&x<={current_x})")
+                        current_x_min = state[0]
+                        current_x = state[0]
+                x_ranges.append(f" {current_x_min}<=x&x<={current_x}")
+                yFormulas.append(f" (y={y} & {createBalancedDisjunction(x_ranges)})")
+
+            # The velocity only partitions the states; it is deliberately not
+            # part of the emitted formula (alternative kept for reference):
+            #velocityFormulas.append(f"(velocity={velocity} & {createBalancedDisjunction(yFormulas)})")
+            velocityFormulas.append(f"({createBalancedDisjunction(yFormulas)})")
+        formula += createBalancedDisjunction(velocityFormulas) + ");"
+        formulas.append(formula)
+    for i in range(1, num_ski_positions+1):
+        if i in skiPositionGroup:
+            continue
+        formulas.append(f"formula {name}_{i} = false;")
+    return "\n".join(formulas) + "\n"
+
+# https://stackoverflow.com/questions/5389507/iterating-over-every-two-elements-in-a-list
+def pairwise(iterable):
+    """Pair up consecutive, non-overlapping elements: s -> (s0, s1), (s2, s3), (s4, s5), ...
+
+    A trailing element without a partner is dropped.
+    """
+    shared_iterator = iter(iterable)
+    # zip pulls twice from the same iterator per output tuple.
+    return zip(*[shared_iterator] * 2)
+
+def createBalancedDisjunction(formulas):
+    """Combine formula strings into a parenthesised, tree-shaped disjunction.
+
+    Neighbours are merged pairwise as "(f | g)" round after round until one
+    formula remains; an unpaired last element is carried into the next round.
+    An empty input yields "false".
+    """
+    if not len(formulas):
+        return "false"
+    level = formulas
+    while len(level) > 1:
+        merged = list()
+        for left, right in pairwise(level):
+            merged.append(f"({left} | {right})")
+        if len(level) % 2 == 1:
+            merged.append(level[-1])
+        level = merged
+    return " ".join(level)
+
+def updatePrismFile(newFile, iteration, safeStates, unsafeStates):
+    """Create `{newFile}_{iteration:03}.prism` from `{newFile}_no_formulas.prism`.
+
+    The template is copied and the Safe/Unsafe formulas for the given state
+    sets plus one label per formula and ski position are appended to the copy.
+    """
+    logger.info("Creating next prism file")
+    tic()
+    template = f"{newFile}_no_formulas.prism"
+    target_file = f"{newFile}_{iteration:03}.prism"
+    exec(f"cp {template} {target_file}", verbose=False)
+    with open(target_file, "a") as prism:
+        for states, formula_name in ((safeStates, "Safe"), (unsafeStates, "Unsafe")):
+            prism.write(statesFormulaTrimmed(states, formula_name))
+        for position in range(1,num_ski_positions+1):
+            prism.writelines([
+                f"label \"Safe_{position}\" = Safe_{position};\n",
+                f"label \"Unsafe_{position}\" = Unsafe_{position};\n",
+            ])
+
+    logger.info(f"Creating next prism file - DONE: took {toc()} seconds")
+

 ale = ALEInterface()

@ -218,34 +341,232 @@ x = 70

 nn_wrapper = SampleFactoryNNQueryWrapper()

-iteration = 0
-id = int(time.time())
-init_mdp = "velocity"
-exec(f"mkdir -p images/testing_{id}")
-exec(f"cp 1_full_scaled_down.png images/testing_{id}/testing_0000.png")
-exec(f"cp {init_mdp}.prism {init_mdp}_000.prism")
+experiment_id = int(time.time())
+init_mdp = "velocity_safety"
+exec(f"mkdir -p images/testing_{experiment_id}", verbose=False)

 markerSize = 1
-markerList = {1: list(), 2:list(), 3:list(), 4:list(), 5:list(), 6:list(), 7:list(), 8:list()}
-
-while True:
-    computeStateRanking(f"{init_mdp}_{iteration:03}.prism")
-    ranking = fillStateRanking("action_ranking")
-    sorted_ranking = sorted(ranking.items(), key=lambda x: x[1].ranking)
-    for important_state in sorted_ranking[-100:-1]:
-        optimal_choice = optimalAction(important_state[1].choices)
-        #print(important_state[1].choices, f"\t\tOptimal: {optimal_choice}")
-        x = important_state[0].x
-        y = important_state[0].y
-        ski_pos = model_to_actual(important_state[0].ski_position)
-        result = run_single_test(ale,nn_wrapper,x,y,ski_pos, duration=50)
-        #print(f".... {result}")
-        marker = f"-fill 'rgba({verdict_to_color_map[result[0]],0.7})' -draw 'rectangle {x-markerSize},{y-markerSize} {x+markerSize},{y+markerSize} '"
-        markerList[ski_pos].append(marker)
-        populate_fixed_actions(important_state[0], result[1])
+
+imagesDir = f"images/testing_{experiment_id}"
+
+def drawOntoSkiPosImage(states, color, target_prefix="cluster_", alpha_factor=1.0, markerSize=1, drawCircle=False):
+    """Draw one marker per state onto the per-(ski position, velocity) and per-ski-position images.
+
+    states: sequence of pairs; element 0 exposes x, y, ski_position and
+        velocity, element 1 exposes ranking.
+    color: colour tuple handed to OpenCV.
+    target_prefix: file name prefix of the images inside `imagesDir`; the
+        images are read, drawn on and written back under the same names.
+    alpha_factor: scales the ranking stored in each marker.
+        NOTE(review): that value is never used when drawing.
+    markerSize: half edge length of the filled rectangle around (x, y).
+    drawCircle: draw a filled circle of radius 1 at (x-markerSize, y-markerSize)
+        instead of the rectangle.
+    """
+    #markerList = {ski_position:list() for ski_position in range(1,num_ski_positions + 1)}
+    markerList = {(ski_position, velocity):list() for velocity in range(0, num_velocities) for ski_position in range(1,num_ski_positions + 1)}
+    images = dict()
+    mergedImages = dict()
+    # Load every target image up front; they are all rewritten at the end.
+    for ski_position in range(1, num_ski_positions + 1):
+        for velocity in range(0,num_velocities):
+            images[(ski_position, velocity)] = cv2.imread(f"{imagesDir}/{target_prefix}_{ski_position:02}_{velocity:02}_individual.png")
+        mergedImages[ski_position] = cv2.imread(f"{imagesDir}/{target_prefix}_{ski_position:02}_individual.png")
+    # Marker layout: [color, scaled ranking, top-left corner, bottom-right corner]
+    for state in states:
+        s = state[0]
+        marker = [color, alpha_factor * state[1].ranking, (s.x-markerSize, s.y-markerSize), (s.x+markerSize, s.y+markerSize)]
+        markerList[(s.ski_position, s.velocity)].append(marker)
+    # Each marker goes onto its (position, velocity) image and onto the merged image of its position.
+    for (pos, vel), marker in markerList.items():
+        if len(marker) == 0: continue
+        if drawCircle:
+            for m in marker:
+                images[(pos,vel)] = cv2.circle(images[(pos,vel)], m[2], 1, m[0], thickness=-1)
+                mergedImages[pos] = cv2.circle(mergedImages[pos], m[2], 1, m[0], thickness=-1)
+        else:
+            for m in marker:
+                images[(pos,vel)] = cv2.rectangle(images[(pos,vel)], m[2], m[3], m[0], cv2.FILLED)
+                mergedImages[pos] = cv2.rectangle(mergedImages[pos], m[2], m[3], m[0], cv2.FILLED)
+    for (ski_position, velocity), image in images.items():
+        cv2.imwrite(f"{imagesDir}/{target_prefix}_{ski_position:02}_{velocity:02}_individual.png", image)
+    for ski_position, image in mergedImages.items():
+        cv2.imwrite(f"{imagesDir}/{target_prefix}_{ski_position:02}_individual.png", image)
+
+def concatImages(prefix, iteration):
+    """Annotate every per-(position, velocity) image in place and build two montages.
+
+    Each individual image gets a 'pXXvYY' caption via `convert`; afterwards
+    `montage` tiles them into `{prefix}_{iteration}.png` and the per-position
+    images into `{prefix}_{iteration}_merged.png`, both inside `imagesDir`.
+    """
+    logger.info(f"Concatenating images")
+    tiles = list()
+    for vel in range(0, num_velocities):
+        for pos in range(1, num_ski_positions + 1):
+            tile = f"{imagesDir}/{prefix}_{pos:02}_{vel:02}_individual.png"
+            caption = f"-pointsize 10 -gravity NorthEast -annotate +8+0 'p{pos:02}v{vel:02}' "
+            # Source and destination are the same file: annotate in place.
+            exec(f"convert {tile} " + caption + tile, verbose=False)
+            tiles.append(tile)
+    mergedTiles = list()
+    for pos in range(1, num_ski_positions + 1):
+        mergedTiles.append(f"{imagesDir}/{prefix}_{pos:02}_individual.png")
+    exec(f"montage {' '.join(tiles)} -geometry +0+0 -tile 8x9 {imagesDir}/{prefix}_{iteration}.png", verbose=False)
+    exec(f"montage {' '.join(mergedTiles)} -geometry +0+0 -tile 8x9 {imagesDir}/{prefix}_{iteration}_merged.png", verbose=False)
+    #exec(f"sxiv {imagesDir}/{prefix}_{iteration}.png&", verbose=False)
+    logger.info(f"Concatenating images - DONE")
+
+def drawStatesOntoTiledImage(states, color, target, source="images/1_full_scaled_down.png", alpha_factor=1.0):
+    # NOTE: currently a no-op - the former implementation below is wrapped in
+    # the docstring, so calling this function does nothing and returns None.
+    """
+    Useful to draw a set of states, e.g. a single cluster
+    markerList = {1: list(), 2:list(), 3:list(), 4:list(), 5:list(), 6:list(), 7:list(), 8:list()}
+    logger.info(f"Drawing {len(states)} states onto {target}")
+    tic()
+    for state in states:
+        s = state[0]
+        marker = f"-fill 'rgba({color}, {alpha_factor * state[1].ranking})' -draw 'rectangle {s.x-markerSize},{s.y-markerSize} {s.x+markerSize},{s.y+markerSize} '"
+        markerList[s.ski_position].append(marker)
    for pos, marker in markerList.items():
-        command = f"convert images/testing_{id}/testing_0000.png {' '.join(marker)} images/testing_{id}/testing_{iteration+1:03}_{pos:02}.png"
+        command = f"convert {source} {' '.join(marker)} {imagesDir}/{target}_{pos:02}_individual.png"
        exec(command, verbose=False)
-    exec(f"montage images/testing_{id}/testing_{iteration+1:03}_*png -geometry +0+0 -tile x1 images/testing_{id}/{iteration+1:03}.png", verbose=False)
-    iteration += 1
-    update_prism_file(f"{init_mdp}_{iteration-1:03}.prism", f"{init_mdp}_{iteration:03}.prism")
+    exec(f"montage {imagesDir}/{target}_*_individual.png -geometry +0+0 -tile x1 {imagesDir}/{target}.png", verbose=False)
+    logger.info(f"Drawing {len(states)} states onto {target} - Done: took {toc()} seconds")
+    """
+
+def drawClusters(clusterDict, target, iteration, alpha_factor=1.0): # TODO do not draw already drawn clusters
+    """Draw every cluster in its own random colour, then rebuild the montage for `target`.
+
+    clusterDict: mapping whose values are the state lists of the clusters.
+    """
+    logger.info(f"Drawing {len(clusterDict)} clusters")
+    tic()
+    for clusterStates in clusterDict.values():
+        # Three independent draws from 0..255, converted to plain ints.
+        color = tuple(int(np.random.choice(range(256))) for _ in range(3))
+        drawOntoSkiPosImage(clusterStates, color, target, alpha_factor=alpha_factor)
+    concatImages(target, iteration)
+    logger.info(f"Drawing {len(clusterDict)} clusters - DONE: took {toc()} seconds")
+
+def drawResult(clusterDict, target, iteration): # TODO do not draw already drawn clusters
+    """Draw each tested cluster in the colour of its verdict.
+
+    clusterDict: mapping cluster id -> (cluster states, verdict).
+    GOOD and BAD clusters get (0,200,0) and (0,0,200) respectively; any other
+    verdict falls back to grey (100,100,100).
+    """
+    logger.info(f"Drawing {len(clusterDict)} results")
+    tic()
+    # opencv wants BGR
+    verdictColors = {Verdict.GOOD: (0,200,0), Verdict.BAD: (0,0,200)}
+    for clusterStates, result in clusterDict.values():
+        color = verdictColors.get(result, (100,100,100))
+        drawOntoSkiPosImage(clusterStates, color, target, alpha_factor=0.7)
+    logger.info(f"Drawing {len(clusterDict)} results - DONE: took {toc()} seconds")
+
+def _init_logger():
+    """Configure the 'main' logger: INFO level, one stdout handler with a '[LEVEL] module - message' format."""
+    stdoutHandler = logging.StreamHandler(sys.stdout)
+    stdoutHandler.setFormatter(logging.Formatter(       '[%(levelname)s] %(module)s - %(message)s'))
+    mainLogger = logging.getLogger('main')
+    mainLogger.setLevel(logging.INFO)
+    mainLogger.addHandler(stdoutHandler)
+
+def clusterImportantStates(ranking, iteration):
+    """Cluster the ranked states with k-means and draw the resulting clusters.
+
+    ranking: sequence of (state, value) pairs; the feature vector of an entry
+        is [x, y, ski_position*20, velocity*20, ranking].
+    The number of clusters is len(ranking) // 15. Entries labelled -1 would be
+    stored as single-element clusters under extra keys and reported.
+    Returns a dict mapping cluster label -> list of (state, value) pairs.
+    """
+    logger.info(f"Starting to cluster {len(ranking)} states into clusters")
+    tic()
+    features = list()
+    for entry in ranking:
+        position = entry[0]
+        features.append([position.x, position.y, position.ski_position * 20, position.velocity * 20, entry[1].ranking])
+    kmeans = KMeans(len(features) // 15, random_state=0, n_init="auto").fit(features)
+    #dbscan = DBSCAN(eps=5).fit(states)
+    labels = kmeans.labels_
+    noise_offset = 1 if -1 in labels else 0
+    n_clusters = len(set(labels)) - noise_offset
+    logger.info(f"Starting to cluster {len(ranking)} states into clusters - DONE: took {toc()} seconds with {n_clusters} cluster")
+    clusterDict = {label: list() for label in range(0,n_clusters)}
+    strayStates = list()
+    for label, state in zip(labels, ranking):
+        if label == -1:
+            # Every stray state becomes its own cluster under a fresh key.
+            clusterDict[n_clusters + len(strayStates) + 1] = [state]
+            strayStates.append(state)
+        else:
+            clusterDict[label].append(state)
+    if len(strayStates) > 0: logger.warning(f"{len(strayStates)} stray states with label -1")
+    drawClusters(clusterDict, f"clusters", iteration)
+    return clusterDict
+
+if __name__ == '__main__':
+    # Script entry point. Each iteration: write the next PRISM file from the
+    # safe/unsafe state sets, model check it, cluster the remaining ranked
+    # states, test sampled states of every cluster with the policy and mark
+    # whole clusters as safe or unsafe. Stops once the pessimistic and the
+    # optimistic average estimate differ by less than `eps`, or when
+    # clustering raises.
+    _init_logger()
+    logger = logging.getLogger('main')
+    logger.info("Starting")
+    testAll = False
+    num_queries = 0
+
+    # Seed every per-(position, velocity) and per-position image with the background picture.
+    source = "images/1_full_scaled_down.png"
+    for ski_position in range(1, num_ski_positions + 1):
+        for velocity in range(0,num_velocities):
+            exec(f"cp {source} {imagesDir}/clusters_{ski_position:02}_{velocity:02}_individual.png", verbose=False)
+            exec(f"cp {source} {imagesDir}/result_{ski_position:02}_{velocity:02}_individual.png", verbose=False)
+        exec(f"cp {source} {imagesDir}/clusters_{ski_position:02}_individual.png", verbose=False)
+        exec(f"cp {source} {imagesDir}/result_{ski_position:02}_individual.png", verbose=False)
+    safeStates = set()
+    unsafeStates = set()
+    iteration = 0
+    results = list()
+    goodVerdicts = 0
+    badVerdicts = 0
+    goodVerdictTestCases = list()
+    badVerdictTestCases = list()
+    safeClusters = 0
+    unsafeClusters = 0
+    eps = 0.1
+
+
+    while True:
+        updatePrismFile(init_mdp, iteration, safeStates, unsafeStates)
+        modelCheckingResult, numStates = computeStateRanking(f"{init_mdp}_{iteration:03}.prism", iteration)
+        if len(results) > 0:
+            # Carry the counters forward. These must be the declared TestResult
+            # fields (snake_case), otherwise csv() keeps printing the initial 0.
+            modelCheckingResult.safe_states    = results[-1].safe_states
+            modelCheckingResult.unsafe_states  = results[-1].unsafe_states
+            modelCheckingResult.policy_queries = results[-1].policy_queries
+        results.append(modelCheckingResult)
+        logger.info(f"Model Checking Result: {modelCheckingResult}")
+        if abs(modelCheckingResult.init_check_pes_avg - modelCheckingResult.init_check_opt_avg) < eps:
+            logger.info(f"Absolute difference between average estimates is below eps = {eps}... finishing!")
+            break
+
+
+        ranking = fillStateRanking(f"action_ranking_{iteration:03}")
+        sorted_ranking = sorted( (x for x in ranking.items() if x[1].ranking > 0.1), key=lambda x: x[1].ranking)
+        try:
+            clusters = clusterImportantStates(sorted_ranking, iteration)
+        except Exception as e:
+            print(e)
+            break
+
+        # Keyed by the actual cluster ids (`n_clusters` is not defined in this scope).
+        if testAll: failingPerCluster = {clusterId: list() for clusterId in clusters}
+        clusterResult = dict()
+        logger.info(f"Running tests")
+        tic()
+        for clusterId, cluster in clusters.items():
+            # NOTE(review): clusters with fewer than 1/factor states get zero
+            # tests and are therefore counted as safe untested - confirm intended.
+            num_tests = int(factor_tests_per_cluster * len(cluster))
+            #logger.info(f"Testing {num_tests} states (from {len(cluster)} states) from cluster {id}")
+            randomStates = np.random.choice(len(cluster), num_tests, replace=False)
+            randomStates = [cluster[i] for i in randomStates]
+
+            verdictGood = True
+            for state in randomStates:
+                x = state[0].x
+                y = state[0].y
+                ski_pos = state[0].ski_position
+                velocity = state[0].velocity
+                result, num_queries_this_test_case = run_single_test(ale,nn_wrapper,x,y,ski_pos, velocity, duration=50)
+                num_queries += num_queries_this_test_case
+                if result == Verdict.BAD:
+                    # Was never counted before, so the reported number stayed 0.
+                    badVerdicts += 1
+                    if testAll:
+                        failingPerCluster[clusterId].append(state)
+                    else:
+                        clusterResult[clusterId] = (cluster, Verdict.BAD)
+                        verdictGood = False
+                        unsafeStates.update([(s[0].x,s[0].y, s[0].ski_position, s[0].velocity) for s in cluster])
+                        badVerdictTestCases.append(state)
+                elif result == Verdict.GOOD:
+                    goodVerdicts += 1
+                    goodVerdictTestCases.append(state)
+            if verdictGood:
+                clusterResult[clusterId] = (cluster, Verdict.GOOD)
+                safeClusters += 1
+                safeStates.update([(s[0].x,s[0].y, s[0].ski_position, s[0].velocity) for s in cluster])
+            else:
+                unsafeClusters += 1
+        # Both denominators can legitimately be 0; report inf instead of crashing.
+        stateRatio = len(safeStates)/len(unsafeStates) if len(unsafeStates) > 0 else float("inf")
+        verdictRatio = goodVerdicts/badVerdicts if badVerdicts > 0 else float("inf")
+        logger.info(f"Tested Cluster: {iteration:03}\tSafe Cluster States : {len(safeStates)}({safeClusters}/{len(clusters)})\tUnsafe Cluster States:{len(unsafeStates)}({unsafeClusters}/{len(clusters)})\tGood Test Cases:{goodVerdicts}\tFailing Test Cases:{badVerdicts}\t{stateRatio} - {verdictRatio}")
+        results[-1].safe_states = len(safeStates)
+        results[-1].unsafe_states = len(unsafeStates)
+        results[-1].policy_queries = num_queries
+        results[-1].safe_cluster = safeClusters
+        results[-1].unsafe_cluster = unsafeClusters
+        results[-1].good_verdicts = goodVerdicts
+        results[-1].bad_verdicts = badVerdicts
+        # Account for self-loop states after first iteration
+        if iteration > 0:
+            results[-1].init_check_pes_avg = 1/(numStates+len(safeStates)+len(unsafeStates)) * (results[-1].init_check_pes_avg*numStates + 1.0*results[-2].unsafe_states + 0.0*results[-2].safe_states)
+            results[-1].init_check_opt_avg = 1/(numStates+len(safeStates)+len(unsafeStates)) * (results[-1].init_check_opt_avg*numStates + 0.0*results[-2].unsafe_states + 1.0*results[-2].safe_states)
+        for result in results:
+            print(result.csv())
+        if testAll: drawClusters(failingPerCluster, f"failing", iteration)
+
+        drawResult(clusterResult, "result", iteration)
+        drawOntoSkiPosImage(goodVerdictTestCases, (10,255,50), "result", alpha_factor=0.7, markerSize=0, drawCircle=True)
+        drawOntoSkiPosImage(badVerdictTestCases, (0,0,0), "result", alpha_factor=0.7, markerSize=0, drawCircle=True)
+        # `target` is not defined in this scope; the images drawn above use the "result" prefix.
+        concatImages("result", iteration)
+        iteration += 1
+
+    for result in results:
+        print(result.csv())
--- a/velocity_safety_no_formulas.prism
+++ b/velocity_safety_no_formulas.prism
@ -0,0 +1,137 @@
+mdp
+// Model constants: y ranges over [initY..maxY] and x over [minX..maxX] in the modules below.
+const int initY = 40; // lower bound of the y range
+const int initX = 80; // initial value of x
+
+const int maxY = 580; // upper bound of y; y updates are clamped to it
+//const int maxY = 360;
+//const int maxY = 200;
+const int minX = 10; // lower clamp for x
+const int maxX = 152; // upper clamp for x
+const int maxVel = 8; // cap applied whenever velocity is increased
+
+// Gate_i holds when x lies strictly inside one of two x-intervals and y strictly inside a shared y-band; presumably the two poles of gate i - confirm.
+formula Gate_1 = (((42<x & x<50) | (74<x  & x<82))  & 164<y & y<172);
+formula Gate_2 = (((72<x & x<80) | (104<x & x<112)) & 256<y & y<264);
+formula Gate_3 = (((80<x & x<88) | (112<x & x<120)) & 349<y & y<357);
+formula Gate_4 = (((54<x & x<62) | (88<x  & x<96))  & 442<y & y<450);
+formula Gate_5 = (((80<x & x<88) | (112<x & x<120)) & 530<y & y<538);
+
+formula S_Gate_1 = (((32<x & x<60) | (64<x  & x<92))  & 124<y & y<172); // S_Gate_i = Gate_i with each x-interval widened by 10 per side and the lower y bound reduced by 40
+formula S_Gate_2 = (((62<x & x<90) | (94<x & x<122)) & 216<y & y<264); // upper x bound was 132; 122 is Gate_2's 112 plus the 10 margin used by every other interval
+formula S_Gate_3 = (((70<x & x<98) | (102<x & x<130)) & 309<y & y<357);
+formula S_Gate_4 = (((44<x & x<72) | (78<x  & x<106))  & 402<y & y<450);
+formula S_Gate_5 = (((70<x & x<98) | (102<x & x<130)) & 490<y & y<538);
+
+// Tree_i holds when (x,y) lies inside an axis-aligned box with inclusive bounds.
+formula Tree_1 = ((x>=124 & x<=142) & (y>=190 & y<=200));
+formula Tree_2 = ((x>=32 & x<=49)   & (y>=284 & y<=295));
+formula Tree_3 = ((x>=30 & x<=49)   & (y>=317 & y<=327));
+formula Tree_4 = ((x>=12 & x<=30)   & (y>=408 & y<=418));
+formula Tree_5 = ((x>=129 & x<=146) & (y>=468 & y<=480));
+formula Tree_6 = ((x>=140 & x<=152) & (y>=496 & y<=510));
+
+formula S_Tree_1 = ((x>=114 & x<=152) & (y>=150 & y<=200)); // S_Tree_i = Tree_i widened by 10 in x on both sides with the lower y bound reduced by 40
+formula S_Tree_2 = ((x>=22 & x<=59)   & (y>=244 & y<=295));
+formula S_Tree_3 = ((x>=20 & x<=59)   & (y>=277 & y<=327));
+formula S_Tree_4 = ((x>=2 & x<=40)   & (y>=368 & y<=418));
+formula S_Tree_5 = ((x>=119 & x<=156) & (y>=428 & y<=480)); // lower y bound was 438; 428 is Tree_5's 468 minus the 40 margin used by every other box
+formula S_Tree_6 = ((x>=130 & x<=162) & (y>=456 & y<=510));
+
+formula Hit_Tree = Tree_1 | Tree_2 | Tree_3 | Tree_4 | Tree_5 | Tree_6; // true inside any tree box
+formula Hit_Gate = Gate_1 | Gate_2 | Gate_3 | Gate_4 | Gate_5; // true inside any gate region
+formula S_Hit_Tree = S_Tree_1 | S_Tree_2 | S_Tree_3 | S_Tree_4 | S_Tree_5 | S_Tree_6; // true inside any enlarged tree box
+formula S_Hit_Gate = S_Gate_1 | S_Gate_2 | S_Gate_3 | S_Gate_4 | S_Gate_5; // true inside any enlarged gate region
+// NOTE(review): Safe_1..Safe_8 and Unsafe_1..Unsafe_8 are not defined in this file; presumably they are supplied externally before model checking - confirm.
+formula Safe = ( (Safe_1 | Safe_2) | (Safe_3 | Safe_4) ) | ( (Safe_5 | Safe_6) | (Safe_7 | Safe_8) );
+formula Unsafe = ( (Unsafe_1 | Unsafe_2) | (Unsafe_3 | Unsafe_4) ) | ( (Unsafe_5 | Unsafe_6) | (Unsafe_7 | Unsafe_8) );
+
+// Labels expose the hit formulas (exact and enlarged regions) under the same names for use in properties.
+label "Hit_Tree" = Hit_Tree;
+label "Hit_Gate" = Hit_Gate;
+label "S_Hit_Tree" = S_Hit_Tree;
+label "S_Hit_Gate" = S_Hit_Gate;
+
+// move sequences one step across the modules: 0 = skier action or done, 1 = y update, 2 = velocity/standstill update, 3 = x update.
+global move : [0..3];
+
+
+// skier: picks left/right/noop while no terminal formula holds and hands over with move'=1; [done] sets reward_given once a terminal formula holds.
+module skier
+  ski_position : [1..8] init 4;
+  reward_given: bool init false;
+  //done: bool init false;
+
+  // Steering commands: only enabled at move=0 and while none of Safe, Unsafe, Hit_Gate, Hit_Tree holds; left/right change ski_position by one within [1..8].
+  [left]  !reward_given & !Safe & !Unsafe & !Hit_Gate & !Hit_Tree & move=0 & ski_position>1 -> (ski_position'=ski_position-1) & (move'=1);
+  [right] !reward_given & !Safe & !Unsafe & !Hit_Gate & !Hit_Tree & move=0 & ski_position<8 -> (ski_position'=ski_position+1) & (move'=1);
+  [noop]  !reward_given & !Safe & !Unsafe & !Hit_Gate & !Hit_Tree & move=0 -> (move'=1);
+
+  // Terminal command: fires once (guarded by !reward_given) when any of the four terminal formulas holds; move stays at 0.
+  [done] !reward_given & (Hit_Tree | Hit_Gate | Safe | Unsafe) & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Unsafe_1 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Unsafe_2 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Unsafe_3 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Unsafe_4 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Unsafe_5 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Unsafe_6 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Unsafe_7 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Unsafe_8 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Safe_1 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Safe_2 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Safe_3 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Safe_4 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Safe_5 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Safe_6 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Safe_7 & move=0 -> (reward_given'=true);
+  //[done] !reward_given & Safe_8 & move=0 -> (reward_given'=true);
+
+
+endmodule
+// updateY: at move=1 advances y by velocity (unless standstill>=5), then at move=2 adjusts velocity and standstill from ski_position and sets move'=3.
+module updateY
+  y : [initY..maxY] ; // declared without an explicit init
+  // NOTE(review): standstill is only incremented by the standstill>=5 command and no command raises it from below 5, so the >=5 branches look unreachable unless its initial value is set elsewhere - confirm.
+  velocity: [0..16];
+  standstill : [0..8] ;
+  [update_y] move=1 & standstill>=5 -> (y'=y) & (move'=2);
+  [update_y] move=1 & standstill<5  -> (y'=min(maxY,y+velocity)) & (move'=2);
+  // Velocity change per ski_position: 1/8 -> -4, 2/7 -> -2, 3/6 -> +2, 4/5 -> +4 (floored at 0, capped at maxVel); every position except 1/8 resets standstill to 0.
+  [update_y] move=2 & (ski_position=1 | ski_position = 8) & standstill>=5 -> (standstill'=min(8,standstill+1)) & (move'=3);
+  [update_y] move=2 & (ski_position=1 | ski_position = 8) & standstill<5  -> (velocity'=max(0,velocity-4)) &(move'=3);
+  [update_y] move=2 & (ski_position=2 | ski_position = 7) -> (velocity'=max(0 ,velocity-2)) & (standstill'=0) & (move'=3);
+  [update_y] move=2 & (ski_position=3 | ski_position = 6) -> (velocity'=min(maxVel,velocity+2)) & (standstill'=0) & (move'=3);
+  [update_y] move=2 & (ski_position=4 | ski_position = 5) -> (velocity'=min(maxVel,velocity+4)) & (standstill'=0) & (move'=3);
+endmodule
+// updateX: at move=3 shifts x probabilistically according to ski_position and returns control to the skier with move'=0.
+module updateX
+  x : [minX..maxX] init initX;
+  // standstill>=8 and positions 4/5 leave x unchanged; positions 3/2/1 decrease x and 6/7/8 increase it by the listed amounts, clamped to [minX..maxX].
+  [update_x]  move=3 & standstill>=8                                       -> (move'=0);
+  [update_x]  move=3 & standstill<8 & (ski_position=4 | ski_position=5)    -> (move'=0);
+
+  [update_x]  move=3 & standstill<8 & (ski_position=3)  -> 0.4: (x'=max(minX,x-0)) & (move'=0) + 0.6: (x'=max(minX,x-1)) & (move'=0);
+  [update_x]  move=3 & standstill<8 & (ski_position=6)  -> 0.4: (x'=min(maxX,x+0)) & (move'=0) + 0.6: (x'=min(maxX,x+1)) & (move'=0);
+
+  [update_x]  move=3 & standstill<8 & (ski_position=2)  -> 0.3: (x'=max(minX,x-1)) & (move'=0) + 0.7: (x'=max(minX,x-2)) & (move'=0);
+  [update_x]  move=3 & standstill<8 & (ski_position=7)  -> 0.3: (x'=min(maxX,x+1)) & (move'=0) + 0.7: (x'=min(maxX,x+2)) & (move'=0);
+
+  [update_x]  move=3 & standstill<8 & (ski_position=1)  -> 0.2: (x'=max(minX,x-2)) & (move'=0) + 0.8: (x'=max(minX,x-3)) & (move'=0);
+  [update_x]  move=3 & standstill<8 & (ski_position=8)  -> 0.2: (x'=min(maxX,x+2)) & (move'=0) + 0.8: (x'=min(maxX,x+3)) & (move'=0);
+endmodule
+
+//rewards
+//  [left] !done & !reward_given & Hit_Tree : -100;
+//  [left] !done & !reward_given & Hit_Gate : -100;
+//  [left] !done & !reward_given & (Unsafe_1 | Unsafe_2 | Unsafe_3 | Unsafe_4 | Unsafe_5 | Unsafe_6 | Unsafe_7 | Unsafe_8) : -100;
+//  [right] !done & !reward_given & Hit_Tree : -100;
+//  [right] !done & !reward_given & Hit_Gate : -100;
+//  [right] !done & !reward_given & (Unsafe_1 | Unsafe_2 | Unsafe_3 | Unsafe_4 | Unsafe_5 | Unsafe_6 | Unsafe_7 | Unsafe_8) : -100;
+//  [noop] !done & !reward_given & Hit_Tree : -100;
+//  [noop] !done & !reward_given & Hit_Gate : -100;
+//  [noop] !done & !reward_given & (Unsafe_1 | Unsafe_2 | Unsafe_3 | Unsafe_4 | Unsafe_5 | Unsafe_6 | Unsafe_7 | Unsafe_8) : -100;
+//endrewards
+// Attaches -100 to the [done] action in states where a gate or tree is hit or any Unsafe_i holds; no reward is defined for states that are only Safe.
+rewards
+  [done] !reward_given & (Hit_Gate | Hit_Tree | Unsafe_1 | Unsafe_2 | Unsafe_3 | Unsafe_4 | Unsafe_5 | Unsafe_6 | Unsafe_7 | Unsafe_8) : -100;
+endrewards
Author	SHA1	Message	Date
sp	570fa4c166	updates ....	2 years ago
sp	99f5d833db	more changes for rom_evaluate	2 years ago
sp	bfa808983b	updated formula computation YRanges	2 years ago
sp	3d05a4aeda	mdp update	2 years ago
sp	6fce864656	more changes...	2 years ago
sp	3fc7278c60	more work on testing framework	2 years ago
sp	d7e1c14863	some fixes in init mdp	2 years ago
sp	b30a3b8bf2	added method to just consider XY for restriction formulas	2 years ago
sp	69d06c48d0	added velocity to rom_evaluate	2 years ago
sp	622338b7b0	more tries with init mdp	2 years ago
sp	e04d141419	WIP rom_evaluate update	2 years ago
sp	812c42b105	small update for init mdp	2 years ago
sp	019ea0ad1e	redid querying	2 years ago
sp	4d6733b6d8	added velocity, unsure about it though	2 years ago
sp	37e9675022	small changes regarding image bookkeeping	2 years ago
sp	746795cd40	added vanilla mdp file	2 years ago
sp	bf5b21872c	started working on iterative workflow - cluster result to formula - etc TODO: Properly implement naming scheme for images	2 years ago
sp	5d5f6ea38c	more work on setting up the framework - changed querying of NN - drawing of clusters - drawing of test results - save each test runs individual observations - etc.	2 years ago
sp	e7b5f8344b	started working on clustering via kmeans	2 years ago