extended mec eliminator to minimal rewards

8 years ago · 820f2ddf4c
2 changed files with 111 additions and 39 deletions
--- a/src/storm-pomdp/transformer/GlobalPomdpMecChoiceEliminator.cpp
+++ b/src/storm-pomdp/transformer/GlobalPomdpMecChoiceEliminator.cpp
@ -31,13 +31,60 @@ namespace storm {
                subformula = std::make_shared<storm::logic::UntilFormula>(storm::logic::Formula::getTrueFormula(), subformula->asEventuallyFormula().getSubformula().asSharedPointer());
            }
            
-            if (subformula->isUntilFormula()) {
+            if (formula.isProbabilityOperatorFormula() && subformula->isUntilFormula()) {
                if (!minimizes) {
                    return transformMax(subformula->asUntilFormula());
                }
+            } else if (formula.isRewardOperatorFormula() && subformula->isEventuallyFormula()) {
+                if (minimizes) {
+                    return transformMinReward(subformula->asEventuallyFormula());
+                }
            }
            STORM_LOG_THROW(false, storm::exceptions::InvalidPropertyException, "Mec elimination is not supported for the property " << formula);
+            return nullptr;
+        }
+        
+        template<typename ValueType>
+        std::shared_ptr<storm::models::sparse::Pomdp<ValueType>> GlobalPomdpMecChoiceEliminator<ValueType>::transformMinReward(storm::logic::EventuallyFormula const& formula) const {
+            assert (formula.isRewardPathFormula());
+            auto backwardTransitions = pomdp.getBackwardTransitions();
+            storm::storage::BitVector allStates(pomdp.getNumberOfStates(), true);
+            auto prob1EStates = storm::utility::graph::performProb1E(pomdp.getTransitionMatrix(), pomdp.getTransitionMatrix().getRowGroupIndices(), backwardTransitions, allStates, checkPropositionalFormula(formula.getSubformula()));
+            STORM_LOG_THROW(prob1EStates.full(), storm::exceptions::InvalidPropertyException, "There are states from which the set of target states is not reachable. This is not supported.");
+            auto prob1AStates = storm::utility::graph::performProb1A(pomdp.getTransitionMatrix(), pomdp.getTransitionMatrix().getRowGroupIndices(), backwardTransitions, allStates, checkPropositionalFormula(formula.getSubformula()));
+            
+            auto mecs = decomposeEndComponents(~prob1AStates, ~allStates);
+            
+            // Get the 'out' state for every MEC with just a single out state
+            storm::storage::BitVector uniqueOutStates = getEndComponentsWithSingleOutStates(mecs);
+            
+            // For each observation of some 'out' state get the intersection of the choices that lead to the corresponding MEC
+            std::vector<storm::storage::BitVector> mecChoicesPerObservation = getEndComponentChoicesPerObservation(mecs, uniqueOutStates);
+
+            
+            // Filter the observations that have a state that is not an out state
+            storm::storage::BitVector stateFilter = ~uniqueOutStates;
+            for (auto const& state : stateFilter) {
+                mecChoicesPerObservation[pomdp.getObservation(state)].clear();
+            }
+            
+            // It should not be possible to clear all choices for an observation since we only consider states that lead outside of its MEC.
+            for (auto& clearedChoices : mecChoicesPerObservation) {
+                STORM_LOG_ASSERT(clearedChoices.size() == 0 || !clearedChoices.full(), "Tried to clear all choices for an observation.");
+            }
+            
+            // transform the set of selected choices to global choice indices
+            storm::storage::BitVector choiceFilter(pomdp.getNumberOfChoices(), true);
+            stateFilter.complement();
+            for (auto const& state : stateFilter) {
+                uint64_t offset = pomdp.getTransitionMatrix().getRowGroupIndices()[state];
+                for (auto const& choice : mecChoicesPerObservation[pomdp.getObservation(state)]) {
+                    choiceFilter.set(offset + choice, false);
+                }
+            }
            
+            ChoiceSelector<ValueType> cs(pomdp);
+            return cs.transform(choiceFilter)->template as<storm::models::sparse::Pomdp<ValueType>>();
        }
        
        template<typename ValueType>
@ -46,9 +93,41 @@ namespace storm {
            auto prob01States = storm::utility::graph::performProb01Max(pomdp.getTransitionMatrix(), pomdp.getTransitionMatrix().getRowGroupIndices(), backwardTransitions, checkPropositionalFormula(formula.getLeftSubformula()), checkPropositionalFormula(formula.getRightSubformula()));
            auto mecs = decomposeEndComponents(~(prob01States.first | prob01States.second), prob01States.first);
            
-            std::vector<storm::storage::BitVector> mecChoicesPerObservation(pomdp.getNrObservations());
-            storm::storage::BitVector uniqueOutStates(pomdp.getNumberOfStates(), false);
-            // Find the MECs that have only one 'out' state
+            // Get the 'out' state for every MEC with just a single out state
+            storm::storage::BitVector uniqueOutStates = getEndComponentsWithSingleOutStates(mecs);
+            
+            // For each observation of some 'out' state get the intersection of the choices that lead to the corresponding MEC
+            std::vector<storm::storage::BitVector> mecChoicesPerObservation = getEndComponentChoicesPerObservation(mecs, uniqueOutStates);
+
+            
+            // Filter the observations that have a state that is neither an out state, nor a prob0A state
+            storm::storage::BitVector stateFilter = ~(uniqueOutStates | prob01States.first);
+            for (auto const& state : stateFilter) {
+                mecChoicesPerObservation[pomdp.getObservation(state)].clear();
+            }
+            
+            // It should not be possible to clear all choices for an observation since we only consider states that lead outside of its MEC.
+            for (auto& clearedChoices : mecChoicesPerObservation) {
+                STORM_LOG_ASSERT(clearedChoices.size() == 0 || !clearedChoices.full(), "Tried to clear all choices for an observation.");
+            }
+            
+            // transform the set of selected choices to global choice indices
+            storm::storage::BitVector choiceFilter(pomdp.getNumberOfChoices(), true);
+            stateFilter.complement();
+            for (auto const& state : stateFilter) {
+                uint64_t offset = pomdp.getTransitionMatrix().getRowGroupIndices()[state];
+                for (auto const& choice : mecChoicesPerObservation[pomdp.getObservation(state)]) {
+                    choiceFilter.set(offset + choice, false);
+                }
+            }
+            
+            ChoiceSelector<ValueType> cs(pomdp);
+            return cs.transform(choiceFilter)->template as<storm::models::sparse::Pomdp<ValueType>>();
+        }
+        
+        template<typename ValueType>
+        storm::storage::BitVector GlobalPomdpMecChoiceEliminator<ValueType>::getEndComponentsWithSingleOutStates(storm::storage::MaximalEndComponentDecomposition<ValueType> const& mecs) const {
+            storm::storage::BitVector result(pomdp.getNumberOfStates(), false);
            for (auto const& mec : mecs) {
                boost::optional<uint64_t> uniqueOutState = boost::none;
                for (auto const& stateActionsPair : mec) {
@ -64,16 +143,27 @@ namespace storm {
                    }
                }
                if (uniqueOutState) {
-                    uniqueOutStates.set(uniqueOutState.get(), true);
+                    result.set(uniqueOutState.get(), true);
+                }
+            }
+            return result;
+        }
        
-                    storm::storage::BitVector localChoiceIndices(pomdp.getNumberOfChoices(uniqueOutState.get()), false);
-                    uint64_t offset = pomdp.getTransitionMatrix().getRowGroupIndices()[uniqueOutState.get()];
-                    for (auto const& choice : mec.getChoicesForState(uniqueOutState.get())) {
+        template<typename ValueType>
+        std::vector<storm::storage::BitVector> GlobalPomdpMecChoiceEliminator<ValueType>::getEndComponentChoicesPerObservation(storm::storage::MaximalEndComponentDecomposition<ValueType> const& mecs, storm::storage::BitVector const& consideredStates) const {
+            
+            std::vector<storm::storage::BitVector> result(pomdp.getNrObservations());
+            for (auto const& mec : mecs) {
+                for (auto const& stateActions : mec) {
+                    if (consideredStates.get(stateActions.first)) {
+                        storm::storage::BitVector localChoiceIndices(pomdp.getNumberOfChoices(stateActions.first), false);
+                        uint64_t offset = pomdp.getTransitionMatrix().getRowGroupIndices()[stateActions.first];
+                        for (auto const& choice : stateActions.second) {
                            assert(choice >= offset);
                            localChoiceIndices.set(choice - offset, true);
                        }
                        
-                    auto& mecChoices = mecChoicesPerObservation[pomdp.getObservation(uniqueOutState.get())];
+                        auto& mecChoices = result[pomdp.getObservation(stateActions.first)];
                        if (mecChoices.size() == 0) {
                            mecChoices = localChoiceIndices;
                        } else {
@ -82,31 +172,10 @@ namespace storm {
                        }
                    }
                }
-            
-            // Filter the observations that have a state that is neither an out state, nor a prob0A or prob1A state
-            storm::storage::BitVector stateFilter = ~(uniqueOutStates | prob01States.first | prob01States.second);
-            for (auto const& state : stateFilter) {
-                mecChoicesPerObservation[pomdp.getObservation(state)].clear();
-            }
-            
-            // It should not be possible to clear all choices for an observation since we only consider states that lead outside of its MEC.
-            for (auto& clearedChoices : mecChoicesPerObservation) {
-                STORM_LOG_ASSERT(clearedChoices.size() == 0 || !clearedChoices.full(), "Tried to clear all choices for an observation.");
-            }
-            
-            // transform the set of selected choices to global choice indices
-            storm::storage::BitVector choiceFilter(pomdp.getNumberOfChoices(), true);
-            stateFilter.complement();
-            for (auto const& state : stateFilter) {
-                uint64_t offset = pomdp.getTransitionMatrix().getRowGroupIndices()[state];
-                for (auto const& choice : mecChoicesPerObservation[pomdp.getObservation(state)]) {
-                    choiceFilter.set(offset + choice, false);
            }
+            return result;
        }

-            ChoiceSelector<ValueType> cs(pomdp);
-            return cs.transform(choiceFilter)->template as<storm::models::sparse::Pomdp<ValueType>>();
-        }
        
        template<typename ValueType>
        storm::storage::MaximalEndComponentDecomposition<ValueType> GlobalPomdpMecChoiceEliminator<ValueType>::decomposeEndComponents(storm::storage::BitVector const& subsystem, storm::storage::BitVector const& redirectingStates) const {
--- a/src/storm-pomdp/transformer/GlobalPomdpMecChoiceEliminator.h
+++ b/src/storm-pomdp/transformer/GlobalPomdpMecChoiceEliminator.h
@ -20,8 +20,11 @@ namespace storm {
            
        private:
            
+            std::shared_ptr<storm::models::sparse::Pomdp<ValueType>> transformMinReward(storm::logic::EventuallyFormula const& formula) const;
            std::shared_ptr<storm::models::sparse::Pomdp<ValueType>> transformMax(storm::logic::UntilFormula const& formula) const;
            storm::storage::MaximalEndComponentDecomposition<ValueType> decomposeEndComponents(storm::storage::BitVector const& subsystem, storm::storage::BitVector const& ignoredStates) const;
+            storm::storage::BitVector getEndComponentsWithSingleOutStates(storm::storage::MaximalEndComponentDecomposition<ValueType> const& mecs) const;
+            std::vector<storm::storage::BitVector> getEndComponentChoicesPerObservation(storm::storage::MaximalEndComponentDecomposition<ValueType> const& mecs, storm::storage::BitVector const& consideredStates) const;
            
            storm::storage::BitVector checkPropositionalFormula(storm::logic::Formula const& propositionalFormula) const;