
Nondeterministic infinite horizon: split the value getters into a StateValueGetter and an ActionValueGetter. Made the VI code more general so that it can also be used for Markov Automata.
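For orientation, a minimal sketch of the new call pattern (hypothetical caller code, not part of this commit: helper, env and stateRewards stand for an already constructed SparseNondeterministicInfiniteHorizonHelper<double>, an Environment and a per-state reward vector):

    // Hypothetical usage sketch: helper, env and stateRewards are assumed to exist.
    std::vector<double> lraValues = helper.computeLongRunAverageValues(
            env,
            // state-based values, indexed by state
            [&stateRewards](uint64_t stateIndex) { return stateRewards[stateIndex]; },
            // action-based values, indexed by global choice index (none in this sketch)
            [](uint64_t /*globalChoiceIndex*/) { return 0.0; });

Previously, a single combined getter of the form (stateIndex, globalChoiceIndex) -> value had to be provided.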

tempestpy_adaptions
Tim Quatmann 4 years ago
parent · commit fc66e01ed5
  1. src/storm/modelchecker/helper/infinitehorizon/SparseNondeterministicInfiniteHorizonHelper.cpp (438 changed lines)
  2. src/storm/modelchecker/helper/infinitehorizon/SparseNondeterministicInfiniteHorizonHelper.h (16 changed lines)

src/storm/modelchecker/helper/infinitehorizon/SparseNondeterministicInfiniteHorizonHelper.cpp (438 changed lines)

@@ -31,36 +31,56 @@ namespace storm {
template <typename ValueType>
std::vector<ValueType> SparseNondeterministicInfiniteHorizonHelper<ValueType>::computeLongRunAverageProbabilities(Environment const& env, storm::storage::BitVector const& psiStates) {
return computeLongRunAverageValues(env, [&psiStates] (uint64_t stateIndex, uint64_t) { return psiStates.get(stateIndex) ? storm::utility::one<ValueType>() : storm::utility::zero<ValueType>();});
return computeLongRunAverageValues(env,
[&psiStates] (uint64_t stateIndex) { return psiStates.get(stateIndex) ? storm::utility::one<ValueType>() : storm::utility::zero<ValueType>(); },
[] (uint64_t) { return storm::utility::zero<ValueType>(); }
);
}
template <typename ValueType>
std::vector<ValueType> SparseNondeterministicInfiniteHorizonHelper<ValueType>::computeLongRunAverageRewards(Environment const& env, storm::models::sparse::StandardRewardModel<ValueType> const& rewardModel) {
if (_markovianStates) {
return computeLongRunAverageValues(env, [&] (uint64_t stateIndex, uint64_t globalChoiceIndex) {
if (rewardModel.hasStateRewards() && _markovianStates->get(stateIndex)) {
return rewardModel.getTotalStateActionReward(stateIndex, globalChoiceIndex, _transitionMatrix, (ValueType) (storm::utility::one<ValueType>() / (*_exitRates)[stateIndex]));
} else {
return rewardModel.getTotalStateActionReward(stateIndex, globalChoiceIndex, _transitionMatrix, storm::utility::zero<ValueType>());
}
});
std::function<ValueType(uint64_t stateIndex)> stateRewardsGetter;
if (rewardModel.hasStateRewards()) {
stateRewardsGetter = [&rewardModel] (uint64_t stateIndex) { return rewardModel.getStateReward(stateIndex); };
} else {
stateRewardsGetter = [] (uint64_t) { return storm::utility::zero<ValueType>(); };
}
std::function<ValueType(uint64_t globalChoiceIndex)> actionRewardsGetter;
if (rewardModel.hasStateActionRewards() || rewardModel.hasTransitionRewards()) {
if (rewardModel.hasTransitionRewards()) {
actionRewardsGetter = [&] (uint64_t globalChoiceIndex) { return rewardModel.getStateActionAndTransitionReward(globalChoiceIndex, this->_transitionMatrix); };
} else {
actionRewardsGetter = [&] (uint64_t globalChoiceIndex) { return rewardModel.getStateActionReward(globalChoiceIndex); };
}
} else {
return computeLongRunAverageValues(env, [&] (uint64_t stateIndex, uint64_t globalChoiceIndex) {
return rewardModel.getTotalStateActionReward(stateIndex, globalChoiceIndex, _transitionMatrix);
});
stateRewardsGetter = [] (uint64_t) { return storm::utility::zero<ValueType>(); };
}
return computeLongRunAverageValues(env, stateRewardsGetter, actionRewardsGetter);
}
template <typename ValueType>
std::vector<ValueType> SparseNondeterministicInfiniteHorizonHelper<ValueType>::computeLongRunAverageValues(Environment const& env, std::vector<ValueType> const& combinedStateActionRewards) {
return computeLongRunAverageValues(env, [&combinedStateActionRewards] (uint64_t, uint64_t globalChoiceIndex) {
return combinedStateActionRewards[globalChoiceIndex];
});
std::vector<ValueType> SparseNondeterministicInfiniteHorizonHelper<ValueType>::computeLongRunAverageValues(Environment const& env, std::vector<ValueType> const* stateValues, std::vector<ValueType> const* actionValues) {
std::function<ValueType(uint64_t stateIndex)> stateValuesGetter;
if (stateValues) {
stateValuesGetter = [&stateValues] (uint64_t stateIndex) { return (*stateValues)[stateIndex]; };
} else {
stateValuesGetter = [] (uint64_t) { return storm::utility::zero<ValueType>(); };
}
std::function<ValueType(uint64_t actionIndex)> actionValuesGetter;
if (actionValues) {
actionValuesGetter = [&actionValues] (uint64_t globalChoiceIndex) { return (*actionValues)[globalChoiceIndex]; };
} else {
actionValuesGetter = [] (uint64_t) { return storm::utility::zero<ValueType>(); };
}
return computeLongRunAverageValues(env, stateValuesGetter, actionValuesGetter);
}
template <typename ValueType>
std::vector<ValueType> SparseNondeterministicInfiniteHorizonHelper<ValueType>::computeLongRunAverageValues(Environment const& env, std::function<ValueType(uint64_t stateIndex, uint64_t globalChoiceIndex)> const& combinedStateActionRewardsGetter) {
std::vector<ValueType> SparseNondeterministicInfiniteHorizonHelper<ValueType>::computeLongRunAverageValues(Environment const& env, std::function<ValueType(uint64_t stateIndex)> const& stateRewardsGetter, std::function<ValueType(uint64_t globalChoiceIndex)> const& actionRewardsGetter) {
// Prepare an environment for the underlying solvers
auto underlyingSolverEnvironment = env;
@@ -86,7 +106,7 @@ namespace storm {
std::vector<ValueType> mecLraValues;
mecLraValues.reserve(mecDecomposition.size());
for (auto const& mec : mecDecomposition) {
mecLraValues.push_back(computeLraForMec(underlyingSolverEnvironment, combinedStateActionRewardsGetter, mec));
mecLraValues.push_back(computeLraForMec(underlyingSolverEnvironment, stateRewardsGetter, actionRewardsGetter, mec));
}
// Solve the resulting SSP where end components are collapsed into single auxiliary states
@@ -129,36 +149,45 @@ namespace storm {
}
template <typename ValueType>
ValueType SparseNondeterministicInfiniteHorizonHelper<ValueType>::computeLraForMec(Environment const& env, std::function<ValueType(uint64_t stateIndex, uint64_t globalChoiceIndex)> const& combinedStateActionRewardsGetter, storm::storage::MaximalEndComponent const& mec) {
bool SparseNondeterministicInfiniteHorizonHelper<ValueType>::isContinuousTime() const {
STORM_LOG_ASSERT((_markovianStates == nullptr) == (_exitRates == nullptr), "Inconsistent information given: Have Markovian states but no exit rates (or vice versa)." );
return _markovianStates != nullptr;
}
template <typename ValueType>
ValueType SparseNondeterministicInfiniteHorizonHelper<ValueType>::computeLraForMec(Environment const& env, std::function<ValueType(uint64_t stateIndex)> const& stateRewardsGetter, std::function<ValueType(uint64_t globalChoiceIndex)> const& actionRewardsGetter, storm::storage::MaximalEndComponent const& mec) {
// FIXME: MA
// If the mec only consists of a single state, we compute the LRA value directly
if (++mec.begin() == mec.end()) {
if (mec.size() == 1) {
uint64_t state = mec.begin()->first;
auto choiceIt = mec.begin()->second.begin();
ValueType result = combinedStateActionRewardsGetter(state, *choiceIt);
uint64_t bestChoice = *choiceIt;
for (++choiceIt; choiceIt != mec.begin()->second.end(); ++choiceIt) {
ValueType choiceValue = combinedStateActionRewardsGetter(state, *choiceIt);
if (this->minimize()) {
if (result > choiceValue) {
result = std::move(choiceValue);
if (isContinuousTime()) {
// Singleton MECs have to consist of a Markovian state because of the non-Zenoness assumption. Then, there is just one possible choice.
STORM_LOG_THROW(_markovianStates->get(state), storm::exceptions::InvalidOperationException, "Markov Automaton has Zeno behavior. Computation of Long Run Average values not supported.");
STORM_LOG_ASSERT(mec.begin()->second.size() == 1, "Markovian state has Nondeterministic behavior.");
if (isProduceSchedulerSet()) {
_producedOptimalChoices.get()[state] = 0;
}
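// In a Markovian state, the (single) choice is taken at rate (*_exitRates)[state] per time unit on average,
// so the instantaneous action reward contributes exitRate * actionReward to the long-run average,
// while the state reward is a reward rate and enters the sum unscaled.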
return stateRewardsGetter(state) + (*_exitRates)[state] * actionRewardsGetter(*choiceIt);
} else {
// Find the choice with the highest/lowest reward
ValueType bestValue = actionRewardsGetter(*choiceIt);
uint64_t bestChoice = *choiceIt;
for (++choiceIt; choiceIt != mec.begin()->second.end(); ++choiceIt) {
ValueType currentValue = actionRewardsGetter(*choiceIt);
if ((this->minimize() && currentValue < bestValue) || (this->maximize() && currentValue > bestValue)) {
bestValue = std::move(currentValue);
bestChoice = *choiceIt;
}
} else {
if (result < choiceValue) {
result = std::move(choiceValue);
bestChoice = *choiceIt;
}
}
if (isProduceSchedulerSet()) {
_producedOptimalChoices.get()[state] = bestChoice - _transitionMatrix.getRowGroupIndices()[state];
}
return bestValue + stateRewardsGetter(state);
}
if (isProduceSchedulerSet()) {
_producedOptimalChoices.get()[state] = bestChoice - _transitionMatrix.getRowGroupIndices()[state];
}
return result;
}
// Solve MEC with the method specified in the settings
// Solve nontrivial MEC with the method specified in the settings
storm::solver::LraMethod method = env.solver().lra().getNondetLraMethod();
if ((storm::NumberTraits<ValueType>::IsExact || env.solver().isForceExact()) && env.solver().lra().isNondetLraMethodSetFromDefault() && method != storm::solver::LraMethod::LinearProgramming) {
STORM_LOG_INFO("Selecting 'LP' as the solution technique for long-run properties to guarantee exact results. If you want to override this, please explicitly specify a different LRA method.");
@@ -169,144 +198,281 @@ namespace storm {
}
STORM_LOG_ERROR_COND(!isProduceSchedulerSet() || method == storm::solver::LraMethod::ValueIteration, "Scheduler generation not supported for the chosen LRA method. Try value-iteration.");
if (method == storm::solver::LraMethod::LinearProgramming) {
return computeLraForMecLp(env, combinedStateActionRewardsGetter, mec);
return computeLraForMecLp(env, stateRewardsGetter, actionRewardsGetter, mec);
} else if (method == storm::solver::LraMethod::ValueIteration) {
return computeLraForMecVi(env, combinedStateActionRewardsGetter, mec);
return computeLraForMecVi(env, stateRewardsGetter, actionRewardsGetter, mec);
} else {
STORM_LOG_THROW(false, storm::exceptions::InvalidSettingsException, "Unsupported technique.");
}
}
/*!
* Abstract helper class that performs a single iteration of the value iteration method
*/
template <typename ValueType>
ValueType SparseNondeterministicInfiniteHorizonHelper<ValueType>::computeLraForMecVi(Environment const& env, std::function<ValueType(uint64_t stateIndex, uint64_t globalChoiceIndex)> const& combinedStateActionRewardsGetter, storm::storage::MaximalEndComponent const& mec) {
// Initialize data about the mec
storm::storage::BitVector mecStates(_transitionMatrix.getRowGroupCount(), false);
storm::storage::BitVector mecChoices(_transitionMatrix.getRowCount(), false);
for (auto const& stateChoicesPair : mec) {
mecStates.set(stateChoicesPair.first);
for (auto const& choice : stateChoicesPair.second) {
mecChoices.set(choice);
class LraViHelper {
public:
LraViHelper(storm::storage::MaximalEndComponent const& mec, storm::storage::SparseMatrix<ValueType> const& transitionMatrix) : _mec(mec), _transitionMatrix(transitionMatrix) {
// Intentionally left empty
}
virtual ~LraViHelper() = default;
/*!
* Performs a single iteration step.
* If a choices vector is given, the optimal choices will be inserted at the appropriate states.
* Note that these choices will be inserted w.r.t. the original model states/choices, i.e., the size of the vector should match the state count of the input model.
* The current estimate of the LRA value can be obtained afterwards via checkConvergence.
*/
virtual void iterate(Environment const& env, storm::solver::OptimizationDirection const& dir, std::vector<uint64_t>* choices = nullptr) = 0;
struct ConvergenceCheckResult {
bool isPrecisionAchieved;
ValueType currentValue;
};
/*!
* Checks whether the currently computed value achieves the desired precision
*/
virtual ConvergenceCheckResult checkConvergence(bool relative, ValueType precision) = 0;
/*!
* Must be called between two calls of iterate.
*/
virtual void prepareNextIteration() = 0;
protected:
/*!
*
* @param xPrevious the 'old' values
* @param xCurrent the 'new' values
* @param threshold the threshold
* @param relative whether the relative difference should be considered
* @return The first component is true if the (relative) difference between the maximal and the minimal entry-wise change of the two value vectors is below or equal to the provided threshold.
* In this case, the second component is the average of the maximal and the minimal change.
* If the threshold is exceeded, the computation is aborted early and the second component is then only an approximation of that average.
*/
std::pair<bool, ValueType> checkMinMaxDiffBelowThreshold(std::vector<ValueType> const& xPrevious, std::vector<ValueType> const& xCurrent, ValueType const& threshold, bool relative) const {
STORM_LOG_ASSERT(xPrevious.size() == xCurrent.size(), "Unexpected Dimension Mismatch");
STORM_LOG_ASSERT(threshold > storm::utility::zero<ValueType>(), "Did not expect a non-positive threshold.");
auto x1It = xPrevious.begin();
auto x1Ite = xPrevious.end();
auto x2It = xCurrent.begin();
ValueType maxDiff = (*x2It - *x1It);
ValueType minDiff = maxDiff;
bool result = true;
// The difference between maxDiff and minDiff is zero at this point. Thus, it doesn't make sense to check the threshold now.
for (++x1It, ++x2It; x1It != x1Ite; ++x1It, ++x2It) {
ValueType diff = (*x2It - *x1It);
// Potentially update maxDiff or minDiff
bool skipCheck = false;
if (maxDiff < diff) {
maxDiff = diff;
} else if (minDiff > diff) {
minDiff = diff;
} else {
skipCheck = true;
}
// Check convergence
if (!skipCheck && (maxDiff - minDiff) > (relative ? (threshold * minDiff) : threshold)) {
result = false;
break;
}
}
ValueType avgDiff = (maxDiff + minDiff) / (storm::utility::convertNumber<ValueType>(2.0));
return {result, avgDiff};
}
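// Illustration with hypothetical numbers (not taken from any model):
//   xPrevious = {1.0, 2.0, 3.0}, xCurrent = {1.5, 2.6, 3.4}, entry-wise changes = {0.5, 0.6, 0.4},
//   hence maxDiff = 0.6 and minDiff = 0.4.
//   Absolute threshold 0.25: maxDiff - minDiff = 0.2 <= 0.25, so the result is {true, (0.6 + 0.4) / 2} = {true, 0.5}.
//   Relative threshold 0.25: 0.2 > 0.25 * minDiff = 0.1, so the first component is false.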
boost::container::flat_map<uint64_t, uint64_t> toSubModelStateMapping;
uint64_t currState = 0;
toSubModelStateMapping.reserve(mecStates.getNumberOfSetBits());
for (auto const& mecState : mecStates) {
toSubModelStateMapping.insert(std::pair<uint64_t, uint64_t>(mecState, currState));
++currState;
}
// Get a transition matrix that only considers the states and choices within the MEC
storm::storage::SparseMatrixBuilder<ValueType> mecTransitionBuilder(mecChoices.getNumberOfSetBits(), mecStates.getNumberOfSetBits(), 0, true, true, mecStates.getNumberOfSetBits());
std::vector<ValueType> choiceValues;
choiceValues.reserve(mecChoices.getNumberOfSetBits());
uint64_t currRow = 0;
ValueType selfLoopProb = storm::utility::convertNumber<ValueType>(env.solver().lra().getAperiodicFactor());
ValueType scalingFactor = storm::utility::one<ValueType>() - selfLoopProb;
for (auto const& mecState : mecStates) {
mecTransitionBuilder.newRowGroup(currRow);
uint64_t groupStart = _transitionMatrix.getRowGroupIndices()[mecState];
uint64_t groupEnd = _transitionMatrix.getRowGroupIndices()[mecState + 1];
for (uint64_t choice = mecChoices.getNextSetIndex(groupStart); choice < groupEnd; choice = mecChoices.getNextSetIndex(choice + 1)) {
bool insertedDiagElement = false;
for (auto const& entry : _transitionMatrix.getRow(choice)) {
uint64_t column = toSubModelStateMapping[entry.getColumn()];
if (!insertedDiagElement && entry.getColumn() > mecState) {
mecTransitionBuilder.addNextValue(currRow, toSubModelStateMapping[mecState], selfLoopProb);
insertedDiagElement = true;
storm::storage::MaximalEndComponent const& _mec;
storm::storage::SparseMatrix<ValueType> const& _transitionMatrix;
};
/*!
* Helper class that performs the iterations of the value iteration method for MDPs
* @see Ashok et al.: Value Iteration for Long-Run Average Reward in Markov Decision Processes (CAV'17), https://doi.org/10.1007/978-3-319-63387-9_10
*/
template <typename ValueType>
class MdpLraViHelper : public LraViHelper<ValueType> {
public:
MdpLraViHelper(storm::storage::MaximalEndComponent const& mec, storm::storage::SparseMatrix<ValueType> const& transitionMatrix, std::function<ValueType(uint64_t stateIndex)> const& stateRewardsGetter, std::function<ValueType(uint64_t globalChoiceIndex)> const& actionRewardsGetter, ValueType const& aperiodicFactor) : LraViHelper<ValueType>(mec, transitionMatrix), _x1(mec.size(), storm::utility::zero<ValueType>()), _x2(_x1), _x1IsCurrent(true) {
// We add a selfloop to each state (which is necessary for convergence)
// Very roughly, this selfloop prevents the values from flipping back and forth like this: [1, 0] -> [0, 1] -> [1, 0] -> ...
ValueType selfLoopProb = aperiodicFactor;
// Introducing the selfloop also requires the rewards to be scaled by the following factor.
_scalingFactor = storm::utility::one<ValueType>() - selfLoopProb;
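// Why this is sound: with self-loop probability d, each induced transition matrix becomes P' = d*I + (1-d)*P
// and the rewards become r' = (1-d)*r. Any stationary distribution of P is also stationary for P'
// (pi*P' = d*pi + (1-d)*pi*P = pi), so the long-run average value of the transformed MEC is exactly
// (1-d) times the original one; checkConvergence() divides by _scalingFactor = 1-d to undo this.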
uint64_t numMecStates = this->_mec.size();
boost::container::flat_map<uint64_t, uint64_t> toSubModelStateMapping;
toSubModelStateMapping.reserve(this->_mec.size());
uint64_t currState = 0;
uint64_t numMecChoices = 0;
for (auto const& stateChoices : this->_mec) {
toSubModelStateMapping.insert(std::pair<uint64_t, uint64_t>(stateChoices.first, currState));
++currState;
numMecChoices += stateChoices.second.size();
}
assert(currState == numMecStates);
// Get a transition matrix that only considers the states and choices within the MEC
storm::storage::SparseMatrixBuilder<ValueType> mecTransitionBuilder(numMecChoices, numMecStates, 0, true, true, numMecStates);
_choiceValues.reserve(numMecChoices);
uint64_t currRow = 0;
for (auto const& stateChoices : this->_mec) {
auto const& mecState = stateChoices.first;
auto const& mecChoices = stateChoices.second;
mecTransitionBuilder.newRowGroup(currRow);
for (auto const& choice : mecChoices) {
bool insertedDiagElement = false;
for (auto const& entry : this->_transitionMatrix.getRow(choice)) {
uint64_t column = toSubModelStateMapping[entry.getColumn()];
if (!insertedDiagElement && entry.getColumn() > mecState) {
mecTransitionBuilder.addNextValue(currRow, toSubModelStateMapping[mecState], selfLoopProb);
insertedDiagElement = true;
}
if (!insertedDiagElement && entry.getColumn() == mecState) {
mecTransitionBuilder.addNextValue(currRow, column, selfLoopProb + _scalingFactor * entry.getValue());
insertedDiagElement = true;
} else {
mecTransitionBuilder.addNextValue(currRow, column, _scalingFactor * entry.getValue());
}
}
if (!insertedDiagElement && entry.getColumn() == mecState) {
mecTransitionBuilder.addNextValue(currRow, column, selfLoopProb + scalingFactor * entry.getValue());
insertedDiagElement = true;
} else {
mecTransitionBuilder.addNextValue(currRow, column, scalingFactor * entry.getValue());
if (!insertedDiagElement) {
mecTransitionBuilder.addNextValue(currRow, toSubModelStateMapping[mecState], selfLoopProb);
}
// Compute the rewards obtained for this choice
_choiceValues.push_back(_scalingFactor * (stateRewardsGetter(mecState) + actionRewardsGetter(choice)));
++currRow;
}
if (!insertedDiagElement) {
mecTransitionBuilder.addNextValue(currRow, toSubModelStateMapping[mecState], selfLoopProb);
}
_mecTransitions = mecTransitionBuilder.build();
STORM_LOG_ASSERT(_mecTransitions.isProbabilistic(), "The MEC-Matrix is not probabilistic.");
STORM_LOG_ASSERT(_mecTransitions.getRowGroupCount() == _x1.size(), "Unexpected size mismatch for created matrix.");
STORM_LOG_ASSERT(_x1.size() == _x2.size(), "Unexpected size mismatch for created matrix.");
}
virtual void iterate(Environment const& env, storm::solver::OptimizationDirection const& dir, std::vector<uint64_t>* choices = nullptr) override {
// Initialize a multiplier if it does not exist yet
if (!_multiplier) {
_multiplier = storm::solver::MultiplierFactory<ValueType>().create(env, _mecTransitions);
}
if (choices == nullptr) {
// Perform a simple matrix-vector multiplication
_multiplier->multiplyAndReduce(env, dir, xCurrent(), &_choiceValues, xPrevious());
} else {
// Perform a simple matrix-vector multiplication but also keep track of the choices within the _mecTransitions
std::vector<uint64_t> mecChoices(_mecTransitions.getRowGroupCount());
_multiplier->multiplyAndReduce(env, dir, xCurrent(), &_choiceValues, xPrevious(), &mecChoices);
// Transform the local choices (within this mec) to global indices
uint64_t mecState = 0;
for (auto const& stateChoices : this->_mec) {
uint64_t mecChoice = mecChoices[mecState];
STORM_LOG_ASSERT(mecChoice < stateChoices.second.size(), "The selected choice does not seem to exist.");
uint64_t globalChoiceIndex = *(stateChoices.second.begin() + mecChoice);
(*choices)[stateChoices.first] = globalChoiceIndex - this->_transitionMatrix.getRowGroupIndices()[stateChoices.first];
++mecState;
}
// Compute the rewards obtained for this choice
choiceValues.push_back(scalingFactor * combinedStateActionRewardsGetter(mecState, choice));
++currRow;
}
// Swap current and previous x vectors
_x1IsCurrent = !_x1IsCurrent;
}
auto mecTransitions = mecTransitionBuilder.build();
STORM_LOG_ASSERT(mecTransitions.isProbabilistic(), "The MEC-Matrix is not probabilistic.");
// start the iterations
ValueType precision = storm::utility::convertNumber<ValueType>(env.solver().lra().getPrecision()) / scalingFactor;
bool relative = env.solver().lra().getRelativeTerminationCriterion();
std::vector<ValueType> x(mecTransitions.getRowGroupCount(), storm::utility::zero<ValueType>());
std::vector<ValueType> xPrime = x;
auto dir = this->getOptimizationDirection();
virtual typename LraViHelper<ValueType>::ConvergenceCheckResult checkConvergence(bool relative, ValueType precision) override {
typename LraViHelper<ValueType>::ConvergenceCheckResult res;
std::tie(res.isPrecisionAchieved, res.currentValue) = this->checkMinMaxDiffBelowThreshold(xPrevious(), xCurrent(), precision, relative);
res.currentValue /= _scalingFactor; // "Undo" the scaling of the rewards
return res;
}
auto multiplier = storm::solver::MultiplierFactory<ValueType>().create(env, mecTransitions);
ValueType maxDiff, minDiff;
virtual void prepareNextIteration() override {
// To avoid large (and numerically unstable) x-values, we subtract a reference value.
ValueType referenceValue = xCurrent().front();
storm::utility::vector::applyPointwise<ValueType, ValueType>(xCurrent(), xCurrent(), [&referenceValue] (ValueType const& x_i) -> ValueType { return x_i - referenceValue; });
}
uint64_t iter = 0;
private:
std::vector<ValueType>& xCurrent() {
return _x1IsCurrent ? _x1 : _x2;
}
std::vector<ValueType>& xPrevious() {
return _x1IsCurrent ? _x2 : _x1;
}
storm::storage::SparseMatrix<ValueType> _mecTransitions;
std::vector<ValueType> _x1, _x2, _choiceValues;
bool _x1IsCurrent;
std::unique_ptr<storm::solver::Multiplier<ValueType>> _multiplier;
ValueType _scalingFactor;
};
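For reference, the update performed by MdpLraViHelper::iterate is the value-iteration step for long-run average rewards from the CAV'17 paper cited above, applied to the transformed MEC built in the constructor (a sketch, with self-loop probability \delta and scaled rewards r'):

    x_{k+1}(s) \;=\; \operatorname{opt}_{\alpha \in \mathit{Act}(s)} \Big( r'(s,\alpha) + \sum_{s'} P'(s' \mid s,\alpha)\, x_k(s') \Big)

checkConvergence then estimates the LRA value as \big(\max_s (x_{k+1} - x_k)(s) + \min_s (x_{k+1} - x_k)(s)\big) / \big(2\,(1-\delta)\big) and reports convergence once the span of the entry-wise change, \max_s - \min_s, falls below the given precision.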
template <typename ValueType>
ValueType SparseNondeterministicInfiniteHorizonHelper<ValueType>::computeLraForMecVi(Environment const& env, std::function<ValueType(uint64_t stateIndex)> const& stateRewardsGetter, std::function<ValueType(uint64_t globalChoiceIndex)> const& actionRewardsGetter, storm::storage::MaximalEndComponent const& mec) {
// Collect some parameters of the computation.
ValueType aperiodicFactor = storm::utility::convertNumber<ValueType>(env.solver().lra().getAperiodicFactor());
ValueType precision = storm::utility::convertNumber<ValueType>(env.solver().lra().getPrecision()) / aperiodicFactor;
bool relative = env.solver().lra().getRelativeTerminationCriterion();
boost::optional<uint64_t> maxIter;
if (env.solver().lra().isMaximalIterationCountSet()) {
maxIter = env.solver().lra().getMaximalIterationCount();
}
auto dir = this->getOptimizationDirection();
// Create an object for the iterations
std::shared_ptr<LraViHelper<ValueType>> iterationHelper;
if (isContinuousTime()) {
// TODO
} else {
iterationHelper = std::make_shared<MdpLraViHelper<ValueType>>(mec, _transitionMatrix, stateRewardsGetter, actionRewardsGetter, aperiodicFactor);
}
// start the iterations
ValueType result = storm::utility::zero<ValueType>();
uint64_t iter = 0;
while (!maxIter.is_initialized() || iter < maxIter.get()) {
++iter;
// Compute the obtained values for the next step
multiplier->multiplyAndReduce(env, dir, x, &choiceValues, x);
// update xPrime and check for convergence
// to avoid large (and numerically unstable) x-values, we subtract a reference value.
auto xIt = x.begin();
auto xPrimeIt = xPrime.begin();
ValueType refVal = *xIt;
maxDiff = *xIt - *xPrimeIt;
minDiff = maxDiff;
*xIt -= refVal;
*xPrimeIt = *xIt;
for (++xIt, ++xPrimeIt; xIt != x.end(); ++xIt, ++xPrimeIt) {
ValueType diff = *xIt - *xPrimeIt;
maxDiff = std::max(maxDiff, diff);
minDiff = std::min(minDiff, diff);
*xIt -= refVal;
*xPrimeIt = *xIt;
}
if ((maxDiff - minDiff) <= (relative ? (precision * minDiff) : precision)) {
iterationHelper->iterate(env, dir);
// Check if we are done
auto convergenceCheckResult = iterationHelper->checkConvergence(relative, precision);
result = convergenceCheckResult.currentValue;
if (convergenceCheckResult.isPrecisionAchieved) {
break;
}
if (storm::utility::resources::isTerminate()) {
break;
}
iterationHelper->prepareNextIteration();
}
if (maxIter.is_initialized() && iter == maxIter.get()) {
STORM_LOG_WARN("LRA computation did not converge within " << iter << " iterations.");
} else if (storm::utility::resources::isTerminate()) {
STORM_LOG_WARN("LRA computation aborted after " << iter << " iterations.");
} else {
STORM_LOG_TRACE("LRA computation converged after " << iter << " iterations.");
}
if (isProduceSchedulerSet()) {
std::vector<uint_fast64_t> localMecChoices(mecTransitions.getRowGroupCount(), 0);
multiplier->multiplyAndReduce(env, dir, x, &choiceValues, x, &localMecChoices);
auto localMecChoiceIt = localMecChoices.begin();
for (auto const& mecState : mecStates) {
// Get the choice index of the selected mec choice with respect to the global transition matrix.
uint_fast64_t globalChoice = mecChoices.getNextSetIndex(_transitionMatrix.getRowGroupIndices()[mecState]);
for (uint_fast64_t i = 0; i < *localMecChoiceIt; ++i) {
globalChoice = mecChoices.getNextSetIndex(globalChoice + 1);
}
STORM_LOG_ASSERT(globalChoice < _transitionMatrix.getRowGroupIndices()[mecState + 1], "Invalid global choice for mec state.");
_producedOptimalChoices.get()[mecState] = globalChoice - _transitionMatrix.getRowGroupIndices()[mecState];
++localMecChoiceIt;
}
// We will be doing one more iteration step and track scheduler choices this time.
iterationHelper->prepareNextIteration();
iterationHelper->iterate(env, dir, &_producedOptimalChoices.get());
}
return (maxDiff + minDiff) / (storm::utility::convertNumber<ValueType>(2.0) * scalingFactor);
return result;
}
template <typename ValueType>
ValueType SparseNondeterministicInfiniteHorizonHelper<ValueType>::computeLraForMecLp(Environment const& env, std::function<ValueType(uint64_t stateIndex, uint64_t globalChoiceIndex)> const& combinedStateActionRewardsGetter, storm::storage::MaximalEndComponent const& mec) {
ValueType SparseNondeterministicInfiniteHorizonHelper<ValueType>::computeLraForMecLp(Environment const& env, std::function<ValueType(uint64_t stateIndex)> const& stateRewardsGetter, std::function<ValueType(uint64_t globalChoiceIndex)> const& actionRewardsGetter, storm::storage::MaximalEndComponent const& mec) {
std::shared_ptr<storm::solver::LpSolver<ValueType>> solver = storm::utility::solver::getLpSolver<ValueType>("LRA for MEC");
solver->setOptimizationDirection(invert(this->getOptimizationDirection()));
@@ -330,7 +496,7 @@ namespace storm {
for (auto element : _transitionMatrix.getRow(choice)) {
constraint = constraint + stateToVariableMap.at(element.getColumn()) * solver->getConstant(element.getValue());
}
constraint = solver->getConstant(combinedStateActionRewardsGetter(state, choice)) + constraint;
constraint = solver->getConstant(stateRewardsGetter(state) + actionRewardsGetter(choice)) + constraint;
if (this->minimize()) {
constraint = stateToVariableMap.at(state) <= constraint;
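For reference, the constraint loop above assembles the right-hand side r(s,\alpha) + \sum_{s'} P(s' \mid s,\alpha)\, x_{s'} of the classic gain LP for long-run average values in a MEC. A textbook sketch for the maximizing case (the hunk is truncated here, so the setup of the gain variable g and of the objective is not shown):

    \min\; g \quad \text{s.t.} \quad g + x_s \;\ge\; r(s,\alpha) + \sum_{s'} P(s' \mid s,\alpha)\, x_{s'} \qquad \text{for all states } s \text{ of the MEC and all choices } \alpha \text{ of } s

For the minimizing case, the objective and the inequalities are flipped, which matches the inverted solver direction and the this->minimize() branch above.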

src/storm/modelchecker/helper/infinitehorizon/SparseNondeterministicInfiniteHorizonHelper.h (16 changed lines)

@@ -44,13 +44,13 @@ namespace storm {
* Computes the long run average value given the provided action-based rewards
* @return a value for each state
*/
std::vector<ValueType> computeLongRunAverageValues(Environment const& env, std::vector<ValueType> const& combinedStateActionRewards);
std::vector<ValueType> computeLongRunAverageValues(Environment const& env, std::vector<ValueType> const* stateValues = nullptr, std::vector<ValueType> const* actionValues = nullptr);
/*!
* Computes the long run average value given the provided state-action-based rewards
* @return a value for each state
*/
std::vector<ValueType> computeLongRunAverageValues(Environment const& env, std::function<ValueType(uint64_t stateIndex, uint64_t globalChoiceIndex)> const& combinedStateActionRewardsGetter);
std::vector<ValueType> computeLongRunAverageValues(Environment const& env, std::function<ValueType(uint64_t stateIndex)> const& stateValuesGetter, std::function<ValueType(uint64_t globalChoiceIndex)> const& actionValuesGetter);
/*!
* Sets whether an optimal scheduler shall be constructed during the computation
@@ -81,21 +81,27 @@ namespace storm {
storm::storage::Scheduler<ValueType> extractScheduler() const;
protected:
/*!
* @return true iff this is a computation on a continuous time model (i.e. MA)
*/
bool isContinuousTime() const;
/*!
* @pre if scheduler production is enabled, the _producedOptimalChoices vector should be initialized and sufficiently large
* @return the (unique) optimal LRA value for the given mec.
* @post _producedOptimalChoices contains choices for the states of the given MEC which yield the returned LRA value.
*/
ValueType computeLraForMec(Environment const& env, std::function<ValueType(uint64_t stateIndex, uint64_t globalChoiceIndex)> const& combinedStateActionRewardsGetter, storm::storage::MaximalEndComponent const& mec);
ValueType computeLraForMec(Environment const& env, std::function<ValueType(uint64_t stateIndex)> const& stateValuesGetter, std::function<ValueType(uint64_t globalChoiceIndex)> const& actionValuesGetter, storm::storage::MaximalEndComponent const& mec);
/*!
* As computeLraForMec but uses value iteration as a solution method (independent of what is set in env)
*/
ValueType computeLraForMecVi(Environment const& env, std::function<ValueType(uint64_t stateIndex, uint64_t globalChoiceIndex)> const& combinedStateActionRewardsGetter, storm::storage::MaximalEndComponent const& mec);
ValueType computeLraForMecVi(Environment const& env, std::function<ValueType(uint64_t stateIndex)> const& stateValuesGetter, std::function<ValueType(uint64_t globalChoiceIndex)> const& actionValuesGetter, storm::storage::MaximalEndComponent const& mec);
/*!
* As computeLraForMec but uses linear programming as a solution method (independent of what is set in env)
*/
ValueType computeLraForMecLp(Environment const& env, std::function<ValueType(uint64_t stateIndex, uint64_t globalChoiceIndex)> const& combinedStateActionRewardsGetter, storm::storage::MaximalEndComponent const& mec);
ValueType computeLraForMecLp(Environment const& env, std::function<ValueType(uint64_t stateIndex)> const& stateValuesGetter, std::function<ValueType(uint64_t globalChoiceIndex)> const& actionValuesGetter, storm::storage::MaximalEndComponent const& mec);
/*!
* @return Lra values for each state
