Renamed BeliefGrid to BeliefManager

5 years ago · 0b552e6813
3 changed files with 85 additions and 79 deletions
--- a/src/storm-pomdp/modelchecker/ApproximatePOMDPModelchecker.cpp
+++ b/src/storm-pomdp/modelchecker/ApproximatePOMDPModelchecker.cpp
@ -380,9 +380,9 @@ namespace storm {
                    underMap = underApproximationMap.value();
                }

-                storm::storage::BeliefGrid<storm::models::sparse::Pomdp<ValueType>> beliefGrid(pomdp, options.numericPrecision);
+                auto beliefManager = std::make_shared<storm::storage::BeliefManager<storm::models::sparse::Pomdp<ValueType>>>(pomdp, options.numericPrecision);
                if (computeRewards) {
-                    beliefGrid.setRewardModel();
+                    beliefManager->setRewardModel(); // TODO: get actual name
                }
                
                bsmap_type beliefStateMap;
@ -391,9 +391,7 @@ namespace storm {

                statistics.overApproximationBuildTime.start();
                // Initial belief always has belief ID 0
-                auto initialBeliefId = beliefGrid.getInitialBelief();
-                auto const& initialBelief = beliefGrid.getGridPoint(initialBeliefId);
-                auto initialObservation = beliefGrid.getBeliefObservation(initialBelief);
+                auto initialObservation = beliefManager->getBeliefObservation(beliefManager->getInitialBelief());
                // These are the components to build the MDP from the grid
                // Reserve states 0 and 1 as always sink/goal states
                storm::storage::SparseMatrixBuilder<ValueType> mdpTransitionsBuilder(0, 0, 0, true, true);
@ -419,14 +417,14 @@ namespace storm {
                std::map<uint64_t, ValueType> weightedSumUnderMap;

                // for the initial belief, add the triangulated initial states
-                auto triangulation = beliefGrid.triangulateBelief(initialBelief, observationResolutionVector[initialObservation]);
+                auto triangulation = beliefManager->triangulateBelief(beliefManager->getInitialBelief(), observationResolutionVector[initialObservation]);
                uint64_t initialMdpState = nextMdpStateId;
                ++nextMdpStateId;
                if (triangulation.size() == 1) {
                    // The initial belief is on the grid itself
                    auto initBeliefId = triangulation.gridPoints.front();
                    if (boundMapsSet) {
-                        auto const& gridPoint = beliefGrid.getGridPoint(initBeliefId);
+                        auto const& gridPoint = beliefManager->getBelief(initBeliefId);
                        weightedSumOverMap[initBeliefId] = getWeightedSum<ValueType>(gridPoint, overMap);
                        weightedSumUnderMap[initBeliefId] = getWeightedSum<ValueType>(gridPoint, underMap);
                    }
@ -443,7 +441,7 @@ namespace storm {
                        beliefStateMap.insert(bsmap_type::value_type(triangulation.gridPoints[i], nextMdpStateId));
                        ++nextMdpStateId;
                        if (boundMapsSet) {
-                            auto const& gridPoint = beliefGrid.getGridPoint(triangulation.gridPoints[i]);
+                            auto const& gridPoint = beliefManager->getBelief(triangulation.gridPoints[i]);
                            weightedSumOverMap[triangulation.gridPoints[i]] = getWeightedSum<ValueType>(gridPoint, overMap);
                            weightedSumUnderMap[triangulation.gridPoints[i]] = getWeightedSum<ValueType>(gridPoint, underMap);
                        }
@ -458,7 +456,7 @@ namespace storm {
                if (options.explorationThreshold > storm::utility::zero<ValueType>()) {
                    STORM_PRINT("Exploration threshold: " << options.explorationThreshold << std::endl)
                }
-                storm::storage::BitVector foundBeliefs(beliefGrid.getNumberOfGridPointIds(), false);
+                storm::storage::BitVector foundBeliefs(beliefManager->getNumberOfBeliefIds(), false);
                for (auto const& belId : beliefsToBeExpanded) {
                    foundBeliefs.set(belId, true);
                }
@ -467,7 +465,7 @@ namespace storm {
                    beliefsToBeExpanded.pop_front();
                    
                    uint64_t currMdpState = beliefStateMap.left.at(currId);
-                    uint32_t currObservation = beliefGrid.getBeliefObservation(currId);
+                    uint32_t currObservation = beliefManager->getBeliefObservation(currId);

                    mdpTransitionsBuilder.newRowGroup(mdpMatrixRow);
                    
@ -484,17 +482,17 @@ namespace storm {
                    } else {
                        fullyExpandedStates.grow(nextMdpStateId, false);
                        fullyExpandedStates.set(currMdpState, true);
-                        uint64_t someState = beliefGrid.getGridPoint(currId).begin()->first;
+                        uint64_t someState = beliefManager->getBelief(currId).begin()->first;
                        uint64_t numChoices = pomdp.getNumberOfChoices(someState);

                        for (uint64_t action = 0; action < numChoices; ++action) {
-                            auto successorGridPoints = beliefGrid.expandAndTriangulate(currId, action, observationResolutionVector);
+                            auto successorGridPoints = beliefManager->expandAndTriangulate(currId, action, observationResolutionVector);
                            // Check for newly found grid points
-                            foundBeliefs.grow(beliefGrid.getNumberOfGridPointIds(), false);
+                            foundBeliefs.grow(beliefManager->getNumberOfBeliefIds(), false);
                            for (auto const& successor : successorGridPoints) {
                                auto successorId = successor.first;
-                                auto const& successorBelief = beliefGrid.getGridPoint(successorId);
-                                auto successorObservation = beliefGrid.getBeliefObservation(successorBelief);
+                                auto const& successorBelief = beliefManager->getBelief(successorId);
+                                auto successorObservation = beliefManager->getBeliefObservation(successorBelief);
                                if (!foundBeliefs.get(successorId)) {
                                    foundBeliefs.set(successorId);
                                    beliefsToBeExpanded.push_back(successorId);
@ -548,11 +546,11 @@ namespace storm {
                    storm::models::sparse::StandardRewardModel<ValueType> mdpRewardModel(boost::none, std::vector<ValueType>(mdpMatrixRow, storm::utility::zero<ValueType>()));
                    for (auto const &iter : beliefStateMap.left) {
                        if (fullyExpandedStates.get(iter.second)) {
-                            auto const& currentBelief = beliefGrid.getGridPoint(iter.first);
+                            auto const& currentBelief = beliefManager->getBelief(iter.first);
                            auto representativeState = currentBelief.begin()->first;
                            for (uint64_t action = 0; action < pomdp.getNumberOfChoices(representativeState); ++action) {
                                uint64_t mdpChoice = overApproxMdp->getChoiceIndex(storm::storage::StateActionPair(iter.second, action));
-                                mdpRewardModel.setStateActionReward(mdpChoice, beliefGrid.getBeliefActionReward(currentBelief, action));
+                                mdpRewardModel.setStateActionReward(mdpChoice, beliefManager->getBeliefActionReward(currentBelief, action));
                            }
                        }
                    }
@ -575,16 +573,16 @@ namespace storm {
                STORM_LOG_ASSERT(res, "Result does not exist.");
                res->filter(storm::modelchecker::ExplicitQualitativeCheckResult(storm::storage::BitVector(overApproxMdp->getNumberOfStates(), true)));
                auto overApproxResultMap = res->asExplicitQuantitativeCheckResult<ValueType>().getValueMap();
-                auto overApprox = overApproxResultMap[beliefStateMap.left.at(initialBeliefId)];
+                auto overApprox = overApproxResultMap[initialMdpState];

                STORM_PRINT("Time Overapproximation: " <<  statistics.overApproximationCheckTime << " seconds." << std::endl);
                STORM_PRINT("Over-Approximation Result: " << overApprox << std::endl);
                //auto underApprox = weightedSumUnderMap[initialBelief.id];
-                auto underApproxComponents = computeUnderapproximation(beliefGrid, targetObservations, min, computeRewards, maxUaModelSize);
+                auto underApproxComponents = computeUnderapproximation(beliefManager, targetObservations, min, computeRewards, maxUaModelSize);
                if (storm::utility::resources::isTerminate() && !underApproxComponents) {
                    // TODO: return other components needed for refinement.
                    //return std::make_unique<RefinementComponents<ValueType>>(RefinementComponents<ValueType>{modelPtr, overApprox, 0, overApproxResultMap, {}, beliefList, beliefGrid, beliefIsTarget, beliefStateMap, {}, initialBelief.id});
-                    return std::make_unique<RefinementComponents<ValueType>>(RefinementComponents<ValueType>{modelPtr, overApprox, 0, overApproxResultMap, {}, {}, {}, {}, beliefStateMap, {}, initialBeliefId});
+                    return std::make_unique<RefinementComponents<ValueType>>(RefinementComponents<ValueType>{modelPtr, overApprox, 0, overApproxResultMap, {}, {}, {}, {}, beliefStateMap, {}, beliefManager->getInitialBelief()});
                }
                
                STORM_PRINT("Under-Approximation Result: " << underApproxComponents->underApproxValue << std::endl);
@ -595,7 +593,7 @@ namespace storm {
                                                        underApproxComponents->underApproxBeliefStateMap, initialBelief.id});
                */
                return std::make_unique<RefinementComponents<ValueType>>(RefinementComponents<ValueType>{modelPtr, overApprox, underApproxComponents->underApproxValue, overApproxResultMap,
-                                                                                                         underApproxComponents->underApproxMap, {}, {}, {}, beliefStateMap, underApproxComponents->underApproxBeliefStateMap, initialBeliefId});
+                                                                                                         underApproxComponents->underApproxMap, {}, {}, {}, beliefStateMap, underApproxComponents->underApproxBeliefStateMap, beliefManager->getInitialBelief()});

            }

@ -1075,7 +1073,7 @@ namespace storm {

            template<typename ValueType, typename RewardModelType>
            std::unique_ptr<UnderApproxComponents<ValueType, RewardModelType>>
-            ApproximatePOMDPModelchecker<ValueType, RewardModelType>::computeUnderapproximation(storm::storage::BeliefGrid<storm::models::sparse::Pomdp<ValueType>>& beliefGrid,
+            ApproximatePOMDPModelchecker<ValueType, RewardModelType>::computeUnderapproximation(std::shared_ptr<storm::storage::BeliefManager<storm::models::sparse::Pomdp<ValueType>>> beliefManager,
                                                                                                std::set<uint32_t> const &targetObservations, bool min,
                                                                                                bool computeRewards, uint64_t maxModelSize) {
                // Build the belief MDP until enough states are explored.
@ -1100,13 +1098,12 @@ namespace storm {
                bsmap_type beliefStateMap;
                std::deque<uint64_t> beliefsToBeExpanded;
                
-                auto initialBeliefId = beliefGrid.getInitialBelief();
-                beliefStateMap.insert(bsmap_type::value_type(initialBeliefId, nextMdpStateId));
-                beliefsToBeExpanded.push_back(initialBeliefId);
+                beliefStateMap.insert(bsmap_type::value_type(beliefManager->getInitialBelief(), nextMdpStateId));
+                beliefsToBeExpanded.push_back(beliefManager->getInitialBelief());
                ++nextMdpStateId;

                // Expand the believes
-                storm::storage::BitVector foundBeliefs(beliefGrid.getNumberOfGridPointIds(), false);
+                storm::storage::BitVector foundBeliefs(beliefManager->getNumberOfBeliefIds(), false);
                for (auto const& belId : beliefsToBeExpanded) {
                    foundBeliefs.set(belId, true);
                }
@ -1115,8 +1112,8 @@ namespace storm {
                    beliefsToBeExpanded.pop_front();
                    
                    uint64_t currMdpState = beliefStateMap.left.at(currId);
-                    auto const& currBelief = beliefGrid.getGridPoint(currId);
-                    uint32_t currObservation = beliefGrid.getBeliefObservation(currBelief);
+                    auto const& currBelief = beliefManager->getBelief(currId);
+                    uint32_t currObservation = beliefManager->getBeliefObservation(currBelief);
                    
                    mdpTransitionsBuilder.newRowGroup(mdpMatrixRow);
                    
@ -1147,9 +1144,9 @@ namespace storm {
                        uint64_t someState = currBelief.begin()->first;
                        uint64_t numChoices = pomdp.getNumberOfChoices(someState);
                        for (uint64_t action = 0; action < numChoices; ++action) {
-                            auto successorBeliefs = beliefGrid.expand(currId, action);
+                            auto successorBeliefs = beliefManager->expand(currId, action);
                            // Check for newly found beliefs
-                            foundBeliefs.grow(beliefGrid.getNumberOfGridPointIds(), false);
+                            foundBeliefs.grow(beliefManager->getNumberOfBeliefIds(), false);
                            for (auto const& successor : successorBeliefs) {
                                auto successorId = successor.first;
                                if (!foundBeliefs.get(successorId)) {
@ -1159,7 +1156,7 @@ namespace storm {
                                    ++nextMdpStateId;
                                }
                                auto successorMdpState = beliefStateMap.left.at(successorId);
-                                // This assumes that the successor MDP states are given in ascending order, which is indeed the case because the successorGridPoints are sorted.
+                                // This assumes that the successor MDP states are given in ascending order, which is indeed the case because the successorBeliefs are sorted.
                                mdpTransitionsBuilder.addNextValue(mdpMatrixRow, successorMdpState, successor.second);
                            }
                            ++mdpMatrixRow;
@ -1179,7 +1176,7 @@ namespace storm {
                storm::models::sparse::StateLabeling mdpLabeling(nextMdpStateId);
                mdpLabeling.addLabel("init");
                mdpLabeling.addLabel("target");
-                mdpLabeling.addLabelToState("init", beliefStateMap.left.at(initialBeliefId));
+                mdpLabeling.addLabelToState("init", beliefStateMap.left.at(beliefManager->getInitialBelief()));
                for (auto targetState : targetStates) {
                    mdpLabeling.addLabelToState("target", targetState);
                }
@ -1190,11 +1187,11 @@ namespace storm {
                    storm::models::sparse::StandardRewardModel<ValueType> mdpRewardModel(boost::none, std::vector<ValueType>(mdpMatrixRow, storm::utility::zero<ValueType>()));
                    for (auto const &iter : beliefStateMap.left) {
                        if (fullyExpandedStates.get(iter.second)) {
-                            auto const& currentBelief = beliefGrid.getGridPoint(iter.first);
+                            auto const& currentBelief = beliefManager->getBelief(iter.first);
                            auto representativeState = currentBelief.begin()->first;
                            for (uint64_t action = 0; action < pomdp.getNumberOfChoices(representativeState); ++action) {
                                uint64_t mdpChoice = model->getChoiceIndex(storm::storage::StateActionPair(iter.second, action));
-                                mdpRewardModel.setStateActionReward(mdpChoice, beliefGrid.getBeliefActionReward(currentBelief, action));
+                                mdpRewardModel.setStateActionReward(mdpChoice, beliefManager->getBeliefActionReward(currentBelief, action));
                            }
                        }
                    }
@ -1207,8 +1204,8 @@ namespace storm {

                auto property = createStandardProperty(min, computeRewards);
                auto task = createStandardCheckTask(property, std::vector<ValueType>());
-                statistics.underApproximationCheckTime.start();
                
+                statistics.underApproximationCheckTime.start();
                std::unique_ptr<storm::modelchecker::CheckResult> res(storm::api::verifyWithSparseEngine<ValueType>(model, task));
                statistics.underApproximationCheckTime.stop();
                if (storm::utility::resources::isTerminate() && !res) {
@ -1217,7 +1214,7 @@ namespace storm {
                STORM_LOG_ASSERT(res, "Result does not exist.");
                res->filter(storm::modelchecker::ExplicitQualitativeCheckResult(storm::storage::BitVector(model->getNumberOfStates(), true)));
                auto underApproxResultMap = res->asExplicitQuantitativeCheckResult<ValueType>().getValueMap();
-                auto underApprox = underApproxResultMap[beliefStateMap.left.at(initialBeliefId)];
+                auto underApprox = underApproxResultMap[beliefStateMap.left.at(beliefManager->getInitialBelief())];

                return std::make_unique<UnderApproxComponents<ValueType>>(UnderApproxComponents<ValueType>{underApprox, underApproxResultMap, beliefStateMap});
            }
--- a/src/storm-pomdp/modelchecker/ApproximatePOMDPModelchecker.h
+++ b/src/storm-pomdp/modelchecker/ApproximatePOMDPModelchecker.h
@ -3,7 +3,7 @@
 #include "storm/models/sparse/Pomdp.h"
 #include "storm/utility/logging.h"
 #include "storm-pomdp/storage/Belief.h"
-#include "storm-pomdp/storage/BeliefGrid.h"
+#include "storm-pomdp/storage/BeliefManager.h"
 #include <boost/bimap.hpp>

 #include "storm/storage/jani/Property.h"
@ -163,7 +163,7 @@ namespace storm {
                                                                                                             std::set<uint32_t> const &targetObservations,
                                                                                                             uint64_t initialBeliefId, bool min, bool computeReward,
                                                                                                             uint64_t maxModelSize);
-                std::unique_ptr<UnderApproxComponents<ValueType, RewardModelType>> computeUnderapproximation(storm::storage::BeliefGrid<storm::models::sparse::Pomdp<ValueType>>& beliefGrid,
+                std::unique_ptr<UnderApproxComponents<ValueType, RewardModelType>> computeUnderapproximation(std::shared_ptr<storm::storage::BeliefManager<storm::models::sparse::Pomdp<ValueType>>> beliefManager,
                                                                                                             std::set<uint32_t> const &targetObservations, bool min, bool computeReward,
                                                                                                             uint64_t maxModelSize);

--- a/src/storm-pomdp/storage/BeliefManager.h
+++ b/src/storm-pomdp/storage/BeliefManager.h
@ -11,8 +11,7 @@ namespace storm {
    namespace storage {
        
        template <typename PomdpType, typename BeliefValueType = typename PomdpType::ValueType, typename StateType = uint64_t>
-        // TODO: Change name. This actually does not only manage grid points.
-        class BeliefGrid {
+        class BeliefManager {
        public:
            
            typedef typename PomdpType::ValueType ValueType;
@ -20,8 +19,8 @@ namespace storm {
            typedef std::map<StateType, BeliefValueType> BeliefType;
            typedef uint64_t BeliefId;
            
-            BeliefGrid(PomdpType const& pomdp, BeliefValueType const& precision) : pomdp(pomdp), cc(precision, false) {
-                // Intentionally left empty
+            BeliefManager(PomdpType const& pomdp, BeliefValueType const& precision) : pomdp(pomdp), cc(precision, false) {
+                initialBeliefId = computeInitialBelief();
            }
            
            void setRewardModel(boost::optional<std::string> rewardModelName = boost::none) {
@ -45,13 +44,13 @@ namespace storm {
                }
            };
            
-            BeliefType const& getGridPoint(BeliefId const& id) const {
-                return gridPoints[id];
+            BeliefType const& getBelief(BeliefId const& id) const {
+                return beliefs[id];
            }
            
-            BeliefId getIdOfGridPoint(BeliefType const& gridPoint) const {
-                auto idIt = gridPointToIdMap.find(gridPoint);
-                STORM_LOG_THROW(idIt != gridPointToIdMap.end(), storm::exceptions::UnexpectedException, "Unknown grid state.");
+            BeliefId getId(BeliefType const& belief) const {
+                auto idIt = beliefToIdMap.find(belief);
+                STORM_LOG_THROW(idIt != beliefToIdMap.end(), storm::exceptions::UnexpectedException, "Unknown Belief.");
                return idIt->second;
            }
            
@ -75,7 +74,7 @@ namespace storm {
                std::stringstream str;
                str << "(\n";
                for (uint64_t i = 0; i < t.size(); ++i) {
-                    str << "\t" << t.weights[i] << " * \t" << toString(getGridPoint(t.gridPoints[i])) << "\n";
+                    str << "\t" << t.weights[i] << " * \t" << toString(getBelief(t.gridPoints[i])) << "\n";
                }
                str <<")\n";
                return str.str();
@ -161,7 +160,7 @@ namespace storm {
                        STORM_LOG_ERROR("Weight greater than one in triangulation.");
                    }
                    weightSum += triangulation.weights[i];
-                    BeliefType const& gridPoint = getGridPoint(triangulation.gridPoints[i]);
+                    BeliefType const& gridPoint = getBelief(triangulation.gridPoints[i]);
                    for (auto const& pointEntry : gridPoint) {
                        BeliefValueType& triangulatedValue = triangulatedBelief.emplace(pointEntry.first, storm::utility::zero<ValueType>()).first->second;
                        triangulatedValue += triangulation.weights[i] * pointEntry.second;
@ -181,16 +180,8 @@ namespace storm {
                return true;
            }
            
-            BeliefId getInitialBelief() {
-                STORM_LOG_ASSERT(pomdp.getInitialStates().getNumberOfSetBits() < 2,
-                                 "POMDP contains more than one initial state");
-                STORM_LOG_ASSERT(pomdp.getInitialStates().getNumberOfSetBits() == 1,
-                                 "POMDP does not contain an initial state");
-                BeliefType belief;
-                belief[*pomdp.getInitialStates().begin()] = storm::utility::one<ValueType>();
-                
-                STORM_LOG_ASSERT(assertBelief(belief), "Invalid initial belief.");
-                return getOrAddGridPointId(belief);
+            BeliefId const& getInitialBelief() const {
+                return initialBeliefId;
            }
            
            ValueType getBeliefActionReward(BeliefType const& belief, uint64_t const& localActionIndex) const {
@ -212,10 +203,10 @@ namespace storm {
            }
            
            uint32_t getBeliefObservation(BeliefId beliefId) {
-                return getBeliefObservation(getGridPoint(beliefId));
+                return getBeliefObservation(getBelief(beliefId));
            }
            
-            
+
            Triangulation triangulateBelief(BeliefType belief, uint64_t resolution) {
                //TODO this can also be simplified using the sparse vector interpretation
                //TODO Enable chaching for this method?
@ -286,7 +277,7 @@ namespace storm {
                        if (!cc.isZero(qsj[nrStates - 1])) {
                            gridPoint[nrStates - 1] = qsj[nrStates - 1] / convResolution;
                        }
-                        result.gridPoints.push_back(getOrAddGridPointId(gridPoint));
+                        result.gridPoints.push_back(getOrAddBeliefId(gridPoint));
                    }
                }
                
@ -294,6 +285,10 @@ namespace storm {
                return result;
            }
            
+            Triangulation triangulateBelief(BeliefId beliefId, uint64_t resolution) {
+                return triangulateBelief(getBelief(beliefId), resolution);
+            }
+            
            template<typename DistributionType>
            void addToDistribution(DistributionType& distr, StateType const& state, BeliefValueType const& value) {
                auto insertionRes = distr.emplace(state, value);
@ -302,19 +297,19 @@ namespace storm {
                }
            }
            
-            BeliefId getNumberOfGridPointIds() const {
-                return gridPoints.size();
+            BeliefId getNumberOfBeliefIds() const {
+                return beliefs.size();
            }
            
-            std::map<BeliefId, ValueType> expandInternal(BeliefId const& gridPointId, uint64_t actionIndex, boost::optional<std::vector<uint64_t>> const& observationTriangulationResolutions = boost::none) {
+            std::map<BeliefId, ValueType> expandInternal(BeliefId const& beliefId, uint64_t actionIndex, boost::optional<std::vector<uint64_t>> const& observationTriangulationResolutions = boost::none) {
                std::map<BeliefId, ValueType> destinations; // The belief ids should be ordered
                // TODO: Does this make sense? It could be better to order them afterwards because now we rely on the fact that MDP states have the same order than their associated BeliefIds
                
-                BeliefType gridPoint = getGridPoint(gridPointId);
+                BeliefType belief = getBelief(beliefId);
                
                // Find the probability we go to each observation
                BeliefType successorObs; // This is actually not a belief but has the same type
-                for (auto const& pointEntry : gridPoint) {
+                for (auto const& pointEntry : belief) {
                    uint64_t state = pointEntry.first;
                    for (auto const& pomdpTransition : pomdp.getTransitionMatrix().getRow(state, actionIndex)) {
                        if (!storm::utility::isZero(pomdpTransition.getValue())) {
@ -327,7 +322,7 @@ namespace storm {
                // Now for each successor observation we find and potentially triangulate the successor belief
                for (auto const& successor : successorObs) {
                    BeliefType successorBelief;
-                    for (auto const& pointEntry : gridPoint) {
+                    for (auto const& pointEntry : belief) {
                        uint64_t state = pointEntry.first;
                        for (auto const& pomdpTransition : pomdp.getTransitionMatrix().getRow(state, actionIndex)) {
                            if (pomdp.getObservation(pomdpTransition.getColumn()) == successor.first) {
@ -344,7 +339,7 @@ namespace storm {
                            addToDistribution(destinations, triangulation.gridPoints[j], triangulation.weights[j] * successor.second);
                        }
                    } else {
-                        addToDistribution(destinations, getOrAddGridPointId(successorBelief), successor.second);
+                        addToDistribution(destinations, getOrAddBeliefId(successorBelief), successor.second);
                    }
                }
    
@ -352,21 +347,33 @@ namespace storm {
                
            }
            
-            std::map<BeliefId, ValueType> expandAndTriangulate(BeliefId const& gridPointId, uint64_t actionIndex, std::vector<uint64_t> const& observationResolutions) {
-                return expandInternal(gridPointId, actionIndex, observationResolutions);
+            std::map<BeliefId, ValueType> expandAndTriangulate(BeliefId const& beliefId, uint64_t actionIndex, std::vector<uint64_t> const& observationResolutions) {
+                return expandInternal(beliefId, actionIndex, observationResolutions);
            }
            
-            std::map<BeliefId, ValueType> expand(BeliefId const& gridPointId, uint64_t actionIndex) {
-                return expandInternal(gridPointId, actionIndex);
+            std::map<BeliefId, ValueType> expand(BeliefId const& beliefId, uint64_t actionIndex) {
+                return expandInternal(beliefId, actionIndex);
            }
            
        private:
            
-            BeliefId getOrAddGridPointId(BeliefType const& gridPoint) {
-                auto insertioRes = gridPointToIdMap.emplace(gridPoint, gridPoints.size());
+            BeliefId computeInitialBelief() {
+                STORM_LOG_ASSERT(pomdp.getInitialStates().getNumberOfSetBits() < 2,
+                                 "POMDP contains more than one initial state");
+                STORM_LOG_ASSERT(pomdp.getInitialStates().getNumberOfSetBits() == 1,
+                                 "POMDP does not contain an initial state");
+                BeliefType belief;
+                belief[*pomdp.getInitialStates().begin()] = storm::utility::one<ValueType>();
+                
+                STORM_LOG_ASSERT(assertBelief(belief), "Invalid initial belief.");
+                return getOrAddBeliefId(belief);
+            }
+            
+            BeliefId getOrAddBeliefId(BeliefType const& belief) {
+                auto insertioRes = beliefToIdMap.emplace(belief, beliefs.size());
                if (insertioRes.second) {
-                    // There actually was an insertion, so add the new grid state
-                    gridPoints.push_back(gridPoint);
+                    // There actually was an insertion, so add the new belief
+                    beliefs.push_back(belief);
                }
                // Return the id
                return insertioRes.first->second;
@ -375,8 +382,10 @@ namespace storm {
            PomdpType const& pomdp;
            std::vector<ValueType> pomdpActionRewardVector;
            
-            std::vector<BeliefType> gridPoints;
-            std::map<BeliefType, BeliefId> gridPointToIdMap;
+            std::vector<BeliefType> beliefs;
+            std::map<BeliefType, BeliefId> beliefToIdMap;
+            BeliefId initialBeliefId;
+            
            storm::utility::ConstantsComparator<ValueType> cc;