Browse Source

Fixed beliefgrid exploration.

tempestpy_adaptions
Tim Quatmann 5 years ago
parent
commit
97842f356d
  1. 16
      src/storm-pomdp/modelchecker/ApproximatePOMDPModelchecker.cpp

16
src/storm-pomdp/modelchecker/ApproximatePOMDPModelchecker.cpp

@ -367,7 +367,7 @@ namespace storm {
bsmap_type beliefStateMap; bsmap_type beliefStateMap;
std::deque<uint64_t> beliefsToBeExpanded; std::deque<uint64_t> beliefsToBeExpanded;
storm::storage::BitVector expandedBeliefs;
storm::storage::BitVector foundBeliefs;
// current ID -> action -> reward // current ID -> action -> reward
std::map<uint64_t, std::vector<ValueType>> beliefActionRewards; std::map<uint64_t, std::vector<ValueType>> beliefActionRewards;
@ -445,13 +445,14 @@ namespace storm {
if (options.explorationThreshold > storm::utility::zero<ValueType>()) { if (options.explorationThreshold > storm::utility::zero<ValueType>()) {
STORM_PRINT("Exploration threshold: " << options.explorationThreshold << std::endl) STORM_PRINT("Exploration threshold: " << options.explorationThreshold << std::endl)
} }
expandedBeliefs.grow(newBeliefGrid.getNumberOfGridPointIds(), false);
foundBeliefs.grow(newBeliefGrid.getNumberOfGridPointIds(), false);
for (auto const& belId : beliefsToBeExpanded) {
foundBeliefs.set(belId, true);
}
while (!beliefsToBeExpanded.empty()) { while (!beliefsToBeExpanded.empty()) {
uint64_t currId = beliefsToBeExpanded.front(); uint64_t currId = beliefsToBeExpanded.front();
beliefsToBeExpanded.pop_front(); beliefsToBeExpanded.pop_front();
expandedBeliefs.set(currId, true); // Do not expand this belief again.
assert(currId < expandedBeliefs.size());
uint64_t currMdpState = beliefStateMap.left.at(currId); uint64_t currMdpState = beliefStateMap.left.at(currId);
auto const& currBelief = newBeliefGrid.getGridPoint(currId); auto const& currBelief = newBeliefGrid.getGridPoint(currId);
uint32_t currObservation = pomdp.getObservation(currBelief.begin()->first); uint32_t currObservation = pomdp.getObservation(currBelief.begin()->first);
@ -478,12 +479,13 @@ namespace storm {
for (uint64_t action = 0; action < numChoices; ++action) { for (uint64_t action = 0; action < numChoices; ++action) {
auto successorGridPoints = newBeliefGrid.expandAction(currId, action, observationResolutionVector); auto successorGridPoints = newBeliefGrid.expandAction(currId, action, observationResolutionVector);
// Check for newly found grid points // Check for newly found grid points
expandedBeliefs.grow(newBeliefGrid.getNumberOfGridPointIds(), false);
foundBeliefs.grow(newBeliefGrid.getNumberOfGridPointIds(), false);
for (auto const& successor : successorGridPoints) { for (auto const& successor : successorGridPoints) {
auto successorId = successor.first; auto successorId = successor.first;
auto successorBelief = newBeliefGrid.getGridPoint(successorId); auto successorBelief = newBeliefGrid.getGridPoint(successorId);
auto successorObservation = pomdp.getObservation(successorBelief.begin()->first); auto successorObservation = pomdp.getObservation(successorBelief.begin()->first);
if (!expandedBeliefs.get(successorId)) {
if (!foundBeliefs.get(successorId)) {
foundBeliefs.set(successorId);
beliefsToBeExpanded.push_back(successorId); beliefsToBeExpanded.push_back(successorId);
beliefStateMap.insert(bsmap_type::value_type(successorId, nextMdpStateId)); beliefStateMap.insert(bsmap_type::value_type(successorId, nextMdpStateId));
++nextMdpStateId; ++nextMdpStateId;

Loading…
Cancel
Save