@ -359,23 +359,16 @@ namespace storm {
underMap = underApproximationMap . value ( ) ;
underMap = underApproximationMap . value ( ) ;
}
}
storm : : storage : : BeliefGrid < storm : : models : : sparse : : Pomdp < ValueType > , ValueType > newBeliefGrid ( pomdp , options . numericPrecision ) ;
//Use caching to avoid multiple computation of the subsimplices and lambdas
std : : map < uint64_t , std : : vector < std : : map < uint64_t , ValueType > > > subSimplexCache ;
std : : map < uint64_t , std : : vector < ValueType > > lambdaCache ;
storm : : storage : : BeliefGrid < storm : : models : : sparse : : Pomdp < ValueType > > beliefGrid ( pomdp , options . numericPrecision ) ;
bsmap_type beliefStateMap ;
bsmap_type beliefStateMap ;
std : : deque < uint64_t > beliefsToBeExpanded ;
std : : deque < uint64_t > beliefsToBeExpanded ;
storm : : storage : : BitVector foundBeliefs ;
// current ID -> action -> reward
std : : map < uint64_t , std : : vector < ValueType > > beliefActionRewards ;
uint64_t nextId = 0 ;
statistics . overApproximationBuildTime . start ( ) ;
statistics . overApproximationBuildTime . start ( ) ;
// Initial belief always has belief ID 0
// Initial belief always has belief ID 0
storm : : pomdp : : Belief < ValueType > initialBelief = getInitialBelief ( nextId ) ;
+ + nextId ;
auto initialBeliefId = beliefGrid . getInitialBelief ( ) ;
auto const & initialBelief = beliefGrid . getGridPoint ( initialBeliefId ) ;
auto initialObservation = beliefGrid . getBeliefObservation ( initialBelief ) ;
// These are the components to build the MDP from the grid
// These are the components to build the MDP from the grid
// Reserve states 0 and 1 as always sink/goal states
// Reserve states 0 and 1 as always sink/goal states
storm : : storage : : SparseMatrixBuilder < ValueType > mdpTransitionsBuilder ( 0 , 0 , 0 , true , true ) ;
storm : : storage : : SparseMatrixBuilder < ValueType > mdpTransitionsBuilder ( 0 , 0 , 0 , true , true ) ;
@ -400,25 +393,20 @@ namespace storm {
std : : map < uint64_t , ValueType > weightedSumUnderMap ;
std : : map < uint64_t , ValueType > weightedSumUnderMap ;
// for the initial belief, add the triangulated initial states
// for the initial belief, add the triangulated initial states
auto triangulation = newBeliefGrid . triangulateBelief ( initialBelief . probabilities , observationResolutionVector [ initialBelief . observation ] ) ;
if ( options . cacheSubsimplices ) {
//subSimplexCache[0] = initSubSimplex;
//lambdaCache[0] = initLambdas;
}
std : : vector < std : : map < uint64_t , ValueType > > initTransitionsInBelief ;
auto triangulation = beliefGrid . triangulateBelief ( initialBelief , observationResolutionVector [ initialObservation ] ) ;
uint64_t initialMdpState = nextMdpStateId ;
uint64_t initialMdpState = nextMdpStateId ;
+ + nextMdpStateId ;
+ + nextMdpStateId ;
if ( triangulation . size ( ) = = 1 ) {
if ( triangulation . size ( ) = = 1 ) {
// The initial belief is on the grid itself
// The initial belief is on the grid itself
auto initBeliefId = triangulation . gridPoints . front ( ) ;
auto initBeliefId = triangulation . gridPoints . front ( ) ;
if ( boundMapsSet ) {
if ( boundMapsSet ) {
auto const & gridPoint = newB eliefGrid. getGridPoint ( initBeliefId ) ;
auto const & gridPoint = b eliefGrid. getGridPoint ( initBeliefId ) ;
weightedSumOverMap [ initBeliefId ] = getWeightedSum < ValueType > ( gridPoint , overMap ) ;
weightedSumOverMap [ initBeliefId ] = getWeightedSum < ValueType > ( gridPoint , overMap ) ;
weightedSumUnderMap [ initBeliefId ] = getWeightedSum < ValueType > ( gridPoint , underMap ) ;
weightedSumUnderMap [ initBeliefId ] = getWeightedSum < ValueType > ( gridPoint , underMap ) ;
}
}
beliefsToBeExpanded . push_back ( initBeliefId ) ;
beliefsToBeExpanded . push_back ( initBeliefId ) ;
beliefStateMap . insert ( bsmap_type : : value_type ( triangulation . gridPoints . front ( ) , initialMdpState ) ) ;
beliefStateMap . insert ( bsmap_type : : value_type ( triangulation . gridPoints . front ( ) , initialMdpState ) ) ;
hintVector . push_back ( targetObservations . find ( initialBelief . o bservation ) ! = targetObservations . end ( ) ? storm : : utility : : one < ValueType > ( )
hintVector . push_back ( targetObservations . find ( initialO bservation ) ! = targetObservations . end ( ) ? storm : : utility : : one < ValueType > ( )
: storm : : utility : : zero < ValueType > ( ) ) ;
: storm : : utility : : zero < ValueType > ( ) ) ;
} else {
} else {
// If the initial belief is not on the grid, we add the transitions from our initial MDP state to the triangulated beliefs
// If the initial belief is not on the grid, we add the transitions from our initial MDP state to the triangulated beliefs
@ -429,11 +417,11 @@ namespace storm {
beliefStateMap . insert ( bsmap_type : : value_type ( triangulation . gridPoints [ i ] , nextMdpStateId ) ) ;
beliefStateMap . insert ( bsmap_type : : value_type ( triangulation . gridPoints [ i ] , nextMdpStateId ) ) ;
+ + nextMdpStateId ;
+ + nextMdpStateId ;
if ( boundMapsSet ) {
if ( boundMapsSet ) {
auto const & gridPoint = newB eliefGrid. getGridPoint ( triangulation . gridPoints [ i ] ) ;
auto const & gridPoint = b eliefGrid. getGridPoint ( triangulation . gridPoints [ i ] ) ;
weightedSumOverMap [ triangulation . gridPoints [ i ] ] = getWeightedSum < ValueType > ( gridPoint , overMap ) ;
weightedSumOverMap [ triangulation . gridPoints [ i ] ] = getWeightedSum < ValueType > ( gridPoint , overMap ) ;
weightedSumUnderMap [ triangulation . gridPoints [ i ] ] = getWeightedSum < ValueType > ( gridPoint , underMap ) ;
weightedSumUnderMap [ triangulation . gridPoints [ i ] ] = getWeightedSum < ValueType > ( gridPoint , underMap ) ;
}
}
hintVector . push_back ( targetObservations . find ( initialBelief . o bservation ) ! = targetObservations . end ( ) ? storm : : utility : : one < ValueType > ( )
hintVector . push_back ( targetObservations . find ( initialO bservation ) ! = targetObservations . end ( ) ? storm : : utility : : one < ValueType > ( )
: storm : : utility : : zero < ValueType > ( ) ) ;
: storm : : utility : : zero < ValueType > ( ) ) ;
}
}
//beliefsToBeExpanded.push_back(initialBelief.id); I'm curious what happens if we do this instead of first triangulating. Should do nothing special if belief is on grid, otherwise it gets interesting
//beliefsToBeExpanded.push_back(initialBelief.id); I'm curious what happens if we do this instead of first triangulating. Should do nothing special if belief is on grid, otherwise it gets interesting
@ -444,7 +432,7 @@ namespace storm {
if ( options . explorationThreshold > storm : : utility : : zero < ValueType > ( ) ) {
if ( options . explorationThreshold > storm : : utility : : zero < ValueType > ( ) ) {
STORM_PRINT ( " Exploration threshold: " < < options . explorationThreshold < < std : : endl )
STORM_PRINT ( " Exploration threshold: " < < options . explorationThreshold < < std : : endl )
}
}
foundBeliefs . grow ( newB eliefGrid. getNumberOfGridPointIds ( ) , false ) ;
storm : : storage : : BitVector foundBeliefs ( b eliefGrid. getNumberOfGridPointIds ( ) , false ) ;
for ( auto const & belId : beliefsToBeExpanded ) {
for ( auto const & belId : beliefsToBeExpanded ) {
foundBeliefs . set ( belId , true ) ;
foundBeliefs . set ( belId , true ) ;
}
}
@ -453,8 +441,8 @@ namespace storm {
beliefsToBeExpanded . pop_front ( ) ;
beliefsToBeExpanded . pop_front ( ) ;
uint64_t currMdpState = beliefStateMap . left . at ( currId ) ;
uint64_t currMdpState = beliefStateMap . left . at ( currId ) ;
auto const & currBelief = newB eliefGrid. getGridPoint ( currId ) ;
uint32_t currObservation = pomdp . getObservation ( currBelief . begin ( ) - > first ) ;
auto const & currBelief = b eliefGrid. getGridPoint ( currId ) ;
uint32_t currObservation = beliefGrid . getBelief Observation ( currBelief ) ;
mdpTransitionsBuilder . newRowGroup ( mdpMatrixRow ) ;
mdpTransitionsBuilder . newRowGroup ( mdpMatrixRow ) ;
@ -469,20 +457,18 @@ namespace storm {
mdpTransitionsBuilder . addNextValue ( mdpMatrixRow , extraBottomState , storm : : utility : : one < ValueType > ( ) - weightedSumOverMap [ currId ] ) ;
mdpTransitionsBuilder . addNextValue ( mdpMatrixRow , extraBottomState , storm : : utility : : one < ValueType > ( ) - weightedSumOverMap [ currId ] ) ;
+ + mdpMatrixRow ;
+ + mdpMatrixRow ;
} else {
} else {
auto const & currBelief = newB eliefGrid. getGridPoint ( currId ) ;
auto const & currBelief = b eliefGrid. getGridPoint ( currId ) ;
uint64_t someState = currBelief . begin ( ) - > first ;
uint64_t someState = currBelief . begin ( ) - > first ;
uint64_t numChoices = pomdp . getNumberOfChoices ( someState ) ;
uint64_t numChoices = pomdp . getNumberOfChoices ( someState ) ;
std : : vector < ValueType > actionRewardsInState ( numChoices ) ;
std : : vector < std : : map < uint64_t , ValueType > > transitionsInBelief ;
for ( uint64_t action = 0 ; action < numChoices ; + + action ) {
for ( uint64_t action = 0 ; action < numChoices ; + + action ) {
auto successorGridPoints = beliefGrid . expandAndTriangulate ( currId , action , observationResolutionVector ) ;
auto successorGridPoints = beliefGrid . expandAndTriangulate ( currId , action , observationResolutionVector ) ;
// Check for newly found grid points
// Check for newly found grid points
foundBeliefs . grow ( newB eliefGrid. getNumberOfGridPointIds ( ) , false ) ;
foundBeliefs . grow ( b eliefGrid. getNumberOfGridPointIds ( ) , false ) ;
for ( auto const & successor : successorGridPoints ) {
for ( auto const & successor : successorGridPoints ) {
auto successorId = successor . first ;
auto successorId = successor . first ;
auto successorBelief = newB eliefGrid. getGridPoint ( successorId ) ;
auto successorObservation = pomdp . getObservation ( successorBelief . begin ( ) - > first ) ;
auto const & successorBelief = b eliefGrid. getGridPoint ( successorId ) ;
auto successorObservation = beliefGrid . getBelief Observation ( successorBelief ) ;
if ( ! foundBeliefs . get ( successorId ) ) {
if ( ! foundBeliefs . get ( successorId ) ) {
foundBeliefs . set ( successorId ) ;
foundBeliefs . set ( successorId ) ;
beliefsToBeExpanded . push_back ( successorId ) ;
beliefsToBeExpanded . push_back ( successorId ) ;
@ -525,21 +511,16 @@ namespace storm {
storm : : models : : sparse : : StateLabeling mdpLabeling ( nextMdpStateId ) ;
storm : : models : : sparse : : StateLabeling mdpLabeling ( nextMdpStateId ) ;
mdpLabeling . addLabel ( " init " ) ;
mdpLabeling . addLabel ( " init " ) ;
mdpLabeling . addLabel ( " target " ) ;
mdpLabeling . addLabel ( " target " ) ;
mdpLabeling . addLabelToState ( " init " , beliefStateMap . left . at ( initialMdpState ) ) ;
mdpLabeling . addLabelToState ( " init " , initialMdpState ) ;
for ( auto targetState : targetStates ) {
for ( auto targetState : targetStates ) {
mdpLabeling . addLabelToState ( " target " , targetState ) ;
mdpLabeling . addLabelToState ( " target " , targetState ) ;
}
}
storm : : storage : : sparse : : ModelComponents < ValueType , RewardModelType > modelComponents ( mdpTransitionsBuilder . build ( mdpMatrixRow , nextMdpStateId , nextMdpStateId ) , std : : move ( mdpLabeling ) ) ;
storm : : storage : : sparse : : ModelComponents < ValueType , RewardModelType > modelComponents ( mdpTransitionsBuilder . build ( mdpMatrixRow , nextMdpStateId , nextMdpStateId ) , std : : move ( mdpLabeling ) ) ;
for ( uint64_t row = 0 ; row < modelComponents . transitionMatrix . getRowCount ( ) ; + + row ) {
if ( ! storm : : utility : : isOne ( modelComponents . transitionMatrix . getRowSum ( row ) ) ) {
std : : cout < < " Row " < < row < < " does not sum up to one. " < < modelComponents . transitionMatrix . getRowSum ( row ) < < " instead " < < std : : endl ;
}
}
auto overApproxMdp = std : : make_shared < storm : : models : : sparse : : Mdp < ValueType , RewardModelType > > ( std : : move ( modelComponents ) ) ;
auto overApproxMdp = std : : make_shared < storm : : models : : sparse : : Mdp < ValueType , RewardModelType > > ( std : : move ( modelComponents ) ) ;
if ( computeRewards ) {
if ( computeRewards ) {
storm : : models : : sparse : : StandardRewardModel < ValueType > mdpRewardModel ( boost : : none , std : : vector < ValueType > ( mdpMatrixRow ) ) ;
storm : : models : : sparse : : StandardRewardModel < ValueType > mdpRewardModel ( boost : : none , std : : vector < ValueType > ( mdpMatrixRow ) ) ;
for ( auto const & iter : beliefStateMap . left ) {
for ( auto const & iter : beliefStateMap . left ) {
auto currentBelief = newB eliefGrid. getGridPoint ( iter . first ) ;
auto currentBelief = beliefGrid . getGridPoint ( iter . first ) ;
auto representativeState = currentBelief . begin ( ) - > first ;
auto representativeState = currentBelief . begin ( ) - > first ;
for ( uint64_t action = 0 ; action < overApproxMdp - > getNumberOfChoices ( representativeState ) ; + + action ) {
for ( uint64_t action = 0 ; action < overApproxMdp - > getNumberOfChoices ( representativeState ) ; + + action ) {
// Add the reward
// Add the reward
@ -575,25 +556,27 @@ namespace storm {
STORM_LOG_ASSERT ( res , " Result does not exist. " ) ;
STORM_LOG_ASSERT ( res , " Result does not exist. " ) ;
res - > filter ( storm : : modelchecker : : ExplicitQualitativeCheckResult ( storm : : storage : : BitVector ( overApproxMdp - > getNumberOfStates ( ) , true ) ) ) ;
res - > filter ( storm : : modelchecker : : ExplicitQualitativeCheckResult ( storm : : storage : : BitVector ( overApproxMdp - > getNumberOfStates ( ) , true ) ) ) ;
auto overApproxResultMap = res - > asExplicitQuantitativeCheckResult < ValueType > ( ) . getValueMap ( ) ;
auto overApproxResultMap = res - > asExplicitQuantitativeCheckResult < ValueType > ( ) . getValueMap ( ) ;
auto overApprox = overApproxResultMap [ beliefStateMap . left . at ( initialBelief . i d) ] ;
auto overApprox = overApproxResultMap [ beliefStateMap . left . at ( initialBeliefI d ) ] ;
STORM_PRINT ( " Time Overapproximation: " < < statistics . overApproximationCheckTime < < " seconds. " < < std : : endl ) ;
STORM_PRINT ( " Time Overapproximation: " < < statistics . overApproximationCheckTime < < " seconds. " < < std : : endl ) ;
STORM_PRINT ( " Over-Approximation Result: " < < overApprox < < std : : endl ) ;
STORM_PRINT ( " Over-Approximation Result: " < < overApprox < < std : : endl ) ;
//auto underApprox = weightedSumUnderMap[initialBelief.id];
//auto underApprox = weightedSumUnderMap[initialBelief.id];
/* TODO: Enable under approx again:
auto underApproxComponents = computeUnderapproximation ( beliefList , beliefIsTarget , targetObservations , initialBelief . id , min , computeRewards , maxUaModelSize ) ;
auto underApproxComponents = computeUnderapproximation ( beliefGrid , targetObservations , min , computeRewards , maxUaModelSize ) ;
if ( storm : : utility : : resources : : isTerminate ( ) & & ! underApproxComponents ) {
if ( storm : : utility : : resources : : isTerminate ( ) & & ! underApproxComponents ) {
return std : : make_unique < RefinementComponents < ValueType > > (
RefinementComponents < ValueType > { modelPtr , overApprox , 0 , overApproxResultMap , { } , beliefList , beliefGrid , beliefIsTarget , beliefStateMap , { } , initialBelief . id } ) ;
// TODO: return other components needed for refinement.
//return std::make_unique<RefinementComponents<ValueType>>(RefinementComponents<ValueType>{modelPtr, overApprox, 0, overApproxResultMap, {}, beliefList, beliefGrid, beliefIsTarget, beliefStateMap, {}, initialBelief.id});
return std : : make_unique < RefinementComponents < ValueType > > ( RefinementComponents < ValueType > { modelPtr , overApprox , 0 , overApproxResultMap , { } , { } , { } , { } , beliefStateMap , { } , initialBeliefId } ) ;
}
}
STORM_PRINT ( " Under-Approximation Result: " < < underApproxComponents - > underApproxValue < < std : : endl ) ;
STORM_PRINT ( " Under-Approximation Result: " < < underApproxComponents - > underApproxValue < < std : : endl ) ;
/* TODO: return other components needed for refinement.
return std : : make_unique < RefinementComponents < ValueType > > (
return std : : make_unique < RefinementComponents < ValueType > > (
RefinementComponents < ValueType > { modelPtr , overApprox , underApproxComponents - > underApproxValue , overApproxResultMap ,
RefinementComponents < ValueType > { modelPtr , overApprox , underApproxComponents - > underApproxValue , overApproxResultMap ,
underApproxComponents - > underApproxMap , beliefList , beliefGrid , beliefIsTarget , beliefStateMap ,
underApproxComponents - > underApproxMap , beliefList , beliefGrid , beliefIsTarget , beliefStateMap ,
underApproxComponents - > underApproxBeliefStateMap , initialBelief . id } ) ;
underApproxComponents - > underApproxBeliefStateMap , initialBelief . id } ) ;
*/
*/
return std : : make_unique < RefinementComponents < ValueType > > ( RefinementComponents < ValueType > { modelPtr , overApprox , storm : : utility : : zero < ValueType > ( ) , overApproxResultMap ,
{ } , { } , { } , { } , beliefStateMap , { } , initialBelief . i d} ) ;
return std : : make_unique < RefinementComponents < ValueType > > ( RefinementComponents < ValueType > { modelPtr , overApprox , underApproxComponents - > underApproxValue , overApproxResultMap ,
underApproxComponents - > underApproxMap , { } , { } , { } , beliefStateMap , underApproxComponents - > underApproxBeliefStateMap , initialBeliefI d} ) ;
}
}
@ -949,7 +932,7 @@ namespace storm {
uint64_t initialBeliefId , bool min ,
uint64_t initialBeliefId , bool min ,
bool computeRewards , uint64_t maxModelSize ) {
bool computeRewards , uint64_t maxModelSize ) {
std : : set < uint64_t > visitedBelieves ;
std : : set < uint64_t > visitedBelieves ;
std : : deque < uint64_t > believe sToBeExpanded ;
std : : deque < uint64_t > belief sToBeExpanded ;
bsmap_type beliefStateMap ;
bsmap_type beliefStateMap ;
std : : vector < std : : vector < std : : map < uint64_t , ValueType > > > transitions = { { { { 0 , storm : : utility : : one < ValueType > ( ) } } } ,
std : : vector < std : : vector < std : : map < uint64_t , ValueType > > > transitions = { { { { 0 , storm : : utility : : one < ValueType > ( ) } } } ,
{ { { 1 , storm : : utility : : one < ValueType > ( ) } } } } ;
{ { { 1 , storm : : utility : : one < ValueType > ( ) } } } } ;
@ -964,10 +947,10 @@ namespace storm {
statistics . underApproximationBuildTime . start ( ) ;
statistics . underApproximationBuildTime . start ( ) ;
// Expand the believes
// Expand the believes
visitedBelieves . insert ( initialBeliefId ) ;
visitedBelieves . insert ( initialBeliefId ) ;
believe sToBeExpanded . push_back ( initialBeliefId ) ;
while ( ! believe sToBeExpanded . empty ( ) ) {
belief sToBeExpanded . push_back ( initialBeliefId ) ;
while ( ! belief sToBeExpanded . empty ( ) ) {
//TODO think of other ways to stop exploration besides model size
//TODO think of other ways to stop exploration besides model size
auto currentBeliefId = believe sToBeExpanded . front ( ) ;
auto currentBeliefId = belief sToBeExpanded . front ( ) ;
uint64_t numChoices = pomdp . getNumberOfChoices ( pomdp . getStatesWithObservation ( beliefList [ currentBeliefId ] . observation ) . front ( ) ) ;
uint64_t numChoices = pomdp . getNumberOfChoices ( pomdp . getStatesWithObservation ( beliefList [ currentBeliefId ] . observation ) . front ( ) ) ;
// for targets, we only consider one action with one transition
// for targets, we only consider one action with one transition
if ( beliefIsTarget [ currentBeliefId ] ) {
if ( beliefIsTarget [ currentBeliefId ] ) {
@ -992,7 +975,7 @@ namespace storm {
if ( visitedBelieves . insert ( nextBeliefId ) . second ) {
if ( visitedBelieves . insert ( nextBeliefId ) . second ) {
beliefStateMap . insert ( bsmap_type : : value_type ( nextBeliefId , stateId ) ) ;
beliefStateMap . insert ( bsmap_type : : value_type ( nextBeliefId , stateId ) ) ;
+ + stateId ;
+ + stateId ;
believe sToBeExpanded . push_back ( nextBeliefId ) ;
belief sToBeExpanded . push_back ( nextBeliefId ) ;
+ + counter ;
+ + counter ;
}
}
transitionsInStateWithAction [ beliefStateMap . left . at ( nextBeliefId ) ] = iter - > second ;
transitionsInStateWithAction [ beliefStateMap . left . at ( nextBeliefId ) ] = iter - > second ;
@ -1001,7 +984,7 @@ namespace storm {
}
}
transitions . push_back ( actionTransitionStorage ) ;
transitions . push_back ( actionTransitionStorage ) ;
}
}
believe sToBeExpanded . pop_front ( ) ;
belief sToBeExpanded . pop_front ( ) ;
if ( storm : : utility : : resources : : isTerminate ( ) ) {
if ( storm : : utility : : resources : : isTerminate ( ) ) {
statistics . underApproximationBuildAborted = true ;
statistics . underApproximationBuildAborted = true ;
break ;
break ;