fixes

7 years ago · 2be3f553e0
3 changed files with 74 additions and 34 deletions
--- a/src/storm-pomdp/transformer/ApplyFiniteSchedulerToPomdp.cpp
+++ b/src/storm-pomdp/transformer/ApplyFiniteSchedulerToPomdp.cpp
@ -1,5 +1,7 @@
 #include "storm-pomdp/transformer/ApplyFiniteSchedulerToPomdp.h"

+#include "storm/utility/vector.h"
+
 namespace storm {
    namespace transformer {

@ -16,57 +18,89 @@ namespace storm {
            std::shared_ptr<RawPolynomialCache> cache;
        };

-        template<typename ValueType>
-        std::shared_ptr<storm::models::sparse::Model<storm::RationalFunction>> ApplyFiniteSchedulerToPomdp<ValueType>::transform() const {
-            uint64_t nrStates = pomdp.getNumberOfStates();
-            std::unordered_map<uint32_t, std::vector<storm::RationalFunction>> parameters;
-            bool nondeterminism = false;
-            storm::storage::SparseMatrixBuilder<storm::RationalFunction> smb(nrStates, nrStates, 0, !nondeterminism, false, nrStates);

+        template<typename ValueType>
+        std::unordered_map<uint32_t, std::vector<storm::RationalFunction>> ApplyFiniteSchedulerToPomdp<ValueType>::getObservationChoiceWeights() const {
+            std::unordered_map<uint32_t, std::vector<storm::RationalFunction>> res;
             RationalFunctionConstructor ratFuncConstructor;
-
-            for (uint64_t state = 0; state < nrStates; ++state) {
-                if (nondeterminism) {
-                    smb.newRowGroup(state);
-                }
+            // Per observation: one fresh parameter for every choice but the last; the last weight is one minus their sum.
+            for (uint64_t state = 0; state < pomdp.getNumberOfStates(); ++state) {
                 auto observation = pomdp.getObservation(state);
-                auto it = parameters.find(observation);
-                std::vector<storm::RationalFunction> localWeights;
-                if (it == parameters.end()) {
-                    storm::RationalFunction lastWeight(1);
+                auto it = res.find(observation);
+                if (it == res.end()) {
+                    std::vector<storm::RationalFunction> weights;
+                    storm::RationalFunction lastWeight = storm::utility::one<storm::RationalFunction>();
                     for (uint64_t a = 0; a < pomdp.getNumberOfChoices(state) - 1; ++a) {
                         std::string varName = "p" + std::to_string(observation) + "_" + std::to_string(a);
-                        localWeights.push_back(ratFuncConstructor.translate(carl::freshRealVariable(varName)));
-                        lastWeight -= localWeights.back();
+                        weights.push_back(ratFuncConstructor.translate(carl::freshRealVariable(varName)));
+                        lastWeight -= weights.back();
                     }
-                    localWeights.push_back(lastWeight);
-                    parameters.emplace(observation, localWeights);
-                } else {
-                    STORM_LOG_ASSERT(it->second.size() == pomdp.getNumberOfChoices(state), "Number of choices must be equal for every state with same number of actions");
-                    localWeights = it->second;
+                    weights.push_back(lastWeight);
+                    res.emplace(observation, std::move(weights));
                 }
+                STORM_LOG_ASSERT(res.at(observation).size() == pomdp.getNumberOfChoices(state), "Number of choices must be equal for every state with the same observation");
+            }
+            return res;
+        }
+
+        /// Builds a parametric DTMC from the POMDP: the choices of each state are mixed with the weights of its
+        /// observation, and state-action rewards are folded into state rewards using the same weights.
+        template<typename ValueType>
+        std::shared_ptr<storm::models::sparse::Model<storm::RationalFunction>> ApplyFiniteSchedulerToPomdp<ValueType>::transform() const {
+            storm::storage::sparse::ModelComponents<storm::RationalFunction> modelComponents;
+
+            uint64_t nrStates = pomdp.getNumberOfStates();
+            std::unordered_map<uint32_t, std::vector<storm::RationalFunction>> observationChoiceWeights = getObservationChoiceWeights();
+            storm::storage::SparseMatrixBuilder<storm::RationalFunction> smb(nrStates, nrStates, 0, true);
+            // Row `state` of the result is the sum over its actions of weights[action] times the POMDP row (state, action).
+            for (uint64_t state = 0; state < nrStates; ++state) {
+                auto const& weights = observationChoiceWeights.at(pomdp.getObservation(state));
                 std::map<uint64_t, storm::RationalFunction> weightedTransitions;
                 for (uint64_t action = 0; action < pomdp.getNumberOfChoices(state); ++action) {
                     for (auto const& entry: pomdp.getTransitionMatrix().getRow(state, action)) {
                         auto it = weightedTransitions.find(entry.getColumn());
                         if (it == weightedTransitions.end()) {
-                            weightedTransitions[entry.getColumn()] = storm::utility::convertNumber<storm::RationalFunctionCoefficient>(entry.getValue()) * localWeights[action]; //carl::rationalize<storm::RationalFunctionCoefficient>(entry.getValue()) * localWeights[action];
+                            weightedTransitions[entry.getColumn()] = storm::utility::convertNumber<storm::RationalFunction>(entry.getValue()) * weights[action];
                         } else {
-                            it->second += storm::utility::convertNumber<storm::RationalFunctionCoefficient>(entry.getValue()) * localWeights[action];
+                            it->second += storm::utility::convertNumber<storm::RationalFunction>(entry.getValue()) * weights[action];
                         }
                     }
                 }
-
                 for (auto const& entry : weightedTransitions) {
                     smb.addNextValue(state, entry.first, entry.second);
                 }
             }
-
-            // TODO rewards.
-
-            storm::storage::sparse::ModelComponents<storm::RationalFunction> modelComponents(smb.build(),pomdp.getStateLabeling());
+            modelComponents.transitionMatrix = smb.build();
+            // Each POMDP reward model becomes a state-reward model: state rewards plus weight-mixed state-action rewards.
+            for (auto const& pomdpRewardModel : pomdp.getRewardModels()) {
+                std::vector<storm::RationalFunction> stateRewards;
+                
+                if (pomdpRewardModel.second.hasStateRewards()) {
+                    stateRewards = storm::utility::vector::convertNumericVector<storm::RationalFunction>(pomdpRewardModel.second.getStateRewardVector());
+                } else {
+                    stateRewards.resize(nrStates, storm::utility::zero<storm::RationalFunction>());
+                }
+                if (pomdpRewardModel.second.hasStateActionRewards()) {
+                    auto const& pomdpActionRewards = pomdpRewardModel.second.getStateActionRewardVector();
+                    for (uint64_t state = 0; state < nrStates; ++state) {
+                        auto& stateReward = stateRewards[state];
+                        auto const& weights = observationChoiceWeights.at(pomdp.getObservation(state));
+                        uint64_t offset = pomdp.getTransitionMatrix().getRowGroupIndices()[state];
+                        for (uint64_t action = 0; action < pomdp.getNumberOfChoices(state); ++action) {
+                            if (!storm::utility::isZero(pomdpActionRewards[offset + action])) {
+                                stateReward += storm::utility::convertNumber<storm::RationalFunction>(pomdpActionRewards[offset + action]) * weights[action];
+                            }
+                        }
+                    }
+                }
+                storm::models::sparse::StandardRewardModel<storm::RationalFunction> rewardModel(std::move(stateRewards));
+                modelComponents.rewardModels.emplace(pomdpRewardModel.first, std::move(rewardModel));
+            }
+            
+            modelComponents.stateLabeling = pomdp.getStateLabeling();
+            
             return std::make_shared<storm::models::sparse::Dtmc<storm::RationalFunction>>(modelComponents);
-
+            
         }

        template class ApplyFiniteSchedulerToPomdp<storm::RationalNumber>;
--- a/src/storm-pomdp/transformer/ApplyFiniteSchedulerToPomdp.h
+++ b/src/storm-pomdp/transformer/ApplyFiniteSchedulerToPomdp.h
@ -17,6 +17,12 @@ namespace storm {
            }

            std::shared_ptr<storm::models::sparse::Model<storm::RationalFunction>> transform() const;
+        
+        private:
+            /// Returns, for each observation, the weights of its choices: one fresh parameter per choice
+            /// except the last, whose weight is one minus the sum of the others.
+            std::unordered_map<uint32_t, std::vector<storm::RationalFunction>> getObservationChoiceWeights() const;
+
            storm::models::sparse::Pomdp<ValueType> const& pomdp;
        };
    }
--- a/src/storm-pomdp/transformer/PomdpMemoryUnfolder.cpp
+++ b/src/storm-pomdp/transformer/PomdpMemoryUnfolder.cpp
@ -31,11 +31,11 @@ namespace storm {
            template<typename ValueType>
            storm::storage::SparseMatrix<ValueType> PomdpMemoryUnfolder<ValueType>::transformTransitions() const {
                storm::storage::SparseMatrix<ValueType> const& origTransitions = pomdp.getTransitionMatrix();
-                storm::storage::SparseMatrixBuilder<ValueType> builder(pomdp.getNumberOfStates() * numMemoryStates * numMemoryStates,
+                storm::storage::SparseMatrixBuilder<ValueType> builder(pomdp.getNumberOfChoices() * numMemoryStates * numMemoryStates,
                                                                        pomdp.getNumberOfStates() * numMemoryStates,
                                                                        origTransitions.getEntryCount() * numMemoryStates * numMemoryStates,
                                                                        true,
-                                                                        false,
+                                                                        true,
                                                                        pomdp.getNumberOfStates() * numMemoryStates);
                
                uint64_t row = 0;
@ -96,7 +96,7 @@ namespace storm {
                }
                if (rewardModel.hasStateActionRewards()) {
                    actionRewards = std::vector<ValueType>();
-                    stateRewards->reserve(pomdp.getNumberOfStates() * numMemoryStates * numMemoryStates);
+                    actionRewards->reserve(pomdp.getNumberOfStates() * numMemoryStates * numMemoryStates);
                    for (uint64_t modelState = 0; modelState < pomdp.getNumberOfStates(); ++modelState) {
                        for (uint32_t memState = 0; memState < numMemoryStates; ++memState) {
                            for (uint64_t origRow = pomdp.getTransitionMatrix().getRowGroupIndices()[modelState]; origRow < pomdp.getTransitionMatrix().getRowGroupIndices()[modelState + 1]; ++origRow) {
@ -108,7 +108,7 @@ namespace storm {
                        }
                    }
                }
-                STORM_LOG_THROW(rewardModel.hasTransitionRewards(), storm::exceptions::NotSupportedException, "Transition rewards are currently not supported.");
+                STORM_LOG_THROW(!rewardModel.hasTransitionRewards(), storm::exceptions::NotSupportedException, "Transition rewards are currently not supported.");
                return storm::models::sparse::StandardRewardModel<ValueType>(std::move(stateRewards), std::move(actionRewards));
            }