restore remove_reward_model bind

randriu · Jan 26, 2024 · 7d3be7e · 7d3be7e
1 parent 387a3cf
commit 7d3be7e
Show file tree

Hide file tree

Showing 9 changed files with 730 additions and 733 deletions.
diff --git a/paynt/parser/sketch.py b/paynt/parser/sketch.py
@@ -46,7 +46,7 @@ def make_rewards_action_based(model):
             for action in range(tm.get_row_group_start(state),tm.get_row_group_end(state)):
                 action_reward[action] += state_reward
 
-        model.remove_reward_model(name)
+        payntbind.synthesis.remove_reward_model(model,name)
         new_reward_model = stormpy.storage.SparseRewardModel(optional_state_action_reward_vector=action_reward)
         model.add_reward_model(name, new_reward_model)
 

diff --git a/paynt/synthesizer/policy_tree.py b/paynt/synthesizer/policy_tree.py
@@ -235,12 +235,14 @@ def node_id(self):
     def add_nodes_to_graphviz_tree(self, graphviz_tree):
         node_label = ""
         if self.sat is False:
-            node_label = "X"
+            node_label = "∅"
+            # node_label = "X"
         elif self.sat is True:
             # node_label = "✓"
             node_label = f"p{self.policy_index}"
         graphviz_tree.node(self.node_id, label=node_label, shape="ellipse", width="0.15", height="0.15")
-        for child in self.child_nodes:
+        # enumerating in reverse to print policies in ascending order, from left to right
+        for child in reversed(self.child_nodes):
             child.add_nodes_to_graphviz_tree(graphviz_tree)
 
     def add_edges_to_graphviz_tree(self, graphviz_tree):

diff --git a/payntbind/src/synthesis/helpers.cpp b/payntbind/src/synthesis/helpers.cpp
@@ -12,6 +12,7 @@
 #include <storm/environment/solver/NativeSolverEnvironment.h>
 #include <storm/environment/solver/MinMaxSolverEnvironment.h>
 #include <storm/storage/SparseMatrix.h>
+#include <storm/models/sparse/Model.h>
 
 namespace synthesis {
 
@@ -36,6 +37,11 @@ std::shared_ptr<storm::logic::Formula> transformUntilToEventually(
     return modified_formula;
 }
 
+template<typename ValueType>
+void removeRewardModel(storm::models::sparse::Model<ValueType> & model, std::string const& reward_name) {
+    model.removeRewardModel(reward_name);
+}
+
 }
 
 
@@ -51,6 +57,7 @@ void define_helpers(py::module& m) {
     });
 
     m.def("transform_until_to_eventually", &synthesis::transformUntilToEventually<double>, py::arg("formula"));
+    m.def("remove_reward_model", &synthesis::removeRewardModel<double>, py::arg("model"), py::arg("reward_name"));
 
     m.def("multiply_with_vector", [] (storm::storage::SparseMatrix<double> matrix,std::vector<double> vector) {
         std::vector<double> result(matrix.getRowCount());

diff --git a/payntbind/src/synthesis/pomdp/PomdpManager.cpp b/payntbind/src/synthesis/pomdp/PomdpManager.cpp
diff --git a/payntbind/src/synthesis/pomdp/PomdpManager.h b/payntbind/src/synthesis/pomdp/PomdpManager.h
@@ -3,126 +3,124 @@
 #include "storm/models/sparse/Mdp.h"
 #include "storm/models/sparse/Pomdp.h"
 
-namespace storm {
-    namespace synthesis {
-
-        template<typename ValueType>
-        class PomdpManager {
-
-        public:
-
-            PomdpManager(storm::models::sparse::Pomdp<ValueType> const& pomdp);
-
-            // number of actions available at this observation
-            std::vector<uint64_t> observation_actions;
-            // for each observation, a list of successor observations
-            std::vector<std::vector<uint64_t>> observation_successors;
-
-            /** Memory manipulation . */
-
-            // for each observation contains the number of allocated memory states (initially 1)
-            std::vector<uint64_t> observation_memory_size;
-
-            // set memory size to a selected observation
-            void setObservationMemorySize(uint64_t obs, uint64_t memory_size);
-            // set memory size to all observations
-            void setGlobalMemorySize(uint64_t memory_size);
-
-            // unfold memory model (a priori memory update) into the POMDP
-            std::shared_ptr<storm::models::sparse::Mdp<ValueType>> constructMdp();
-
-            /** Design space associated with this POMDP. */
-
-            // total number of holes
-            uint64_t num_holes;
-            // for each observation, a list of action holes
-            std::vector<std::vector<uint64_t>> action_holes;
-            // for each observation, a list of memory holes
-            std::vector<std::vector<uint64_t>> memory_holes;
-            // for each hole, its size
-            std::vector<uint64_t> hole_options;
-
-            /** Unfolded MDP stuff. */
-
-            // MDP obtained after last injection (initially contains MDP-ized POMDP)
-            std::shared_ptr<storm::models::sparse::Mdp<ValueType>> mdp;
-
-            // for each state contains its prototype state (reverse of prototype_duplicates)
-            std::vector<uint64_t> state_prototype;
-            // for each state contains its memory index
-            std::vector<uint64_t> state_memory;
-
-            // for each row, the corresponding action hole
-            std::vector<uint64_t> row_action_hole;
-            // for each row, the corresponding option of the action hole
-            std::vector<uint64_t> row_action_option;
-            // for each row, the corresponding memory hole
-            std::vector<uint64_t> row_memory_hole;
-            // for each row, the corresponding option of the memory hole
-            std::vector<uint64_t> row_memory_option;
-
-            // for each observation contains the maximum memory size of a destination
-            // across all rows of a prototype state having this observation
-            std::vector<uint64_t> max_successor_memory_size;
-
-
-        private:
-
-            /**
-             * Build the state space:
-             * - compute total number of states (@num_states)
-             * - associate prototype states with their duplicates (@prototype_duplicates)
-             * - for each state, remember its prototype (@state_prototype)
-             * - for each state, remember its memory (@state_memory)
-             */ 
-            void buildStateSpace();
-
-            /**
-             * Get index of the @memory equivalent of the @prototype.
-             * If the prototype does not have the corresponding memory
-             * equivalent, default to @memory=0.
-             */
-            uint64_t translateState(uint64_t prototype, uint64_t memory);
-
-            // compute max memory size among all destinations of a prototype row
-            uint64_t maxSuccessorMemorySize(uint64_t prototype_row);
-
-            /**
-             * Build the shape of the transition matrix:
-             * - for each row store its prototype (@row_prototype)
-             * - for each row store its memory index (@row_memory)
-             * - deduce row groups of the resulting transition matrix (@row_groups)
-             * - deduce the overall number of rows (@num_rows)
-             */
-            void buildTransitionMatrix();
-
-            void buildTransitionMatrixSpurious();
-
-            void resetDesignSpace();
-            void buildDesignSpaceSpurious();
-
-            storm::models::sparse::StateLabeling constructStateLabeling();
-            storm::storage::SparseMatrix<ValueType> constructTransitionMatrix();
-            storm::models::sparse::StandardRewardModel<ValueType> constructRewardModel(storm::models::sparse::StandardRewardModel<ValueType> const& reward_model);
-
-            // original POMDP
-            storm::models::sparse::Pomdp<ValueType> const& pomdp;
-            // for each row of a POMDP contains its index in its row group
-            std::vector<uint64_t> prototype_row_index;
-
-            // number of states in an unfolded MDP
-            uint64_t num_states;
-            // for each prototype state contains a list of its duplicates (including itself)
-            std::vector<std::vector<uint64_t>> prototype_duplicates;
-
-            // number of rows in an unfolded MDP
-            uint64_t num_rows;
-            // row groups of the resulting transition matrix
-            std::vector<uint64_t> row_groups;
-            // for each row contains index of the prototype row
-            std::vector<uint64_t> row_prototype;
-            // for each row contains a memory update associated with it 
-            std::vector<uint64_t> row_memory;
-        };
-    }
+namespace synthesis {
+
+    template<typename ValueType>
+    class PomdpManager {
+
+    public:
+
+        PomdpManager(storm::models::sparse::Pomdp<ValueType> const& pomdp);
+
+        // number of actions available at this observation
+        std::vector<uint64_t> observation_actions;
+        // for each observation, a list of successor observations
+        std::vector<std::vector<uint64_t>> observation_successors;
+
+        /** Memory manipulation . */
+
+        // for each observation contains the number of allocated memory states (initially 1)
+        std::vector<uint64_t> observation_memory_size;
+
+        // set memory size to a selected observation
+        void setObservationMemorySize(uint64_t obs, uint64_t memory_size);
+        // set memory size to all observations
+        void setGlobalMemorySize(uint64_t memory_size);
+
+        // unfold memory model (a priori memory update) into the POMDP
+        std::shared_ptr<storm::models::sparse::Mdp<ValueType>> constructMdp();
+
+        /** Design space associated with this POMDP. */
+
+        // total number of holes
+        uint64_t num_holes;
+        // for each observation, a list of action holes
+        std::vector<std::vector<uint64_t>> action_holes;
+        // for each observation, a list of memory holes
+        std::vector<std::vector<uint64_t>> memory_holes;
+        // for each hole, its size
+        std::vector<uint64_t> hole_options;
+
+        /** Unfolded MDP stuff. */
+
+        // MDP obtained after last injection (initially contains MDP-ized POMDP)
+        std::shared_ptr<storm::models::sparse::Mdp<ValueType>> mdp;
+
+        // for each state contains its prototype state (reverse of prototype_duplicates)
+        std::vector<uint64_t> state_prototype;
+        // for each state contains its memory index
+        std::vector<uint64_t> state_memory;
+
+        // for each row, the corresponding action hole
+        std::vector<uint64_t> row_action_hole;
+        // for each row, the corresponding option of the action hole
+        std::vector<uint64_t> row_action_option;
+        // for each row, the corresponding memory hole
+        std::vector<uint64_t> row_memory_hole;
+        // for each row, the corresponding option of the memory hole
+        std::vector<uint64_t> row_memory_option;
+
+        // for each observation contains the maximum memory size of a destination
+        // across all rows of a prototype state having this observation
+        std::vector<uint64_t> max_successor_memory_size;
+
+
+    private:
+
+        /**
+         * Build the state space:
+         * - compute total number of states (@num_states)
+         * - associate prototype states with their duplicates (@prototype_duplicates)
+         * - for each state, remember its prototype (@state_prototype)
+         * - for each state, remember its memory (@state_memory)
+         */ 
+        void buildStateSpace();
+
+        /**
+         * Get index of the @memory equivalent of the @prototype.
+         * If the prototype does not have the corresponding memory
+         * equivalent, default to @memory=0.
+         */
+        uint64_t translateState(uint64_t prototype, uint64_t memory);
+
+        // compute max memory size among all destinations of a prototype row
+        uint64_t maxSuccessorMemorySize(uint64_t prototype_row);
+
+        /**
+         * Build the shape of the transition matrix:
+         * - for each row store its prototype (@row_prototype)
+         * - for each row store its memory index (@row_memory)
+         * - deduce row groups of the resulting transition matrix (@row_groups)
+         * - deduce the overall number of rows (@num_rows)
+         */
+        void buildTransitionMatrix();
+
+        void buildTransitionMatrixSpurious();
+
+        void resetDesignSpace();
+        void buildDesignSpaceSpurious();
+
+        storm::models::sparse::StateLabeling constructStateLabeling();
+        storm::storage::SparseMatrix<ValueType> constructTransitionMatrix();
+        storm::models::sparse::StandardRewardModel<ValueType> constructRewardModel(storm::models::sparse::StandardRewardModel<ValueType> const& reward_model);
+
+        // original POMDP
+        storm::models::sparse::Pomdp<ValueType> const& pomdp;
+        // for each row of a POMDP contains its index in its row group
+        std::vector<uint64_t> prototype_row_index;
+
+        // number of states in an unfolded MDP
+        uint64_t num_states;
+        // for each prototype state contains a list of its duplicates (including itself)
+        std::vector<std::vector<uint64_t>> prototype_duplicates;
+
+        // number of rows in an unfolded MDP
+        uint64_t num_rows;
+        // row groups of the resulting transition matrix
+        std::vector<uint64_t> row_groups;
+        // for each row contains index of the prototype row
+        std::vector<uint64_t> row_prototype;
+        // for each row contains a memory update associated with it 
+        std::vector<uint64_t> row_memory;
+    };
 }