d4/de5/_belief_mdp_explorer_8h_source.html

#pragma once


#include <cstdint>
#include <deque>
#include <map>
#include <memory>
#include <optional>
#include <queue>
#include <string>
#include <unordered_map>
#include <unordered_set>
#include <utility>
#include <vector>

#include "storm-pomdp/storage/BeliefExplorationBounds.h"
#include "storm-pomdp/storage/BeliefManager.h"
#include "storm/models/sparse/Mdp.h"
#include "storm/storage/BitVector.h"


namespace storm {

// Forward declaration only: this header uses storm::Environment solely as a reference
// parameter type (see BeliefMdpExplorer::computeValuesOfExploredMdp).
class Environment;


// Forward declarations of model-checker types, so that this header does not have to
// include their full definitions.
namespace modelchecker {

// Used below as the by-value return type of the private createStandardCheckTask declaration.
template<typename FormulaType, typename ValueType>

class CheckTask;

// Not referenced by any declaration visible in this header.
// NOTE(review): presumably needed by the implementation file -- confirm.
class CheckResult;

}  // namespace modelchecker

namespace builder {

/// Heuristic that can be selected when constructing a BeliefMdpExplorer
/// (the constructor's default is BreadthFirst).
/// NOTE(review): the meaning of each enumerator is only suggested by its name here;
/// confirm the exact ordering semantics against the explorer implementation.
enum class ExplorationHeuristic {
    BreadthFirst,
    LowerBoundPrio,
    UpperBoundPrio,
    GapPrio,
    ProbabilityPrio
};


template<typename PomdpType, typename BeliefValueType = typename PomdpType::ValueType>


class BeliefMdpExplorer {

   public:

    typedef typename PomdpType::ValueType ValueType;

    typedef storm::storage::BeliefManager<PomdpType, BeliefValueType> BeliefManagerType;

    typedef typename BeliefManagerType::BeliefId BeliefId;

    typedef uint64_t MdpStateType;


    struct SuccessorObservationInformation {

        SuccessorObservationInformation(ValueType const &obsProb, ValueType const &maxProb, uint64_t const &count);

        void join(SuccessorObservationInformation other);

        ValueType observationProbability;

        ValueType maxProbabilityToSuccessorWithObs;

        uint64_t successorWithObsCount;

        typename BeliefManagerType::BeliefSupportType support;

    };


    enum class Status { Uninitialized, Exploring, ModelFinished, ModelChecked };


    BeliefMdpExplorer(std::shared_ptr<BeliefManagerType> beliefManager, storm::pomdp::storage::PreprocessingPomdpValueBounds<ValueType> const &pomdpValueBounds,

                      ExplorationHeuristic explorationHeuristic = ExplorationHeuristic::BreadthFirst);


    BeliefMdpExplorer(BeliefMdpExplorer &&other) = default;


    BeliefManagerType const &getBeliefManager() const;


    void startNewExploration(std::optional<ValueType> extraTargetStateValue = boost::none, std::optional<ValueType> extraBottomStateValue = std::nullopt);


    void restartExploration();


    bool hasUnexploredState() const;


    std::vector<uint64_t> getUnexploredStates();


    BeliefId exploreNextState();


    void addChoiceLabelToCurrentState(uint64_t const &localActionIndex, std::string const &label);


    void addTransitionsToExtraStates(uint64_t const &localActionIndex, ValueType const &targetStateValue = storm::utility::zero<ValueType>(),

                                     ValueType const &bottomStateValue = storm::utility::zero<ValueType>());


    void addSelfloopTransition(uint64_t const &localActionIndex = 0, ValueType const &value = storm::utility::one<ValueType>());


    bool addTransitionToBelief(uint64_t const &localActionIndex, BeliefId const &transitionTarget, ValueType const &value, bool ignoreNewBeliefs);


    void computeRewardAtCurrentState(uint64_t const &localActionIndex, ValueType extraReward = storm::utility::zero<ValueType>());


    void addRewardToCurrentState(uint64_t const &localActionIndex, ValueType rewardValue);


    void setCurrentStateIsTarget();


    void setCurrentStateIsTruncated();


    void setCurrentStateIsClipped();


    void setCurrentChoiceIsDelayed(uint64_t const &localActionIndex);


    bool currentStateHasOldBehavior() const;


    bool getCurrentStateWasTruncated() const;


    bool getCurrentStateWasClipped() const;


    bool stateIsOptimalSchedulerReachable(MdpStateType mdpState) const;


    bool actionIsOptimal(uint64_t const &globalActionIndex) const;


    bool currentStateIsOptimalSchedulerReachable() const;


    bool actionAtCurrentStateWasOptimal(uint64_t const &localActionIndex) const;


    bool getCurrentStateActionExplorationWasDelayed(uint64_t const &localActionIndex) const;


    void restoreOldBehaviorAtCurrentState(uint64_t const &localActionIndex);


    void finishExploration();


    void dropUnexploredStates();


    std::shared_ptr<storm::models::sparse::Mdp<ValueType>> getExploredMdp() const;


    MdpStateType getCurrentNumberOfMdpStates() const;


    MdpStateType getCurrentNumberOfMdpChoices() const;


    MdpStateType getStartOfCurrentRowGroup() const;


    uint64_t getSizeOfCurrentRowGroup() const;


    uint64_t getRowGroupSizeOfState(uint64_t state) const;


    bool needsActionAdjustment(uint64_t numActionsNeeded);


    ValueType getLowerValueBoundAtCurrentState() const;


    ValueType getUpperValueBoundAtCurrentState() const;


    ValueType computeLowerValueBoundAtBelief(BeliefId const &beliefId) const;


    ValueType computeUpperValueBoundAtBelief(BeliefId const &beliefId) const;


    ValueType computeLowerValueBoundForScheduler(BeliefId const &beliefId, uint64_t schedulerId) const;


    ValueType computeUpperValueBoundForScheduler(BeliefId const &beliefId, uint64_t schedulerId) const;


    std::pair<bool, ValueType> computeFMSchedulerValueForMemoryNode(BeliefId const &beliefId, uint64_t memoryNode) const;


    storm::storage::Scheduler<ValueType> getUpperValueBoundScheduler(uint64_t schedulerId) const;


    storm::storage::Scheduler<ValueType> getLowerValueBoundScheduler(uint64_t schedulerId) const;


    std::vector<storm::storage::Scheduler<ValueType>> getUpperValueBoundSchedulers() const;


    std::vector<storm::storage::Scheduler<ValueType>> getLowerValueBoundSchedulers() const;


    void computeValuesOfExploredMdp(storm::Environment const &env, storm::solver::OptimizationDirection const &dir);


    bool hasComputedValues() const;


    bool hasFMSchedulerValues() const;


    std::vector<ValueType> const &getValuesOfExploredMdp() const;


    ValueType const &getComputedValueAtInitialState() const;


    MdpStateType getBeliefId(MdpStateType exploredMdpState) const;


    void gatherSuccessorObservationInformationAtCurrentState(uint64_t localActionIndex,

                                                             std::map<uint32_t, SuccessorObservationInformation> &gatheredSuccessorObservations);


    void gatherSuccessorObservationInformationAtMdpChoice(uint64_t mdpChoice,

                                                          std::map<uint32_t, SuccessorObservationInformation> &gatheredSuccessorObservations);


    bool currentStateHasSuccessorObservationInObservationSet(uint64_t localActionIndex, storm::storage::BitVector const &observationSet);


    void takeCurrentValuesAsUpperBounds();


    void takeCurrentValuesAsLowerBounds();


    void computeOptimalChoicesAndReachableMdpStates(ValueType const &ancillaryChoicesEpsilon, bool relativeDifference);


    std::vector<BeliefId> getBeliefsWithObservationInMdp(uint32_t obs) const;


    std::vector<BeliefId> getBeliefsInMdp();


    void addClippingRewardToCurrentState(uint64_t const &localActionIndex, ValueType rewardValue);


    ValueType getTrivialUpperBoundAtPOMDPState(uint64_t const &pomdpState);


    ValueType getTrivialLowerBoundAtPOMDPState(uint64_t const &pomdpState);


    void setExtremeValueBound(storm::pomdp::storage::ExtremePOMDPValueBound<ValueType> valueBound);


    ValueType getExtremeValueBoundAtPOMDPState(uint64_t const &pomdpState);


    MdpStateType getExploredMdpState(BeliefId const &beliefId) const;


    bool beliefHasMdpState(BeliefId const &beliefId) const;


    storm::storage::BitVector getStateExtremeBoundIsInfinite();


    uint64_t getNrSchedulersForUpperBounds();


    uint64_t getNrSchedulersForLowerBounds();


    void markAsGridBelief(BeliefId const &beliefId);


    bool isMarkedAsGridBelief(BeliefId const &beliefId);


    const std::shared_ptr<storm::storage::Scheduler<BeliefMdpExplorer<PomdpType, BeliefValueType>::ValueType>> &getSchedulerForExploredMdp() const;


    void setFMSchedValueList(std::vector<std::vector<std::unordered_map<uint64_t, ValueType>>> valueList);


    uint64_t getNrOfMemoryNodesForObservation(uint32_t observation) const;


    void storeExplorationState();


    void restoreExplorationState();


    void adjustActions(uint64_t totalNumberOfActions);


    std::vector<BeliefValueType> computeProductWithSparseMatrix(BeliefId const &beliefId, storm::storage::SparseMatrix<BeliefValueType> &matrix) const;


   private:

    MdpStateType noState() const;


    std::shared_ptr<storm::logic::Formula const> createStandardProperty(storm::solver::OptimizationDirection const &dir, bool computeRewards);


    storm::modelchecker::CheckTask<storm::logic::Formula, ValueType> createStandardCheckTask(std::shared_ptr<storm::logic::Formula const> &property);


    MdpStateType getCurrentMdpState() const;


    MdpStateType getCurrentBeliefId() const;


    void internalAddTransition(uint64_t const &row, MdpStateType const &column, ValueType const &value);


    void internalAddRowGroupIndex();


    void insertValueHints(ValueType const &lowerBound, ValueType const &upperBound);


    MdpStateType getOrAddMdpState(BeliefId const &beliefId, ValueType const &transitionValue = storm::utility::zero<ValueType>());


    // Belief state related information

    std::shared_ptr<BeliefManagerType> beliefManager;

    std::vector<BeliefId> mdpStateToBeliefIdMap;

    std::map<BeliefId, MdpStateType> beliefIdToMdpStateMap;

    storm::storage::BitVector exploredBeliefIds;

    std::map<BeliefId, std::map<uint64_t, std::string>> mdpStateToChoiceLabelsMap;


    // Exploration information

    std::multimap<ValueType, uint64_t> mdpStatesToExplorePrioState;

    std::map<uint64_t, ValueType> mdpStatesToExploreStatePrio;

    std::vector<ValueType> probabilityEstimation;

    std::vector<std::map<MdpStateType, ValueType>> exploredMdpTransitions;

    std::vector<MdpStateType> exploredChoiceIndices;

    std::vector<MdpStateType> previousChoiceIndices;

    std::vector<ValueType> mdpActionRewards;

    std::map<MdpStateType, ValueType> clippingTransitionRewards;

    uint64_t currentMdpState;

    std::map<MdpStateType, MdpStateType> stateRemapping;

    uint64_t nextId;

    ValueType prio;


    // Special states and choices during exploration

    std::optional<MdpStateType> extraTargetState;

    std::optional<MdpStateType> extraBottomState;

    storm::storage::BitVector targetStates;

    storm::storage::BitVector truncatedStates;

    storm::storage::BitVector clippedStates;

    MdpStateType initialMdpState;

    storm::storage::BitVector delayedExplorationChoices;

    std::unordered_set<BeliefId> gridBeliefs;


    // Final Mdp

    std::shared_ptr<storm::models::sparse::Mdp<ValueType>> exploredMdp;


    // Value and scheduler related information

    storm::pomdp::storage::PreprocessingPomdpValueBounds<ValueType> pomdpValueBounds;

    storm::pomdp::storage::ExtremePOMDPValueBound<ValueType> extremeValueBound;

    std::vector<std::vector<std::unordered_map<uint64_t, ValueType>>> fmSchedulerValueList;

    std::vector<ValueType> lowerValueBounds;

    std::vector<ValueType> upperValueBounds;

    std::vector<ValueType> values;  // Contains an estimate during building and the actual result after a check has performed

    std::optional<storm::storage::BitVector> optimalChoices;

    std::optional<storm::storage::BitVector> optimalChoicesReachableMdpStates;

    std::shared_ptr<storm::storage::Scheduler<ValueType>> scheduler;


    // The current status of this explorer

    ExplorationHeuristic explHeuristic;

    Status status;


    struct ExplorationStorage {

        std::vector<BeliefId> storedMdpStateToBeliefIdMap;

        std::map<BeliefId, MdpStateType> storedBeliefIdToMdpStateMap;

        storm::storage::BitVector storedExploredBeliefIds;

        std::map<BeliefId, std::map<uint64_t, std::string>> storedMdpStateToChoiceLabelsMap;

        std::multimap<ValueType, uint64_t> storedMdpStatesToExplorePrioState;

        std::map<uint64_t, ValueType> storedMdpStatesToExploreStatePrio;

        std::vector<ValueType> storedProbabilityEstimation;

        std::vector<std::map<MdpStateType, ValueType>> storedExploredMdpTransitions;

        std::vector<MdpStateType> storedExploredChoiceIndices;

        std::vector<ValueType> storedMdpActionRewards;

        std::map<MdpStateType, ValueType> storedClippingTransitionRewards;

        uint64_t storedCurrentMdpState;

        std::map<MdpStateType, MdpStateType> storedStateRemapping;

        uint64_t storedNextId;

        ValueType storedPrio;

        std::vector<ValueType> storedLowerValueBounds;

        std::vector<ValueType> storedUpperValueBounds;

        std::vector<ValueType> storedValues;

        storm::storage::BitVector storedTargetStates;

    };


    ExplorationStorage explorationStorage;

};


}  // namespace builder

}  // namespace storm

BeliefExplorationBounds.h

BeliefManager.h

BitVector.h

storm::Environment
Definition Environment.h:17

storm::builder::BeliefMdpExplorer
Definition BeliefMdpExplorer.h:27

storm::builder::BeliefMdpExplorer::getExploredMdpState
MdpStateType getExploredMdpState(BeliefId const &beliefId) const
Definition BeliefMdpExplorer.cpp:1136

storm::builder::BeliefMdpExplorer::storeExplorationState
void storeExplorationState()
Definition BeliefMdpExplorer.cpp:166

storm::builder::BeliefMdpExplorer::addClippingRewardToCurrentState
void addClippingRewardToCurrentState(uint64_t const &localActionIndex, ValueType rewardValue)
Definition BeliefMdpExplorer.cpp:350

storm::builder::BeliefMdpExplorer::computeUpperValueBoundAtBelief
ValueType computeUpperValueBoundAtBelief(BeliefId const &beliefId) const
Definition BeliefMdpExplorer.cpp:875

storm::builder::BeliefMdpExplorer::getNrSchedulersForLowerBounds
uint64_t getNrSchedulersForLowerBounds()
Definition BeliefMdpExplorer.cpp:1321

storm::builder::BeliefMdpExplorer::getCurrentNumberOfMdpStates
MdpStateType getCurrentNumberOfMdpStates() const
Definition BeliefMdpExplorer.cpp:806

storm::builder::BeliefMdpExplorer::getComputedValueAtInitialState
ValueType const & getComputedValueAtInitialState() const
Definition BeliefMdpExplorer.cpp:956

storm::builder::BeliefMdpExplorer::restartExploration
void restartExploration()
Restarts the exploration to allow re-exploring each state.
Definition BeliefMdpExplorer.cpp:123

storm::builder::BeliefMdpExplorer::currentStateHasSuccessorObservationInObservationSet
bool currentStateHasSuccessorObservationInObservationSet(uint64_t localActionIndex, storm::storage::BitVector const &observationSet)
Definition BeliefMdpExplorer.cpp:998

storm::builder::BeliefMdpExplorer::getTrivialLowerBoundAtPOMDPState
ValueType getTrivialLowerBoundAtPOMDPState(uint64_t const &pomdpState)
Definition BeliefMdpExplorer.cpp:1284

storm::builder::BeliefMdpExplorer::setFMSchedValueList
void setFMSchedValueList(std::vector< std::vector< std::unordered_map< uint64_t, ValueType > > > valueList)
Definition BeliefMdpExplorer.cpp:1295

storm::builder::BeliefMdpExplorer::getTrivialUpperBoundAtPOMDPState
ValueType getTrivialUpperBoundAtPOMDPState(uint64_t const &pomdpState)
Definition BeliefMdpExplorer.cpp:1278

storm::builder::BeliefMdpExplorer::addTransitionsToExtraStates
void addTransitionsToExtraStates(uint64_t const &localActionIndex, ValueType const &targetStateValue=storm::utility::zero< ValueType >(), ValueType const &bottomStateValue=storm::utility::zero< ValueType >())
Definition BeliefMdpExplorer.cpp:277

storm::builder::BeliefMdpExplorer::beliefHasMdpState
bool beliefHasMdpState(BeliefId const &beliefId) const
Definition BeliefMdpExplorer.cpp:1061

storm::builder::BeliefMdpExplorer::getValuesOfExploredMdp
std::vector< ValueType > const & getValuesOfExploredMdp() const
Definition BeliefMdpExplorer.cpp:942

storm::builder::BeliefMdpExplorer::getStateExtremeBoundIsInfinite
storm::storage::BitVector getStateExtremeBoundIsInfinite()
Definition BeliefMdpExplorer.cpp:1311

storm::builder::BeliefMdpExplorer::setCurrentStateIsClipped
void setCurrentStateIsClipped()
Definition BeliefMdpExplorer.cpp:371

storm::builder::BeliefMdpExplorer::setCurrentStateIsTarget
void setCurrentStateIsTarget()
Definition BeliefMdpExplorer.cpp:357

storm::builder::BeliefMdpExplorer::getLowerValueBoundScheduler
storm::storage::Scheduler< ValueType > getLowerValueBoundScheduler(uint64_t schedulerId) const
Definition BeliefMdpExplorer.cpp:1327

storm::builder::BeliefMdpExplorer::restoreExplorationState
void restoreExplorationState()
Definition BeliefMdpExplorer.cpp:190

storm::builder::BeliefMdpExplorer::gatherSuccessorObservationInformationAtCurrentState
void gatherSuccessorObservationInformationAtCurrentState(uint64_t localActionIndex, std::map< uint32_t, SuccessorObservationInformation > &gatheredSuccessorObservations)
Definition BeliefMdpExplorer.cpp:970

storm::builder::BeliefMdpExplorer::getSizeOfCurrentRowGroup
uint64_t getSizeOfCurrentRowGroup() const
Definition BeliefMdpExplorer.cpp:825

storm::builder::BeliefMdpExplorer::takeCurrentValuesAsLowerBounds
void takeCurrentValuesAsLowerBounds()
Definition BeliefMdpExplorer.cpp:1016

storm::builder::BeliefMdpExplorer::hasComputedValues
bool hasComputedValues() const
Definition BeliefMdpExplorer.cpp:937

storm::builder::BeliefMdpExplorer::startNewExploration
void startNewExploration(std::optional< ValueType > extraTargetStateValue=boost::none, std::optional< ValueType > extraBottomStateValue=std::nullopt)
Definition BeliefMdpExplorer.cpp:51

storm::builder::BeliefMdpExplorer::getCurrentStateWasTruncated
bool getCurrentStateWasTruncated() const
Definition BeliefMdpExplorer.cpp:393

storm::builder::BeliefMdpExplorer::actionIsOptimal
bool actionIsOptimal(uint64_t const &globalActionIndex) const
Retrieves whether the given action at the current state was optimal in the most recent check.
Definition BeliefMdpExplorer.cpp:419

storm::builder::BeliefMdpExplorer::needsActionAdjustment
bool needsActionAdjustment(uint64_t numActionsNeeded)
Definition BeliefMdpExplorer.cpp:845

storm::builder::BeliefMdpExplorer::getBeliefsWithObservationInMdp
std::vector< BeliefId > getBeliefsWithObservationInMdp(uint32_t obs) const
Definition BeliefMdpExplorer.cpp:1264

storm::builder::BeliefMdpExplorer::getExtremeValueBoundAtPOMDPState
ValueType getExtremeValueBoundAtPOMDPState(uint64_t const &pomdpState)
Definition BeliefMdpExplorer.cpp:1305

storm::builder::BeliefMdpExplorer::getBeliefId
MdpStateType getBeliefId(MdpStateType exploredMdpState) const
Definition BeliefMdpExplorer.cpp:963

storm::builder::BeliefMdpExplorer::computeValuesOfExploredMdp
void computeValuesOfExploredMdp(storm::Environment const &env, storm::solver::OptimizationDirection const &dir)
Definition BeliefMdpExplorer.cpp:915

storm::builder::BeliefMdpExplorer::getBeliefsInMdp
std::vector< BeliefId > getBeliefsInMdp()
Definition BeliefMdpExplorer.cpp:1259

storm::builder::BeliefMdpExplorer::getExploredMdp
std::shared_ptr< storm::models::sparse::Mdp< ValueType > > getExploredMdp() const
Definition BeliefMdpExplorer.cpp:799

storm::builder::BeliefMdpExplorer::getUpperValueBoundScheduler
storm::storage::Scheduler< ValueType > getUpperValueBoundScheduler(uint64_t schedulerId) const
Definition BeliefMdpExplorer.cpp:1336

storm::builder::BeliefMdpExplorer::getLowerValueBoundSchedulers
std::vector< storm::storage::Scheduler< ValueType > > getLowerValueBoundSchedulers() const
Definition BeliefMdpExplorer.cpp:1345

storm::builder::BeliefMdpExplorer::getCurrentStateActionExplorationWasDelayed
bool getCurrentStateActionExplorationWasDelayed(uint64_t const &localActionIndex) const
Definition BeliefMdpExplorer.cpp:447

storm::builder::BeliefMdpExplorer::getBeliefManager
BeliefManagerType const & getBeliefManager() const
Definition BeliefMdpExplorer.cpp:46

storm::builder::BeliefMdpExplorer::Status
Status
Definition BeliefMdpExplorer.h:43

storm::builder::BeliefMdpExplorer::Status::Exploring
@ Exploring

storm::builder::BeliefMdpExplorer::Status::ModelChecked
@ ModelChecked

storm::builder::BeliefMdpExplorer::Status::Uninitialized
@ Uninitialized

storm::builder::BeliefMdpExplorer::Status::ModelFinished
@ ModelFinished

storm::builder::BeliefMdpExplorer::ValueType
PomdpType::ValueType ValueType
Definition BeliefMdpExplorer.h:29

storm::builder::BeliefMdpExplorer::hasUnexploredState
bool hasUnexploredState() const
Definition BeliefMdpExplorer.cpp:222

storm::builder::BeliefMdpExplorer::dropUnexploredStates
void dropUnexploredStates()
Definition BeliefMdpExplorer.cpp:685

storm::builder::BeliefMdpExplorer::setCurrentStateIsTruncated
void setCurrentStateIsTruncated()
Definition BeliefMdpExplorer.cpp:364

storm::builder::BeliefMdpExplorer::BeliefManagerType
storm::storage::BeliefManager< PomdpType, BeliefValueType > BeliefManagerType
Definition BeliefMdpExplorer.h:30

storm::builder::BeliefMdpExplorer::computeFMSchedulerValueForMemoryNode
std::pair< bool, ValueType > computeFMSchedulerValueForMemoryNode(BeliefId const &beliefId, uint64_t memoryNode) const
Definition BeliefMdpExplorer.cpp:905

storm::builder::BeliefMdpExplorer::setExtremeValueBound
void setExtremeValueBound(storm::pomdp::storage::ExtremePOMDPValueBound< ValueType > valueBound)
Definition BeliefMdpExplorer.cpp:1290

storm::builder::BeliefMdpExplorer::hasFMSchedulerValues
bool hasFMSchedulerValues() const
Definition BeliefMdpExplorer.cpp:1359

storm::builder::BeliefMdpExplorer::addChoiceLabelToCurrentState
void addChoiceLabelToCurrentState(uint64_t const &localActionIndex, std::string const &label)
Definition BeliefMdpExplorer.cpp:1254

storm::builder::BeliefMdpExplorer::getUnexploredStates
std::vector< uint64_t > getUnexploredStates()
Definition BeliefMdpExplorer.cpp:228

storm::builder::BeliefMdpExplorer::restoreOldBehaviorAtCurrentState
void restoreOldBehaviorAtCurrentState(uint64_t const &localActionIndex)
Inserts transitions and rewards at the given action as in the MDP of the previous exploration.
Definition BeliefMdpExplorer.cpp:458

storm::builder::BeliefMdpExplorer::computeLowerValueBoundAtBelief
ValueType computeLowerValueBoundAtBelief(BeliefId const &beliefId) const
Definition BeliefMdpExplorer.cpp:863

storm::builder::BeliefMdpExplorer::getRowGroupSizeOfState
uint64_t getRowGroupSizeOfState(uint64_t state) const
Definition BeliefMdpExplorer.cpp:832

storm::builder::BeliefMdpExplorer::currentStateHasOldBehavior
bool currentStateHasOldBehavior() const
Definition BeliefMdpExplorer.cpp:386

storm::builder::BeliefMdpExplorer::getSchedulerForExploredMdp
const std::shared_ptr< storm::storage::Scheduler< BeliefMdpExplorer< PomdpType, BeliefValueType >::ValueType > > & getSchedulerForExploredMdp() const
Definition BeliefMdpExplorer.cpp:950

storm::builder::BeliefMdpExplorer::getStartOfCurrentRowGroup
MdpStateType getStartOfCurrentRowGroup() const
Definition BeliefMdpExplorer.cpp:818

storm::builder::BeliefMdpExplorer::computeLowerValueBoundForScheduler
ValueType computeLowerValueBoundForScheduler(BeliefId const &beliefId, uint64_t schedulerId) const
Definition BeliefMdpExplorer.cpp:887

storm::builder::BeliefMdpExplorer::currentStateIsOptimalSchedulerReachable
bool currentStateIsOptimalSchedulerReachable() const
Retrieves whether the current state can be reached under a scheduler that was optimal in the most rec...
Definition BeliefMdpExplorer.cpp:426

storm::builder::BeliefMdpExplorer::addRewardToCurrentState
void addRewardToCurrentState(uint64_t const &localActionIndex, ValueType rewardValue)
Adds the provided reward value to the given action of the current state.
Definition BeliefMdpExplorer.cpp:340

storm::builder::BeliefMdpExplorer::BeliefMdpExplorer
BeliefMdpExplorer(BeliefMdpExplorer &&other)=default

storm::builder::BeliefMdpExplorer::gatherSuccessorObservationInformationAtMdpChoice
void gatherSuccessorObservationInformationAtMdpChoice(uint64_t mdpChoice, std::map< uint32_t, SuccessorObservationInformation > &gatheredSuccessorObservations)
Definition BeliefMdpExplorer.cpp:979

storm::builder::BeliefMdpExplorer::getNrOfMemoryNodesForObservation
uint64_t getNrOfMemoryNodesForObservation(uint32_t observation) const
Definition BeliefMdpExplorer.cpp:1300

storm::builder::BeliefMdpExplorer::computeRewardAtCurrentState
void computeRewardAtCurrentState(uint64_t const &localActionIndex, ValueType extraReward=storm::utility::zero< ValueType >())
Definition BeliefMdpExplorer.cpp:330

storm::builder::BeliefMdpExplorer::computeOptimalChoicesAndReachableMdpStates
void computeOptimalChoicesAndReachableMdpStates(ValueType const &ancillaryChoicesEpsilon, bool relativeDifference)
Computes the set of states that are reachable via a path that is consistent with an optimal MDP sched...
Definition BeliefMdpExplorer.cpp:1022

storm::builder::BeliefMdpExplorer::getNrSchedulersForUpperBounds
uint64_t getNrSchedulersForUpperBounds()
Definition BeliefMdpExplorer.cpp:1316

storm::builder::BeliefMdpExplorer::isMarkedAsGridBelief
bool isMarkedAsGridBelief(BeliefId const &beliefId)
Definition BeliefMdpExplorer.cpp:1131

storm::builder::BeliefMdpExplorer::getUpperValueBoundAtCurrentState
ValueType getUpperValueBoundAtCurrentState() const
Definition BeliefMdpExplorer.cpp:857

storm::builder::BeliefMdpExplorer::exploreNextState
BeliefId exploreNextState()
Definition BeliefMdpExplorer.cpp:239

storm::builder::BeliefMdpExplorer::markAsGridBelief
void markAsGridBelief(BeliefId const &beliefId)
Definition BeliefMdpExplorer.cpp:1126

storm::builder::BeliefMdpExplorer::computeUpperValueBoundForScheduler
ValueType computeUpperValueBoundForScheduler(BeliefId const &beliefId, uint64_t schedulerId) const
Definition BeliefMdpExplorer.cpp:896

storm::builder::BeliefMdpExplorer::adjustActions
void adjustActions(uint64_t totalNumberOfActions)
Definition BeliefMdpExplorer.cpp:1370

storm::builder::BeliefMdpExplorer::actionAtCurrentStateWasOptimal
bool actionAtCurrentStateWasOptimal(uint64_t const &localActionIndex) const
Retrieves whether the given action at the current state was optimal in the most recent check.
Definition BeliefMdpExplorer.cpp:436

storm::builder::BeliefMdpExplorer::setCurrentChoiceIsDelayed
void setCurrentChoiceIsDelayed(uint64_t const &localActionIndex)
Definition BeliefMdpExplorer.cpp:379

storm::builder::BeliefMdpExplorer::computeProductWithSparseMatrix
std::vector< BeliefValueType > computeProductWithSparseMatrix(BeliefId const &beliefId, storm::storage::SparseMatrix< BeliefValueType > &matrix) const
Definition BeliefMdpExplorer.cpp:1364

storm::builder::BeliefMdpExplorer::addSelfloopTransition
void addSelfloopTransition(uint64_t const &localActionIndex=0, ValueType const &value=storm::utility::one< ValueType >())
Definition BeliefMdpExplorer.cpp:295

storm::builder::BeliefMdpExplorer::getUpperValueBoundSchedulers
std::vector< storm::storage::Scheduler< ValueType > > getUpperValueBoundSchedulers() const
Definition BeliefMdpExplorer.cpp:1352

storm::builder::BeliefMdpExplorer::getLowerValueBoundAtCurrentState
ValueType getLowerValueBoundAtCurrentState() const
Definition BeliefMdpExplorer.cpp:851

storm::builder::BeliefMdpExplorer::MdpStateType
uint64_t MdpStateType
Definition BeliefMdpExplorer.h:32

storm::builder::BeliefMdpExplorer::getCurrentStateWasClipped
bool getCurrentStateWasClipped() const
Definition BeliefMdpExplorer.cpp:402

storm::builder::BeliefMdpExplorer::addTransitionToBelief
bool addTransitionToBelief(uint64_t const &localActionIndex, BeliefId const &transitionTarget, ValueType const &value, bool ignoreNewBeliefs)
Adds the next transition to the given successor belief.
Definition BeliefMdpExplorer.cpp:305

storm::builder::BeliefMdpExplorer::takeCurrentValuesAsUpperBounds
void takeCurrentValuesAsUpperBounds()
Definition BeliefMdpExplorer.cpp:1010

storm::builder::BeliefMdpExplorer::stateIsOptimalSchedulerReachable
bool stateIsOptimalSchedulerReachable(MdpStateType mdpState) const
Retrieves whether the current state can be reached under an optimal scheduler. This requires a previou...
Definition BeliefMdpExplorer.cpp:411

storm::builder::BeliefMdpExplorer::BeliefId
BeliefManagerType::BeliefId BeliefId
Definition BeliefMdpExplorer.h:31

storm::builder::BeliefMdpExplorer::finishExploration
void finishExploration()
Definition BeliefMdpExplorer.cpp:516

storm::builder::BeliefMdpExplorer::getCurrentNumberOfMdpChoices
MdpStateType getCurrentNumberOfMdpChoices() const
Definition BeliefMdpExplorer.cpp:812

storm::modelchecker::CheckTask
Definition CheckTask.h:30

storm::storage::BeliefManager
Definition BeliefManager.h:22

storm::storage::BeliefManager::BeliefSupportType
boost::container::flat_set< StateType > BeliefSupportType
Definition BeliefManager.h:26

storm::storage::BeliefManager::BeliefId
uint64_t BeliefId
Definition BeliefManager.h:27

storm::storage::BitVector
A bit vector that is internally represented as a vector of 64-bit values.
Definition BitVector.h:18

storm::storage::Scheduler
This class defines which action is chosen in a particular state of a non-deterministic model.
Definition Scheduler.h:18

storm::storage::SparseMatrix
A class that holds a possibly non-square matrix in the compressed row storage format.
Definition SparseMatrix.h:332

storm::builder::ExplorationHeuristic
ExplorationHeuristic
Definition BeliefMdpExplorer.h:24

storm::builder::ExplorationHeuristic::LowerBoundPrio
@ LowerBoundPrio

storm::builder::ExplorationHeuristic::BreadthFirst
@ BreadthFirst

storm::builder::ExplorationHeuristic::GapPrio
@ GapPrio

storm::builder::ExplorationHeuristic::UpperBoundPrio
@ UpperBoundPrio

storm::builder::ExplorationHeuristic::ProbabilityPrio
@ ProbabilityPrio

storm::solver::OptimizationDirection
OptimizationDirection
Definition OptimizationDirection.h:8

storm
LabParser.cpp.
Definition cli.cpp:18

Mdp.h

storm::builder::BeliefMdpExplorer::SuccessorObservationInformation
Definition BeliefMdpExplorer.h:34

storm::builder::BeliefMdpExplorer::SuccessorObservationInformation::support
BeliefManagerType::BeliefSupportType support
Definition BeliefMdpExplorer.h:40

storm::builder::BeliefMdpExplorer::SuccessorObservationInformation::join
void join(SuccessorObservationInformation other)
Definition BeliefMdpExplorer.cpp:30

storm::builder::BeliefMdpExplorer::SuccessorObservationInformation::maxProbabilityToSuccessorWithObs
ValueType maxProbabilityToSuccessorWithObs
The maximal probability to move to a successor with the corresponding observation.
Definition BeliefMdpExplorer.h:38

storm::builder::BeliefMdpExplorer::SuccessorObservationInformation::successorWithObsCount
uint64_t successorWithObsCount
The number of successor belief states with this observation.
Definition BeliefMdpExplorer.h:39

storm::builder::BeliefMdpExplorer::SuccessorObservationInformation::observationProbability
ValueType observationProbability
The probability we move to the corresponding observation.
Definition BeliefMdpExplorer.h:37

storm::pomdp::storage::ExtremePOMDPValueBound
Struct to store the extreme bound values needed for the reward correction values when clipping is use...
Definition BeliefExplorationBounds.h:53

storm::pomdp::storage::PreprocessingPomdpValueBounds
Struct for storing precomputed values bounding the actual values on the POMDP.
Definition BeliefExplorationBounds.h:13