imported patch rewardcounter-MDPCounterAndCounterTransformation.patch

7 years ago · 40eafca2f5
2 changed files with 116 additions and 0 deletions
--- a/prism/src/explicit/CounterProduct.java
+++ b/prism/src/explicit/CounterProduct.java
@ -32,6 +32,7 @@ import java.util.BitSet;
 import common.SafeCast;

 import explicit.rewards.MCRewards;
+import explicit.rewards.MDPRewards;
 import prism.IntegerBound;
 import prism.PrismException;

@ -88,6 +89,74 @@ public class CounterProduct<M extends Model> extends ProductWithProductStates<M>
 		return result;
 	}

+	/**
+	 * Generate the product of a MDP with an accumulated reward counter.
+	 * The counter has the range [0,limit], with saturation semantics for accumulated
+	 * rewards >=limit.
+	 * @param graph the MDP
+	 * @param rewards integer MCRewards
+	 * @param limit the saturation value for the counter
+	 * @param statesOfInterest the set of state of interest, the starting point for the counters
+	 * @return
+	 * @throws PrismException
+	 */
+	static public CounterProduct<MDP> generate(final MDP graph, final MDPRewards rewards, final int limit, BitSet statesOfInterest) throws PrismException {
+		final CounterProduct<MDP> result = new CounterProduct<MDP>(graph, limit);
+
+		class RewardProductOperator implements MDPProductOperator {
+			@Override
+			public ProductState getInitialState(Integer dtmc_state)
+			{
+				return new ProductState(dtmc_state, 0);
+			}
+
+			@Override
+			public ProductState getSuccessor(ProductState from_state, int choice_i, Integer dtmc_to_state) throws PrismException
+			{
+				// the accumulated reward
+				int acc_reward = from_state.getSecondState();
+
+				// reward(s) is accumulated on transition *from* s
+				int state_reward = SafeCast.toInt(rewards.getStateReward(from_state.getFirstState()));
+				// transition reward depends on choice_i
+				int transition_reward = SafeCast.toInt(rewards.getTransitionReward(from_state.getFirstState(), choice_i));
+
+				int next_reward = acc_reward + state_reward + transition_reward;
+				if (next_reward >= limit) {
+					// saturated
+					next_reward = limit;
+				}
+				return new ProductState(dtmc_to_state, next_reward);
+			}
+
+			@Override
+			public void notify(ProductState state, Integer index) throws PrismException
+			{
+				// store product state in the corresponding bitset of accRewardToStates
+				int reward = state.getSecondState();
+				result.accRewardToStates.get(reward).set(index);
+			}
+
+			@Override
+			public MDP getGraph()
+			{
+				return graph;
+			}
+
+			@Override
+			public void finish() throws PrismException {
+				// nothing to do
+			}
+		};
+
+		RewardProductOperator product_op = new RewardProductOperator();
+
+		ProductWithProductStates.generate(product_op, result, statesOfInterest);
+
+		return result;
+	}
+
+
 	/**
 	 * Generate the product of a DTMC with an accumulated reward counter.
 	 * The counter has the range [0,limit], with saturation semantics for accumulated
--- a/prism/src/explicit/CounterTransformation.java
+++ b/prism/src/explicit/CounterTransformation.java
@ -114,6 +114,8 @@ public class CounterTransformation<M extends Model> implements ModelExpressionTr
 	private void doTransformation(M originalModel, TemporalOperatorBound bound, BitSet statesOfInterest) throws PrismException {
 		if (originalModel instanceof DTMC) {
 			doTransformation((DTMC)originalModel, bound, statesOfInterest);
+		} else if (originalModel instanceof MDP) {
+				doTransformation((MDP)originalModel, bound, statesOfInterest);
 		} else {
 			throw new PrismException("Counter-Transformation is not supported for "+originalModel.getClass());
 		}
@ -163,6 +165,51 @@ public class CounterTransformation<M extends Model> implements ModelExpressionTr
 		}
 	}

+	private void doTransformation(MDP originalModel, TemporalOperatorBound bound, BitSet statesOfInterest) throws PrismException
+	{
+		IntegerBound intBound = IntegerBound.fromTemporalOperatorBound(bound, mc.constantValues, true);
+		int saturation_limit = intBound.getMaximalInterestingValue();
+
+		MDPRewards rewards = null;
+
+		switch (bound.getBoundType()) {
+		case REWARD_BOUND: {
+			// Get reward info
+			Object rs = bound.getRewardStructureIndex();
+			RewardStruct rewStruct = ExpressionReward.getRewardStructByIndexObject(rs, mc.modulesFile, mc.constantValues);
+
+			ConstructRewards construct_rewards = new ConstructRewards();
+			rewards = construct_rewards.buildMDPRewardStructure(originalModel, rewStruct, originalModel.getConstantValues());
+			break;
+		}
+		case DEFAULT_BOUND:
+		case STEP_BOUND:
+		case TIME_BOUND:
+			// a time/step bound, use constant reward structure assigning 1 to each state
+			rewards = new StateRewardsConstant(1);
+			break;
+		}
+
+		if (rewards == null) {
+			throw new PrismException("Couldn't generate reward information.");
+		}
+
+		product = (CounterProduct<M>) CounterProduct.generate(originalModel, rewards, saturation_limit, statesOfInterest);
+
+		// add 'in_bound-x' label
+		BitSet statesInBound = product.getStatesWithAccumulatedRewardInBound(intBound);
+		String labelInBound = ((MDPExplicit)product.getTransformedModel()).addUniqueLabel("in_bound", statesInBound, mc.getDefinedLabelNames());
+
+		// transform expression
+		ReplaceBound replace = new ReplaceBound(bound, labelInBound);
+		transformedExpression = (Expression) transformedExpression.accept(replace);
+
+		if (!replace.wasSuccessfull()) {
+			throw new PrismException("Replacing bound was not successfull.");
+		}
+	}
+
+
 	public static <M extends Model> ModelExpressionTransformation<M, M> replaceBoundsWithCounters(ProbModelChecker parent,
 			M originalModel, Expression originalExpression,
 			List<TemporalOperatorBound> bounds,