prism-accumulation/prism/src/mtbdd/PM_NondetReachReward.cc


								//==============================================================================

								//

								//	Copyright (c) 2002-

								//	Authors:

								//	* Dave Parker <david.parker@comlab.ox.ac.uk> (University of Oxford, formerly University of Birmingham)

								//

								//------------------------------------------------------------------------------

								//

								//	This file is part of PRISM.

								//

								//	PRISM is free software; you can redistribute it and/or modify

								//	it under the terms of the GNU General Public License as published by

								//	the Free Software Foundation; either version 2 of the License, or

								//	(at your option) any later version.

								//

								//	PRISM is distributed in the hope that it will be useful,

								//	but WITHOUT ANY WARRANTY; without even the implied warranty of

								//	MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

								//	GNU General Public License for more details.

								//

								//	You should have received a copy of the GNU General Public License

								//	along with PRISM; if not, write to the Free Software Foundation,

								//	Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA

								//

								//==============================================================================


								// includes

								#include "PrismMTBDD.h"

								#include <math.h>

								#include <util.h>

								#include <cudd.h>

								#include <dd.h>

								#include <odd.h>

								#include "PrismMTBDDGlob.h"

								#include "jnipointer.h"

								#include "prism.h"


								//------------------------------------------------------------------------------


								JNIEXPORT jlong __jlongpointer JNICALL Java_mtbdd_PrismMTBDD_PM_1NondetReachReward

								(

								JNIEnv *env,

								jclass cls,

								jlong __jlongpointer t,	// trans matrix

								jlong __jlongpointer sr,	// state rewards

								jlong __jlongpointer trr,	// state rewards

								jlong __jlongpointer od,	// odd

								jlong __jlongpointer ndm,	// nondeterminism mask

								jlong __jlongpointer rv,	// row vars

								jint num_rvars,

								jlong __jlongpointer cv,	// col vars

								jint num_cvars,

								jlong __jlongpointer ndv,	// nondet vars

								jint num_ndvars,

								jlong __jlongpointer g,	// 'goal' states

								jlong __jlongpointer in,	// 'inf' states

								jlong __jlongpointer m,	// 'maybe' states

								jboolean min		// min or max probabilities (true = min, false = max)

								)

								{

									// cast function parameters

									DdNode *trans = jlong_to_DdNode(t);		// trans matrix

									DdNode *state_rewards = jlong_to_DdNode(sr);	// state rewards

									DdNode *trans_rewards = jlong_to_DdNode(trr);	// transition rewards

									ODDNode *odd = jlong_to_ODDNode(od);		// odd

									DdNode *mask = jlong_to_DdNode(ndm);		// nondeterminism mask

									DdNode **rvars = jlong_to_DdNode_array(rv);	// row vars

									DdNode **cvars = jlong_to_DdNode_array(cv);	// col vars

									DdNode **ndvars = jlong_to_DdNode_array(ndv);	// nondet vars

									DdNode *goal = jlong_to_DdNode(g);		// 'goal' states

									DdNode *inf = jlong_to_DdNode(in); 		// 'inf' states

									DdNode *maybe = jlong_to_DdNode(m); 		// 'maybe' states


									// mtbdds

									DdNode *reach, *a, *all_rewards, *new_mask, *sol, *tmp;

									// timing stuff

									long start1, start2, start3, stop;

									double time_taken, time_for_setup, time_for_iters;

									// misc

									bool done;

									int iters, i;


									// start clocks

									start1 = start2 = util_cpu_time();


									// get reachable states

									reach = odd->dd;


									PM_PrintToMainLog(env, "\nBuilding iteration matrix MTBDD... ");


									// filter out rows (goal states and infinity states) from matrix

									Cudd_Ref(trans);

									Cudd_Ref(maybe);

									a = DD_Apply(ddman, APPLY_TIMES, trans, maybe);


									// also remove goal and infinity states from state rewards vector

									Cudd_Ref(state_rewards);

									Cudd_Ref(maybe);

									state_rewards = DD_Apply(ddman, APPLY_TIMES, state_rewards, maybe);


									// multiply transition rewards by transition probs and sum rows

									// (note also filters out unwanted states at the same time)

									Cudd_Ref(trans_rewards);

									Cudd_Ref(a);

									trans_rewards = DD_Apply(ddman, APPLY_TIMES, trans_rewards, a);

									trans_rewards = DD_SumAbstract(ddman, trans_rewards, cvars, num_cvars);


									// combine state and transition rewards

									all_rewards = DD_Apply(ddman, APPLY_PLUS, state_rewards, trans_rewards);


									// need to change mask because rewards are not necessarily in the range 0..1

									Cudd_Ref(mask);

									new_mask = DD_ITE(ddman, mask, DD_PlusInfinity(ddman), DD_Constant(ddman, 0));


									// initial solution is infinity in 'inf' states, zero elsewhere

									// note: ok to do this because cudd matrix-multiply (and other ops)

									// treat 0 * inf as 0, unlike in IEEE 754 rules

									Cudd_Ref(inf);

									sol = DD_ITE(ddman, inf, DD_PlusInfinity(ddman), DD_Constant(ddman, 0));


									// print memory usage

									i = DD_GetNumNodes(ddman, a);

									PM_PrintToMainLog(env, "[nodes=%d] [%.1f Kb]\n", i, i*20.0/1024.0);


									// get setup time

									stop = util_cpu_time();

									time_for_setup = (double)(stop - start2)/1000;

									start2 = stop;

									start3 = stop;


									// start iterations

									iters = 0;

									done = false;

									PM_PrintToMainLog(env, "\nStarting iterations...\n");


									while (!done && iters < max_iters) {


										iters++;


										// matrix-vector multiply

										Cudd_Ref(sol);

										tmp = DD_PermuteVariables(ddman, sol, rvars, cvars, num_rvars);

										Cudd_Ref(a);

										tmp = DD_MatrixMultiply(ddman, a, tmp, cvars, num_cvars, MM_BOULDER);


										// add rewards

										Cudd_Ref(all_rewards);

										tmp = DD_Apply(ddman, APPLY_PLUS, tmp, all_rewards);


										// do min/max

										if (min) {

											// mask stuff

											Cudd_Ref(new_mask);

											tmp = DD_Apply(ddman, APPLY_MAX, tmp, new_mask);

											// abstract

											tmp = DD_MinAbstract(ddman, tmp, ndvars, num_ndvars);

										}

										else {

											// abstract

											tmp = DD_MaxAbstract(ddman, tmp, ndvars, num_ndvars);

										}


										// put infinities (for 'inf' states) back into into solution vector

										Cudd_Ref(inf);

										tmp = DD_ITE(ddman, inf, DD_PlusInfinity(ddman), tmp);


										// check convergence

										switch (term_crit) {

										case TERM_CRIT_ABSOLUTE:

											if (DD_EqualSupNorm(ddman, tmp, sol, term_crit_param)) {

												done = true;

											}

											break;

										case TERM_CRIT_RELATIVE:

											if (DD_EqualSupNormRel(ddman, tmp, sol, term_crit_param)) {

												done = true;

											}

											break;

										}


										// print occasional status update

										if ((util_cpu_time() - start3) > UPDATE_DELAY) {

											PM_PrintToMainLog(env, "Iteration %d: ", iters);

											PM_PrintToMainLog(env, "%.2f sec so far\n", ((double)(util_cpu_time() - start2)/1000));

											start3 = util_cpu_time();

										}


										// prepare for next iteration

										Cudd_RecursiveDeref(ddman, sol);

										sol = tmp;

									}


									// stop clocks

									stop = util_cpu_time();

									time_for_iters = (double)(stop - start2)/1000;

									time_taken = (double)(stop - start1)/1000;


									// print iterations/timing info

									PM_PrintToMainLog(env, "\nIterative method: %d iterations in %.2f seconds (average %.6f, setup %.2f)\n", iters, time_taken, time_for_iters/iters, time_for_setup);


									// free memory

									Cudd_RecursiveDeref(ddman, a);

									Cudd_RecursiveDeref(ddman, all_rewards);

									Cudd_RecursiveDeref(ddman, new_mask);


									// if the iterative method didn't terminate, this is an error

									if (!done) { Cudd_RecursiveDeref(ddman, sol); PM_SetErrorMessage("Iterative method did not converge within %d iterations.\nConsider using a different numerical method or increasing the maximum number of iterations", iters); return 0; }


									return ptr_to_jlong(sol);

								}


								//------------------------------------------------------------------------------