# adityavk/value_iteration.py (secret gist)

## value_iteration.py
# NOTE: `Planner` and `env` are not defined in this snippet; they must already
# be in scope (imported / created earlier) before these lines run.

# Build the planner from the environment's `P` attribute.
planner = Planner(env.P)

# Run value iteration with gamma=0.99 (presumably the discount factor -- confirm
# against the Planner implementation). The three results are unpacked in order:
# the value function, the history of log V(s), and the optimal policy learnt by VI.
value_func_vi, log_value_func_history_vi, value_iteration_policy = planner.value_iteration(gamma=0.99)