ZSalloum

## FictitiousPlay_2x2_OddEvenGame

// NOTE(review): presumably the iteration limit for the simulation (going by the
// name); the code that reads it is not visible in this excerpt -- confirm.
MAX_ITER = 10000;

/**
 * Index (0 or 1) of the larger of the first two entries of `arr`.
 * When both entries compare equal, index 1 is returned.
 */
function getMax(arr) {
	if (arr[0] <= arr[1]) {
		return 1;
	}
	return 0;
}

/**
 * Index (0 or 1) of the smaller of the first two entries of `arr`.
 * When both entries compare equal, index 1 is returned.
 */
function getMin(arr) {
	if (arr[0] < arr[1]) {
		return 0;
	}
	return 1;
}

## ARS.py
# the standard implementation of ARS

# Importing the libraries
import datetime
import os
import numpy as np
import gym
from gym import wrappers
import pybullet_envs

## XOR_NeuralNetworks_with_Matrix
import numpy as np


def sigmoid(x):
    """Evaluate the logistic function ``1 / (1 + exp(-x))`` at ``x``.

    ``x`` is negated and handed to ``np.exp``, so NumPy arrays are processed
    element-wise and scalars yield a scalar.
    """
    denominator = 1.0 + np.exp(-x)
    return 1.0 / denominator


def sigmoid_prime(x):
    """Return ``sigmoid(x) * (1 - sigmoid(x))``.

    This product is the derivative of the logistic function at ``x``.
    """
    # Evaluate the sigmoid once and reuse it rather than computing it twice.
    activation = sigmoid(x)
    return activation * (1.0 - activation)

## XOR_NeuralNetwork.py
import numpy as np


def sigmoid(x):
    """Evaluate the logistic function ``1 / (1 + exp(-x))`` at ``x``.

    ``x`` is negated and handed to ``np.exp``, so NumPy arrays are processed
    element-wise and scalars yield a scalar.
    """
    denominator = 1.0 + np.exp(-x)
    return 1.0 / denominator


def sigmoid_prime(x):
    """Return ``sigmoid(x) * (1 - sigmoid(x))``.

    This product is the derivative of the logistic function at ``x``.
    """
    # Evaluate the sigmoid once and reuse it rather than computing it twice.
    activation = sigmoid(x)
    return activation * (1.0 - activation)

## GradienDescent.py

def dF(x):
    """Return ``2 * x``.

    NOTE(review): presumably the derivative of F(x) = x**2; F itself is not
    visible in this excerpt -- confirm.
    """
    doubled = 2 * x
    return doubled

# Module-level value 0.9. It shares its name with the `a` parameter of
# gradient_descent_constant_alpha; NOTE(review): presumably the step size
# passed to that function -- the call site is not visible here, confirm.
a = .9

def gradient_descent_constant_alpha(th, a, epsilon):
    """Print the iteration-1 record for the starting point ``th``.

    Evaluates ``dF(th)`` and prints the iteration counter (1), ``th``, ``a``
    and that derivative on one line, with literal comma tokens between them.
    ``epsilon`` is accepted but not used by the code visible here.

    NOTE(review): the name suggests a full descent loop with a constant step
    size ``a``; only this initial step is present -- confirm nothing is missing.
    """
    iteration = 1
    gradient = dF(th)
    print(iteration, ",", th, ", ", a, ", ", gradient)

## DoubleQLearningVsQLearning.py
import numpy as np
import matplotlib.pyplot as plt


# Control variables: change these to customize how the program runs.
cntExperiments= 1001 # number of experiments to run; a larger value means a longer execution time
MAX_ITER = 301      # number of episodes per experiment; a larger value means a longer execution time
ACTIONS_FOR_B = 10  # number of actions at state B

	// NOTE(review): presumably the iteration limit for the simulation (going by
	// the name); the code that reads it is not visible in this excerpt -- confirm.
	MAX_ITER = 10000;

	/**
	 * Index (0 or 1) of the larger of the first two entries of `arr`.
	 * When both entries compare equal, index 1 is returned.
	 */
	function getMax(arr) {
		if (arr[0] <= arr[1]) {
			return 1;
		}
		return 0;
	}

	/**
	 * Index (0 or 1) of the smaller of the first two entries of `arr`.
	 * When both entries compare equal, index 1 is returned.
	 */
	function getMin(arr) {
		if (arr[0] < arr[1]) {
			return 0;
		}
		return 1;
	}
	# the standard implementation of ARS

	# Importing the libraries
	import datetime
	import os
	import numpy as np
	import gym
	from gym import wrappers
	import pybullet_envs
	import numpy as np


	def sigmoid(x):
		"""Evaluate the logistic function ``1 / (1 + exp(-x))`` at ``x``.

		``x`` is negated and handed to ``np.exp``, so NumPy arrays are
		processed element-wise and scalars yield a scalar.
		"""
		# The body must be indented under the ``def``; at the same column it
		# is an IndentationError.
		return 1.0 / (1.0 + np.exp(-x))


	def sigmoid_prime(x):
		"""Return ``sigmoid(x) * (1 - sigmoid(x))``.

		This product is the derivative of the logistic function at ``x``.
		"""
		# Body indented under the ``def`` (it was at the same column, which
		# does not parse). The sigmoid is evaluated once and reused.
		activation = sigmoid(x)
		return activation * (1.0 - activation)

	def dF(x):
		"""Return ``2 * x``.

		NOTE(review): presumably the derivative of F(x) = x**2; F itself is
		not visible in this excerpt -- confirm.
		"""
		# Body indented under the ``def``; at the same column it does not parse.
		return 2 * x

	# Value 0.9. It shares its name with the `a` parameter of
	# gradient_descent_constant_alpha; NOTE(review): presumably the step size
	# passed to that function -- the call site is not visible here, confirm.
	a = .9

	def gradient_descent_constant_alpha(th, a, epsilon):
		"""Print the iteration-1 record for the starting point ``th``.

		Evaluates ``dF(th)`` and prints the iteration counter (1), ``th``,
		``a`` and that derivative on one line, with literal comma tokens
		between them. ``epsilon`` is accepted but not used by the code
		visible here.

		NOTE(review): the name suggests a full descent loop with a constant
		step size ``a``; only this initial step is present -- confirm nothing
		is missing.
		"""
		# Body indented under the ``def``; at the same column it does not parse.
		i = 1
		deriv = dF(th)
		print(i,",", th, ", ", a, ", ", deriv)
	import numpy as np
	import matplotlib.pyplot as plt


	# Control variables: change these to customize how the program runs.
	cntExperiments= 1001 # number of experiments to run; a larger value means a longer execution time
	MAX_ITER = 301 # number of episodes per experiment; a larger value means a longer execution time
	ACTIONS_FOR_B = 10 # number of actions at state B