rymate1234/ai.lua

## ai.lua
----------------------------------------------------------------------------------------------------------------------------------------------------
--Super Mario Bros.
--Neural Network Learning
--by Michael Roberts
--06/2015
--
--Use with FCEUX v2.2.2


----------------------------------------------------------------------------------------------------------------------------------------------------
--RAM Addresses for variables
----------------------------------------------------------------------------------------------------------------------------------------------------

saveState = savestate.object(1)
savestate.save(saveState)

RamNametableHi = 0x20
RamNametableLow = 0x01
RamNametableSize = 0x2BF
RamNametableSolidStart = 0x01

--Screen attributes
RamObjectMapStart = 0x500
MapTileNum = 208

--Player attributes
RamPlayerX = 0x86
RamPlayerY = 0x3B8
RamPlayerScreenX = 0x6D
RamLives = 0x75A
RamCoins = 0x75E

--Game attributes
RamWorld = 0x75F
RamLevel = 0x760
--Score
RamScoreDigit1 = 0x7D8 --10^5
RamScoreDigit2 = 0x7D9 --10^4
RamScoreDigit3 = 0x7DA --10^3
RamScoreDigit4 = 0x7DB --10^2
RamScoreDigit5 = 0x7DC --10^1

TimeDigit1 = 0x07F8
TimeDigit2 = 0x07F9
TimeDigit3 = 0x07FA

--Enemy attributes
RamEnemyX = 0x87	--starting address in memory for multiple enemies
RamEnemyY = 0xCF
RamEnemyScreenX = 0x6E
EnemyNumSlots = 5
RamEnemyFlag = 0xF	--In Zelda, it's enemy direction used as flag

--Projectile attributes
--RamProjectileX = 0x87	--starting address in memory for multiple enemies
--RamProjectileY = 0xCF
--RamProjectileScreenX = 0x6E
--ProjectileNumSlots = 5
--RamProjectileFlag = 0xF	--In Zelda, it's enemy direction used as flag


------------------------------------------------------------------------------------------------------------------------------------------------------

--timer = 40
index = 1
--AReady = true
--BReady = true
vblankFlag = 0
vblankOff = 0
--PPU2002 = {}

generation = 1
fitness = 0
maxFitness = 0
startFitness = 0

timeStuck = 0
maxStuckTime = 1000 --220
medStuckTime = maxStuckTime / 2 --220
lastX = 0
lastY = 0
lastLives = 0
timerHold = 0
lastScreen = 0
screenTimeStuck = 0
maxScreenStuckTime = maxStuckTime

playerX = 0
playerY = 0
playerRoomX = 0
playerRoomY = 0
playerMapX = 0
playerMapY = 0
playerLives = 0
playerScore = 0
currentTime = 0
lastTime = 0

resetGame = 0


room = {}
map = {}
for i=1,2*MapTileNum do
	map[i] = 0
end


enemyX = {}
enemyY = {}
enemyRoomX = {}
enemyRoomY = {}
enemyMapX = {}
enemyMapY = {}
enemyDir = {}
projectileX = {}
projectileY = {}
projectileRoomX = {}
projectileRoomY = {}


drawRoom = false
drawMap = false
drawView = false
drawCoord = true
drawNeurons = false
drawWeights = false
drawController = false
drawPopulation = true

viewRadius = 7
viewDiameter = 2*viewRadius+1

viewBox = {}
for i=1,viewDiameter*viewDiameter do
	viewBox[i] = 0
end


inputNum = viewDiameter*viewDiameter + 1
outputNum = 6	--6 buttons on the controller
layerNum = 2
layerSize = {inputNum,  12, outputNum}
--layerSize array has layerNum+1 entries. (inputNum layer is counted as layer 0)

populationSize = 25

populationFitness = {}
for i=1, populationSize do
	populationFitness[i] = nil
end
currentChild = 1
currentParent1 = 0
currentParent2 = 0
mutationProbability = .05
meanFitness = 0
stdvFitness = 0


inputViewNum = MapTileNum	--this is the number of inputs to X that are from the view or map

--inputSigmoidStrength = 4.394/inputNum
--hiddenSigmoidStrength = 4.394/layerSize
outputStepStrength = 0 --layerSize/4
--sigmoid strength = 4ln3/N    --4ln3 = 4.394
--where N=number of neurons input into current layer being calculated.

--X[1][] = input
--X[layerNum+1][] = output
--Y = output bool
--
--S[l] = W[l]*X[l-1]
--X[l] = f(S[l])
--f is shaping function (tanh)

Y = {}
for i=1, outputNum do
	Y[i] = false
end

X = {}
S = {}
delta = {}
for l=1,layerNum+1 do
	X[l] = {}
	S[l] = {}
	delta[l] = {}
	for i=1, layerSize[l] do
		X[l][i] = 0
		S[l][i] = 0
		delta[l][i] = 0
	end
end


W = {}
memW = {}
for p=1, populationSize do
	W[p] = {}
	for l=1,layerNum do
		W[p][l] = {}
		memW[l] = {}
		for i=1,layerSize[l+1] do
			W[p][l][i] = {}
			memW[l][i] = {}
			for j=1,layerSize[l] do
				W[p][l][i][j] = 2*math.random() - 1 --math.random(3)-2
				memW[l][i][j] = W[p][l][i][j]
			end
		end
	end
end

--Training parameters

--trainingMode = 1 -> begin in training mode. 0 is game running mode
geneticMode = true
trainingMode = false

recordMode = 1
keyPressReady = true

randomChangeSize = .1
stepSize = .1
sampleRate = 100
sampleTimer = 0
controllerInput = {}
errorVal = 0

Y_Train = {}
for i=1, outputNum do
	Y_Train[i] = 0
end


--------------------------------------------------------------------------------------------------------------------------------------------
--Functions
--------------------------------------------------------------------------------------------------------------------------------------------

function readPPU()
	memory.writebyte(0x2006, RamNametableHi)
	memory.writebyte(0x2006, RamNametableLow)
	j=1
	for i=0,RamNametableSize do
		local val = memory.readbyte(0x2007)
		room[i+1] = val

		if (math.floor(i/32))%2 == 0 then
		if i%2 == 0 then
			map[j] = val
			j = j+1
		end
		end

		--if val <= RamNametableSolidStart then
		--	room[i+1] = 0
		--else
		--	room[i+1] = 1
		--end
	end
end


function inputView()
	for i = -viewRadius, viewRadius do
	for j = -viewRadius, viewRadius do
		local x = playerMapX+i-1
		local y = playerMapY+j-1
		local page = math.floor(x/16)
		local xAddress = x - 16*page+1
		local yAddress = y + 13*(page%2)
		if xAddress >= 1 and xAddress < 32 and yAddress >= 1 and yAddress <= 25 then
			viewBox[(i+viewRadius+1)+viewDiameter*(j+viewRadius)] = map[xAddress + 16*yAddress]
		else
			viewBox[(i+viewRadius+1)+viewDiameter*(j+viewRadius)] = 0
		end
	end
	end
end


function inputMap()
	for i=1, 2*MapTileNum do
		if memory.readbyte(0x500 + i-1) ~= 0 then
            if memory.readbyte(0x500 + i-1) == 193 then
                map[i] = 2
            elseif memory.readbyte(0x500 + i-1) == 192 then
                map[i] = 2
            elseif memory.readbyte(0x500 + i-1) <= 21 and memory.readbyte(0x500 + i-1) >= 18 then
                map[i] = 3
            else
			    map[i] = 1
            end
		else
			map[i] = 0
		end
	end

	for i=1, EnemyNumSlots do
		if memory.readbyte(RamEnemyFlag+(i-1)) ~= 0 then
			local page = math.floor(enemyMapX[i]/16)
			local xAddress = enemyMapX[i] - 16*page
			local yAddress = enemyMapY[i] - 1 + 13*(page%2)
			if xAddress >= 1 and xAddress < 32 and yAddress >= 1 and yAddress <= 25 then
				map[xAddress + 16*yAddress] = -1
			end
		end
	end
end


function inputPlayer()
	playerX = memory.readbyte(RamPlayerX) + memory.readbyte(RamPlayerScreenX)*0x100 + 4
	playerY = memory.readbyte(RamPlayerY) + 16
	playerRoomX = math.floor(playerX/8)+1
	playerRoomY = math.floor(playerY/7.5)-7
	playerMapX = math.floor((playerX%512)/16)+1
	playerMapY = math.floor((playerY-32)/16)+1
	playerScore = (memory.readbyte(RamScoreDigit1)*10^5)+(memory.readbyte(RamScoreDigit2)*10^4)+(memory.readbyte(RamScoreDigit3)*10^3)+(memory.readbyte(RamScoreDigit4)*10^2)+(memory.readbyte(RamScoreDigit5)*10^1)
    currentTime = (memory.readbyte(TimeDigit1)*10^2)+(memory.readbyte(TimeDigit2)*10^1)+(memory.readbyte(TimeDigit3))
end


function inputEnemies()
	for i=1,EnemyNumSlots do
		if memory.readbyte(RamEnemyFlag+(i-1)) ~= 0 then
			enemyX[i] = memory.readbyte(RamEnemyX+(i-1)) + memory.readbyte(RamEnemyScreenX+(i-1))*0x100
			enemyY[i] = memory.readbyte(RamEnemyY+(i-1)) + 24
		else
			enemyX[i] = -1
			enemyY[i] = -1
		end
		enemyRoomX[i] = math.floor(enemyX[i]/8)+1
		enemyRoomY[i] = math.floor(enemyY[i]/7.5)-7
		enemyMapX[i] = math.floor((enemyX[i]%512)/16)+1
		enemyMapY[i] = math.floor((enemyY[i]-32)/16)
	end
	--for i=1,ProjectileNumSlots do
	--	if memory.readbyte(RamProjectileFlag-(i-1)) ~= 0 then
	--		projectileX[i] = memory.readbyte(RamProjectileX-(i-1))
	--		projectileY[i] = memory.readbyte(RamProjectileY-(i-1))
	--	else
	--		projectileX[i] = -1
	--		projectileY[i] = -1
	--	end
	--	projectileRoomX[i] = math.floor(projectileX[i]/8)
	--	projectileRoomY[i] = math.floor(projectileY[i]/7.5)
	--end
end


function inputViewToX(startPosition)
	for i=1,(viewDiameter)*(viewDiameter) do
		X[1][startPosition-1+i] = viewBox[i]
	end
end


function inputMapToX(startPosition)
	for i=1,MapTileNum do
		if map[i] <= RamNametableSolidStart then
			X[1][startPosition-1+i] = 0
		else
			X[1][startPosition-1+i] = 1
		end
	end
end


function inputCoordToX(startPosition)
	X[1][startPosition] = playerMapX/32
	X[1][startPosition+1] = playerMapY/13
	--X[1][startPosition+2] = playerHealth
end


function inputEnemyToX(startPosition)
	for i=0,EnemyNumSlots-1 do
		X[1][startPosition+2*i] = enemyMapX[i+1]/32
		X[1][startPosition+2*i+1] = enemyMapY[i+1]/13
	end
	--for i=0,ProjectileNumSlots-1 do
	--	X[1][startPosition+2*i+14] = projectileX[i+1]/256
	--	X[1][startPosition+2*i+15] = projectileY[i+1]/240
	--end
end


function inputNoise(val)
	for i=1,inputNum do
		X[1][i] = X[1][i] + val*(2*math.random()-1)
		if X[1][i] > 1 then
			X[1][i] = 1
		end
		if X[1][i] < -1 then
			X[1][i] = -1
		end
	end
end


function drawGui()
	local mapDrawX = -8
	local mapDrawY = 0
	local mapScale = 8
	local viewDrawX = 56
	local viewDrawY = 56
	local neuronDrawSpacing = 32
	local neuronVerticalSpacing = 4
	local controllerDrawX = 176
	local controllerDrawY = 48 --200
	local drawNeuronsX = 88

	if drawRoom == true then
		for i=0,RamNametableSize do
			local x = i%32
			local y = math.floor(i/32)
			if tunicColor%2 == 0 then
				gui.text(x*8, 64+y*8, room[i+1]%16)
			else
				gui.text(x*8, 64+y*8, math.floor(room[i+1]/16))
			end
			--if room[i+1] <= 0x77 then
			--	gui.box(mapDrawX+x*mapScale, mapDrawY+y*mapScale, mapDrawX+x*mapScale+mapScale, mapDrawY+y*mapScale+mapScale, "black")
			--else
			--	gui.box(mapDrawX+x*mapScale, mapDrawY+y*mapScale, mapDrawX+x*mapScale+mapScale, mapDrawY+y*mapScale+mapScale, "blue")
			--end
		end
		gui.box(mapDrawX+playerMapX*mapScale, mapDrawY+mapScale*(playerMapY-8), mapDrawX+mapScale*(playerMapX+1.5), mapDrawY+mapScale*(playerMapY-6.5), "green")
		for i=1,EnemyNumSlots do
			if enemyX[i] ~= -1 then
				gui.box(mapDrawX+enemyRoomX[i]*mapScale, mapDrawY+mapScale*(enemyRoomY[i]-8), mapDrawX+mapScale*(enemyRoomX[i]+1.5), mapDrawY+mapScale*(enemyRoomY[i]-6.5), "red")
			end
		end
		--for i=1,ProjectileNumSlots do
		--	if projectileX[i] ~= -1 then
		--		gui.box(mapDrawX+projectileRoomX[i]*mapScale, mapDrawY+mapScale*(projectileRoomY[i]-8), mapDrawX+mapScale*(projectileRoomX[i]+1), mapDrawY+mapScale*(projectileRoomY[i]-7), "red")
		--	end
		--end
	end

	if drawMap == true then
	--gui.box(0,0,256,240,"black")
		for i=0,2*MapTileNum-1 do
			local x = 16*math.floor(i/208) + i%16 + 1
			local y = math.floor(i/16) - 13*math.floor(i/208) + 1
			--local x = i%16 + 1 -- + 16*(i%208)
			--local y = math.floor(i/16) + 1 - 13*(i%208)
			--gui.text(mapDrawX+x*16, mapDrawY++y*16, map[i+1]%16)
			if map[i+1] == 0 then
				gui.box(mapDrawX+x*mapScale, mapDrawY+y*mapScale, mapDrawX+(x+1)*mapScale-1, mapDrawY+(y+1)*mapScale-1, "black")
			elseif map[i+1] == 1 then
				gui.box(mapDrawX+x*mapScale, mapDrawY+y*mapScale, mapDrawX+(x+1)*mapScale-1, mapDrawY+(y+1)*mapScale-1, "blue")
            elseif map[i+1] == 2 then
				gui.box(mapDrawX+x*mapScale, mapDrawY+y*mapScale, mapDrawX+(x+1)*mapScale-1, mapDrawY+(y+1)*mapScale-1, "cyan")
			elseif map[i+1] == 3 then
				gui.box(mapDrawX+x*mapScale, mapDrawY+y*mapScale, mapDrawX+(x+1)*mapScale-1, mapDrawY+(y+1)*mapScale-1, "#458B00")
			elseif map[i+1] == -1 then
				gui.box(mapDrawX+x*mapScale, mapDrawY+y*mapScale, mapDrawX+(x+1)*mapScale-1, mapDrawY+(y+1)*mapScale-1, "red")
			end
		end
		gui.box(mapDrawX+playerMapX*mapScale, mapDrawY+mapScale*playerMapY, mapDrawX+mapScale*(playerMapX+1)-1, mapDrawY+mapScale*(playerMapY+1)-1, "green")
		gui.box(mapDrawX+(playerMapX-viewRadius)*mapScale, mapDrawY+mapScale*(playerMapY-viewRadius), mapDrawX+(playerMapX+viewRadius+1)*mapScale, mapDrawY+mapScale*(playerMapY+viewRadius+1), "clear", "white")
		--Draw enemies on map. Replaced by inputing enemies into map[i] as -1 values
		--for i=1,EnemyNumSlots do
		--	if enemyX[i] ~= -1 then
		--		gui.box(mapDrawX+enemyMapX[i]*mapScale, mapDrawY+mapScale*enemyMapY[i], mapDrawX+mapScale*(enemyMapX[i]+1)-1, mapDrawY+mapScale*(enemyMapY[i]+1)-1, "red")
		--	end
		--end
		--for i=1,4 do
		--	if projectileX[i] ~= -1 then
		--		gui.box(mapDrawX+projectileRoomX[i]*mapScale, mapDrawY+mapScale*(projectileRoomY[i]-8), mapDrawX+mapScale*(projectileRoomX[i]+1), mapDrawY+mapScale*(projectileRoomY[i]-7), "red")
		--	end
		--end
	end

	if drawView == true then
		for i=1,viewDiameter*viewDiameter do
			local x = (i-1)%viewDiameter - viewRadius
			local y = math.floor((i-1)/viewDiameter) - viewRadius
			if viewBox[i] == 1 then
				gui.box(viewDrawX+8*x, viewDrawY+8*y, viewDrawX+8*(x+1)-1, viewDrawY+8*(y+1)-1, "blue")
			elseif viewBox[i] == 0 then
				gui.box(viewDrawX+8*x, viewDrawY+8*y, viewDrawX+8*(x+1)-1, viewDrawY+8*(y+1)-1, "black")
			elseif viewBox[i] == -1 then
				gui.box(viewDrawX+8*x, viewDrawY+8*y, viewDrawX+8*(x+1)-1, viewDrawY+8*(y+1)-1, "red")
			end
		end
		gui.box(viewDrawX, viewDrawY, viewDrawX+8-1, viewDrawY+8-1, "green")
	end

	if drawCoord == true then
		gui.text(192,8,playerX)
		gui.text(224,8,playerY)
		gui.text(192,16,playerMapX)
		gui.text(224,16,playerMapY)
		--gui.text(168,48,playerHealth)
	end

	if drawNeurons == true then
		for l=1,layerNum+1 do
			local layerDrawSpacing = (neuronVerticalSpacing*inputNum) / layerSize[l]
			for i=1, layerSize[l] do
				if X[l][i] >= -0.5 and X[l][i] <= 0.5 then
					gui.box(drawNeuronsX+neuronDrawSpacing*(l-1), 10+(i-1)*layerDrawSpacing, drawNeuronsX+3+neuronDrawSpacing*(l-1), 10+i*layerDrawSpacing, "gray", "black")
				elseif X[l][i] > 0.5 then
					gui.box(drawNeuronsX+neuronDrawSpacing*(l-1), 10+(i-1)*layerDrawSpacing, drawNeuronsX+3+neuronDrawSpacing*(l-1), 10+i*layerDrawSpacing, "green", "black")
				elseif X[l][i] < -0.5 then
					gui.box(drawNeuronsX+neuronDrawSpacing*(l-1), 10+(i-1)*layerDrawSpacing, drawNeuronsX+3+neuronDrawSpacing*(l-1), 10+i*layerDrawSpacing, "red", "black")
				end
			end
		end
	end

	if drawController == true then
		gui.box(controllerDrawX-1, controllerDrawY-1, controllerDrawX+64, controllerDrawY+24, "black")
		--A
		if Y[1] == true then
			gui.box(controllerDrawX+56, controllerDrawY+8, controllerDrawX+63, controllerDrawY+15, "blue")
		else
			gui.box(controllerDrawX+56, controllerDrawY+8, controllerDrawX+63, controllerDrawY+15, "gray")
		end
		--up
		if Y[2] == true then
			gui.box(controllerDrawX+8, controllerDrawY, controllerDrawX+15, controllerDrawY+7, "blue")
		else
			gui.box(controllerDrawX+8, controllerDrawY, controllerDrawX+15, controllerDrawY+7, "gray")
		end
		--left
		if Y[3] == true then
			gui.box(controllerDrawX, controllerDrawY+8, controllerDrawX+7, controllerDrawY+15, "blue")
		else
			gui.box(controllerDrawX, controllerDrawY+8, controllerDrawX+7, controllerDrawY+15, "gray")
		end
		--B
		if Y[4] == true then
			gui.box(controllerDrawX+40, controllerDrawY+8, controllerDrawX+47, controllerDrawY+15, "blue")
		else
			gui.box(controllerDrawX+40, controllerDrawY+8, controllerDrawX+47, controllerDrawY+15, "gray")
		end
		--right
		if Y[5] == true then
			gui.box(controllerDrawX+16, controllerDrawY+8, controllerDrawX+23, controllerDrawY+15, "blue")
		else
			gui.box(controllerDrawX+16, controllerDrawY+8, controllerDrawX+23, controllerDrawY+15, "gray")
		end
		--down
		if Y[6] == true then
			gui.box(controllerDrawX+8, controllerDrawY+16, controllerDrawX+15, controllerDrawY+23, "blue")
		else
			gui.box(controllerDrawX+8, controllerDrawY+16, controllerDrawX+15, controllerDrawY+23, "gray")
		end
	end

	if drawWeights == true then
		for l=1,layerNum do
		local layerInSpacing = (neuronVerticalSpacing*inputNum) / layerSize[l]
		local layerOutSpacing = (neuronVerticalSpacing*inputNum) / layerSize[l+1]
			for i=1,layerSize[l+1] do
			for j=1,layerSize[l] do
				if W[currentChild][l][i][j] >= .6 then
					gui.line(drawNeuronsX+3+neuronDrawSpacing*(l-1), 10+(j-.5)*layerInSpacing, drawNeuronsX-1+neuronDrawSpacing*l, 10+(i-.5)*layerOutSpacing, {0,0,255,48})
				end
				if W[currentChild][l][i][j] <= -.6 then
					gui.line(drawNeuronsX+3+neuronDrawSpacing*(l-1), 10+(j-.5)*layerInSpacing, drawNeuronsX-1+neuronDrawSpacing*l, 10+(i-.5)*layerOutSpacing, {255,0,0,48})
				end
			end
			end
		end
	end

	if drawPopulation == true then
		if currentParent1 > 0 then
			gui.box(4, 8*currentParent1, 10, 8*(currentParent1+1)-2, "blue")
		end
		if currentParent2 > 0 then
			gui.box(4, 8*currentParent2, 10, 8*(currentParent2+1)-2, "blue")
		end
		gui.box(4, 8*currentChild, 10, 8*(currentChild+1)-2, "green")
		for i=1, populationSize do
			if populationFitness[i] ~= nil then
				gui.text(12, 8*i, populationFitness[i])
			end
		end
	end
end


function multiply(matrixIn, vectorIn, rows, collumns)
	local vectorOut = {}

	for i=1,rows do
			vectorOut[i] = 0
			for j=1,collumns do
				vectorOut[i] = vectorOut[i] + matrixIn[i][j]*vectorIn[j]
			end
	end

	return vectorOut
end


function sigmoid(inputVector, inputLength, strength)
	local vectorOut = {}
	for i=1,inputLength do
		vectorOut[i] = 2/(1+math.exp(-strength*inputVector[i])) - 1
	end
	return vectorOut
end


function tanh(inputVector, inputLength)
	local vectorOut = {}
	for i=1,inputLength do
		vectorOut[i] = (math.exp(inputVector[i]) - math.exp(-inputVector[i])) / (math.exp(inputVector[i]) + math.exp(-inputVector[i]))
	end
	return vectorOut
end


function stepFunction(inputVector, inputLength)
	local vectorOut = {}
	for i=1,inputLength do
		if inputVector[i] >= outputStepStrength then
			vectorOut[i] = true
		else
			vectorOut[i] = false
		end
	end
	return vectorOut
end


function doublePressNegate(button1, button2)
	if Y[button1] == true and Y[button2] == true then
		if X[layerNum+1][button1] > X[layerNum+1][button2] then
			Y[button2] = false
		else
			Y[button1] = false
		end
	end
end


function outputToController()
	local controllerInput = {}
	controllerInput = {A=Y[1], up=Y[2], left=Y[3], B=Y[4], select=nil, right=Y[5], down=Y[6], start=nil}
	joypad.write(1, controllerInput)
end


function controllerOverride()
	local controllerInput = {}
	controllerInput = joypad.read(1)
	Y[1] = controllerInput["A"]
	Y[2] = controllerInput["up"]
	Y[3] = controllerInput["left"]
	Y[4] = controllerInput["B"]
	Y[5] = controllerInput["right"]
	Y[6] = controllerInput["down"]
end


function updateWeightsFromMem()
	for l=1,layerNum do
		for i=1,layerSize[l+1] do
		for j=1,layerSize[l] do
			--if math.random() < stepSize then
			--	W[l][i][j] = (memW[l][i][j] + 2)%3 - 1
			--else
			--	W[l][i][j] = memW[l][i][j]
			--end

			W[currentChild][l][i][j] = memW[l][i][j] + randomChangeSize*(2*math.random() - 1)

			--if W[i][j][k] > 1 then
			--	W[i][j][k] = 1
			--end
			--if W[i][j][k] < -1 then
			--	W[i][j][k] = -1
			--end
		end
		end
	end
end


function updateWeightsRandom()
	for l=1,layerNum do
		for i=1,layerSize[l+1] do
		for j=1,layerSize[l] do
			W[currentChild][l][i][j] = 2*math.random() - 1 --math.random(3)-2
			memW[l][i][j] = W[currentChild][l][i][j]
		end
		end
	end
end


function updateMemWeights()
	for l=1,layerNum do
		for i=1,layerSize[l+1] do
		for j=1,layerSize[l] do
			memW[l][i][j] = W[currentChild][l][i][j]
		end
		end
	end
end


function restartOld()
	if fitness > maxFitness then
		maxFitness = fitness
		updateMemWeights()
	end

	updateWeightsFromMem()

	if fitness <= minFitness then
	if maxFitness <= minFitness then
		updateWeightsRandom()
	end
	end

	generation = generation + 1
	fitness = 0
	timeStuck = 0

	savestate.load(saveState)

	inputPlayer()
	inputMap()
	inputView()
end


function inputController()
	--controllerInput = {A=true, up=false, left=false, B=false, select=nil, right=false, down=false, start=nil}
	controllerInput = joypad.read(1)
	for i=1, outputNum do
		Y_Train[i] = 0
	end
	if controllerInput["A"] == true then
		Y_Train[1] = 1
	end
	if controllerInput["up"] == true then
		Y_Train[2] = 1
	end
	if controllerInput["left"] == true then
		Y_Train[3] = 1
	end
	if controllerInput["B"] == true then
		Y_Train[4] = 1
	end
	if controllerInput["right"] == true then
		Y_Train[5] = 1
	end
	if controllerInput["down"] == true then
		Y_Train[6] = 1
	end

	if controllerInput["select"] == true then
		trainingMode = false

		timeStuck = 0
		screenTimeStuck = 0

		savestate.load(saveState)

		inputPlayer()
		inputEnemies()
		inputMap()
		inputView()
		fitness = playerX
	end
	if controllerInput["up"] == true and keyPressReady == true then
		recordMode = (recordMode+1)%2
		keyPressReady = false
	end
	if controllerInput["up"] == false then
		keyPressReady = true
	end
end


function forwardPropogate()
	X[1][1] = -1
	for l=1, layerNum do
		S[l+1] = multiply(W[currentChild][l], X[l], layerSize[l+1], layerSize[l])
		X[l+1] = tanh(S[l+1], layerSize[l+1])
		if l < layerNum then
			X[l+1][1] = -1
		end
	end
	Y = stepFunction(X[layerNum+1], outputNum)

	--make it so up/down etc. can't be hit at same time
	doublePressNegate(3,5)
	doublePressNegate(2,6)
	doublePressNegate(5,6)
	doublePressNegate(2,5)
	doublePressNegate(3,6)
end


function backPropogate()
	for i=1, outputNum do
		delta[layerNum+1][i] = (1-X[layerNum+1][i]*X[layerNum+1][i]) * (X[layerNum+1][i] - Y_Train[i])
	end

	for l=1, layerNum-2 do
		for j=1, layerSize[layerNum-l] do
			local matrixProduct = 0
			for k=1, layerSize[layerNum-l+1] do
				emu.print(l)
				emu.print(W[layerNum-l][k][j][l])
				emu.print(W[layerNum-l][k][j])
				emu.print("Delta: " .. delta[layerNum-l+1][k])
				matrixProduct = matrixProduct + W[layerNum-l][k][j][layerNum] * delta[layerNum-l+1][k]
			end
			delta[layerNum-l][j] = (1 - X[layerNum-l][j]*X[layerNum-l][j]) * matrixProduct
		end
	end
end


function batchGradientDescent()
	for l=1, layerNum do
		for i=1, layerSize[l+1] do
		for j=1, layerSize[l] do

	--l = math.random(layerNum)
	--i = math.random(layerSize[l+1])
	--j = math.random(layerSize[l])
			W[currentChild][l][i][j] = W[currentChild][l][i][j] - stepSize * delta[l+1][i] * X[l][j]
		end
		end
	end
end


function restart()
	fitness = round(fitness, 0)
	generation = generation + 1/populationSize
	if populationFitness[currentChild] == nil then
		populationFitness[currentChild] = fitness
	elseif fitness > populationFitness[currentChild] then
		populationFitness[currentChild] = fitness
	end


	if #populationFitness < populationSize then
		currentChild = currentChild + 1
	else
		currentChild = minimum(populationFitness)
		if math.random() <= .5 then
			currentParent1 = maximum(populationFitness)
			if currentParent1 == currentChild then
				currentParent1 = math.random(populationSize-1)
				if currentParent1 >= currentChild then
					currentParent1 = currentParent1+1
				end
			end
		else
			currentParent1 = math.random(populationSize-1)
			if currentParent1 >= currentChild then
				currentParent1 = currentParent1+1
			end
		end
		currentParent2 = math.random(populationSize-2)
		if currentParent2 >= currentChild then
			currentParent2 = currentParent2+1
		end
		if currentParent2 >= currentParent1 then
			currentParent2 = currentParent2+1
		end
		if currentParent2 == currentChild then
			currentParent2 = currentParent2+1
		end

		meanFitness = mean(populationFitness)
		stdvFitness = standardDev(populationFitness)
		if stdvFitness <= meanFitness/6 then
			uniformCrossover(mutationProbability*2)
		else
			uniformCrossover(mutationProbability)
		end
	end

	timeStuck = 0
	screenTimeStuck = 0
	fitness = 0
	savestate.load(saveState)
	inputPlayer()
	startFitness = playerX
end


function minimum(vectorIn)
	local val = vectorIn[1]
	local index = 1
	for i=1, #vectorIn do
		if vectorIn[i] < val then
			index = i
			val = vectorIn[i]
		end
	end
	return index
end


function maximum(vectorIn)
	local val = vectorIn[1]
	local index = 1
	for i=1, #vectorIn do
		if vectorIn[i] > val then
			index = i
			val = vectorIn[i]
		end
	end
	return index
end


function uniformCrossover(probability)
	for l=1, layerNum do
		for i=1, layerSize[l+1] do
		for j=1, layerSize[l] do
			if math.random() < probability then
				W[currentChild][l][i][j] = 2*math.random()-1
			else
				if math.random() <=0.5 then
					W[currentChild][l][i][j] = W[currentParent1][l][i][j]
				else
					W[currentChild][l][i][j] = W[currentParent2][l][i][j]
				end
			end
		end
		end
	end
end


function mean(arrayIn)
	local sum = 0
	--if #arrayIn > 0 then
		for i=1, #arrayIn do
			sum = sum + arrayIn[i]
		end
		return sum / #arrayIn
	--else
	--	return 0
	--end
end


function standardDev(arrayIn)
	local sum = 0
	local stdv = 0
	local meanVal = mean(arrayIn)
	--if #arrayIn > 1 then
		for i=1, #arrayIn do
			sum = sum + (arrayIn[i] - meanVal) * (arrayIn[i] - meanVal)
		end
		stdv = math.sqrt(sum / (#arrayIn-1))
		return stdv
	--else
	--	return 0
	--end
end


function round(num, idp)
  local mult = 10^(idp or 0)
  return math.floor(num * mult + 0.5) / mult
end

------------------------------------------------------------------------------------------------------------------------------------------------------------
--Main Code
------------------------------------------------------------------------------------------------------------------------------------------------------------


inputPlayer()
lastX = playerX
lastY = playerY
lastScreen = memory.readbyte(RamPlayerScreenX)
startFitness = playerX
playerLives = memory.readbyte(RamLives)
lastLives = playerLives
lastScore = playerScore

while (true) do

	--read PPU only when changing rooms
	--vblankFlag = memory.readbyte(0xE3)
	--if vblankFlag == 1 then
	--	vblankOff = 1
	--elseif vblankOff == 1 then
	--	readPPU()
	--	vblankOff = 0
	--end

	inputPlayer()
	inputEnemies()
	inputMap()
	inputView()


	index = 2	--first neuron slot is for constant X[1] = 1
	inputViewToX(index)
	index = index + viewDiameter*viewDiameter

	--inputCoordToX(index)
	--index = index + 2

	--inputEnemyToX(index)
	--index = index + 2*EnemyNumSlots

	--inputNoise(.1)

	forwardPropogate()

	if lastScore < playerScore then
		fitness = fitness + ((playerScore - lastScore) / 2)
	end

	if lastX < playerX then
		fitness = fitness + (playerX - lastX)
	elseif lastX > playerX then
		fitness = fitness - 1
	end

	if trainingMode == true then
		inputController()
		if recordMode == 1 then
			sampleTimer = sampleTimer + 1
			if sampleTimer >= sampleRate then
				sampleTimer = 0
				backPropogate()
				batchGradientDescent()

				errorVal = 0
				for i=1, 6 do
					errorVal = errorVal + ((X[layerNum+1][i] - Y_Train[i])*(X[layerNum+1][i] - Y_Train[i]))/2
				end
			end
			-- gui.text(0,8,errorVal)
			--outputToController()
		end
	else
		outputToController()
		--timeStuck = 0
		--screenTimeStuck = 0

		-- fitness += playerX - startFitness + playerScore --player score increases fitness

		if timerHold == 0 then
			if math.abs(playerX - lastX) < 2 then
				timeStuck = timeStuck + 1
			else
				timeStuck = 0
			end
			if memory.readbyte(RamPlayerScreenX) == lastScreen then
				screenTimeStuck = screenTimeStuck + 1
			else
				screenTimeStuck = 0
			end
		end

		if (fitness < -500 or timeStuck > maxStuckTime or screenTimeStuck > maxScreenStuckTime) then
			if geneticMode == true then
				emu.print(fitness)
				restart()
				resetGame = 0
			else
				restartOld()
			end
		end

		playerLives = memory.readbyte(RamLives)
		if lastLives ~= playerLives then
			--timerHold = 200
			--timeStuck = 0
			--screenTimeStuck = 0
			if playerLives == 255 then
				savestate.load(saveState)
				restart()
                fitness = 0
			elseif playerLives < 2 then
                emu.print("lives left: "  .. playerLives .. " last lives: " .. lastLives)
                fitness = fitness - 200
                screenTimeStuck = 0
                timeStuck = 0
                timerHold = 0
			end

		end

		if timerHold > 0 then
			timerHold = timerHold - 1
		end

		--Cause seizures if he sits still for too long
		if timeStuck >= medStuckTime then
			inputNoise(1)
		end

        if (currentTime < lastTime) then
            emu.print(currentTime)
            fitness = fitness - 1
        end
	end

	drawGui()

	gui.text(220, 8, math.floor(generation))
	gui.text(48, 8, fitness)
	--gui.text(48, 16, startFitness)
	--gui.text(48, 24, timerHold)
	--gui.text(64, 24, timeStuck)
	gui.text(48, 16, math.floor(meanFitness))
	--gui.text(48, 24, math.floor(stdvFitness))


	lastX = playerX
	lastY = playerY
	lastScreen = memory.readbyte(RamPlayerScreenX)
	lastLives = playerLives
	lastScore = playerScore
   	lastTime = currentTime

	emu.frameadvance()

end

------------------------------------------------------------------------------------------------------------------------------------------------------------