70 lines
No EOL
1.5 KiB
Python
Executable file
70 lines
No EOL
1.5 KiB
Python
Executable file
#!/usr/bin/env python
|
|
import sys
|
|
import numpy as np
|
|
|
|
# Import snake game
|
|
from snake import Snake
|
|
|
|
|
|
|
|
# Setup QTable
|
|
# Boolean features:
|
|
# Snake go up?
|
|
# Snake go right?
|
|
# Snake go down?
|
|
# Snake go left?
|
|
# Apple at up?
|
|
# Apple at right?
|
|
# Apple at down?
|
|
# Apple at left?
|
|
# Obstacle at up?
|
|
# Obstacle at right?
|
|
# Obstacle at down?
|
|
# Obstacle at left?
|
|
##### Totally 12 boolean features so 2^12=4096 states
|
|
##### Totally 4 actions for the AI (up, right,down,left)
|
|
##### Totally 4*2^12 thus 16 384 table entries
|
|
##### Reward +1 when eat an apple
|
|
##### Reward -10 when hit obstacle
|
|
|
|
qtable=np.zeros((4096, 4))
|
|
|
|
|
|
|
|
game=Snake()
|
|
|
|
def isWall(h,game):
|
|
if h[0]<0 or h[1]<0 or h[0] >= game.grid_width or h[1] >= game.grid_height:
|
|
return(True)
|
|
return(False)
|
|
|
|
|
|
def event_handler(game,event):
|
|
h=game.snake[0]
|
|
left=(h[0]-1,h[1])
|
|
right=(h[0]+1,h[1])
|
|
up=(h[0],h[1]-1)
|
|
down=(h[0],h[1]+1)
|
|
a=game.apple
|
|
|
|
snake_go_up=(game.direction==12)
|
|
snake_go_right=(game.direction==3)
|
|
snake_go_down=(game.direction==6)
|
|
snake_go_left=(game.direction==9)
|
|
|
|
apple_up=(up==a)
|
|
apple_right=(right==a)
|
|
apple_down=(down==a)
|
|
apple_left=(left==a)
|
|
|
|
obstacle_up=(up in game.snake or isWall(up, game))
|
|
obstacle_right=(right in game.snake or isWall(right, game))
|
|
obstacle_down=(down in game.snake or isWall(down, game))
|
|
obstacle_left=(left in game.snake or isWall(left, game))
|
|
|
|
if game.snake[0][0]==10:
|
|
game.direction=6
|
|
|
|
for i in range(0,10):
|
|
score=game.run(event_handler=event_handler)
|
|
print("Game ended with "+str(score)) |