Minor changes

This commit is contained in:
Loic Guegan 2022-11-01 20:21:34 +01:00
parent 4d4d5b1481
commit 3b35b6866d
3 changed files with 4133 additions and 24 deletions

View file

@ -1,5 +1,5 @@
#!/usr/bin/env python #!/usr/bin/env python
import sys,random import sys,random,os
import numpy as np import numpy as np
# Import snake game # Import snake game
@ -31,7 +31,7 @@ qtable=np.zeros((4096, 4))
game=Snake() game=Snake(length=4,fps=200)
def isWall(h,game): def isWall(h,game):
if h[0]<0 or h[1]<0 or h[0] >= game.grid_width or h[1] >= game.grid_height: if h[0]<0 or h[1]<0 or h[0] >= game.grid_width or h[1] >= game.grid_height:
@ -41,8 +41,9 @@ def isWall(h,game):
last_state=None last_state=None
last_action=None last_action=None
attempt=0
def event_handler(game,event): def event_handler(game,event):
global last_state,last_action global last_state,last_action,attempt
h=game.snake[0] h=game.snake[0]
left=(h[0]-1,h[1]) left=(h[0]-1,h[1])
@ -56,10 +57,10 @@ def event_handler(game,event):
snake_go_down=(game.direction==6) snake_go_down=(game.direction==6)
snake_go_left=(game.direction==9) snake_go_left=(game.direction==9)
apple_up=(up==a) apple_up=(a[1]<h[1])
apple_right=(right==a) apple_right=(a[0]>h[0])
apple_down=(down==a) apple_down=(a[1]>h[1])
apple_left=(left==a) apple_left=(a[0]<h[0])
obstacle_up=(up in game.snake or isWall(up, game)) obstacle_up=(up in game.snake or isWall(up, game))
obstacle_right=(right in game.snake or isWall(right, game)) obstacle_right=(right in game.snake or isWall(right, game))
@ -67,24 +68,32 @@ def event_handler(game,event):
obstacle_left=(left in game.snake or isWall(left, game)) obstacle_left=(left in game.snake or isWall(left, game))
reward=0 reward=0
if event==1: if event==0:
reward=1 attempt+=1
elif event==-1: if event==-1:
reward=-10 reward=-10
attempt=0
elif event==1:
reward=1
attempt=0
# Avoid infinite loop
if attempt>3000:
reward=-1
attempt=0
# This come from me I do not now if it is the best way to identify a state # This come from me I do not now if it is the best way to identify a state
state=2**11*snake_go_up+2**10*snake_go_right+2**9*snake_go_down+2**8*snake_go_left+2**7*apple_up+2**6*apple_right+2**5*apple_down+2**4*apple_left+2**3*obstacle_up+2**2*obstacle_right+2**1*obstacle_down+obstacle_left state=2**11*snake_go_up+2**10*snake_go_right+2**9*snake_go_down+2**8*snake_go_left+2**7*apple_up+2**6*apple_right+2**5*apple_down+2**4*apple_left+2**3*obstacle_up+2**2*obstacle_right+2**1*obstacle_down+obstacle_left
# Choose an action # Choose an action
action=random.choice((0,1,2,3)) action=random.choice((0,1,2,3))
if np.max(qtable[state]) > 0: if np.max(qtable[state]) > 0:
action = np.argmax(qtable[state]) #qactions=qtable[state]
#options=np.flatnonzero(qactions == np.max(qactions)) # Since Q value might be equals for several actions
print(np.max(qtable[state])) #action = random.choice(options)
action=np.argmax(qtable[state])
# Update current state Q # Update current state Q
if last_state != None: if last_state != None:
qtable[last_state,last_action]=qtable[last_state,last_action]+0.5*(reward+0.5*qtable[state]) qtable[last_state,last_action]=qtable[last_state,last_action]+0.7*(reward+0.9*np.max(qtable[state])-qtable[last_state,last_action])
last_state=state last_state=state
last_action=action last_action=action
@ -98,8 +107,12 @@ def event_handler(game,event):
snake_action=9 snake_action=9
game.direction=snake_action game.direction=snake_action
for i in range(0,10): if os.path.exists("qtable.txt"):
qtable=np.loadtxt("qtable.txt")
for i in range(0,10000):
last_state=None last_state=None
last_action=None last_action=None
score=game.run(event_handler=event_handler) score=game.run(event_handler=event_handler)
if i%100 == 0:
np.savetxt('qtable.txt',qtable)
print("Game ended with "+str(score)) print("Game ended with "+str(score))

4096
qtable.txt Normal file

File diff suppressed because it is too large Load diff

View file

@ -7,7 +7,7 @@ class Snake:
Programmable Game of Snake written in PyGame Programmable Game of Snake written in PyGame
""" """
def __init__(self, margin=80,length=4,grid_width=30,grid_height=30, grid_pts=30,fps=12): def __init__(self, margin=80,length=4,grid_width=30,grid_height=30, grid_pts=30,fps=80):
# Init attributes # Init attributes
self.grid_width=grid_width self.grid_width=grid_width
self.grid_height=grid_height self.grid_height=grid_height
@ -26,7 +26,7 @@ class Snake:
""" """
Reset game state Reset game state
""" """
self.snake=[(5,5)]*self.default_length self.snake=[(0,0)]*self.default_length
self.direction=3 # Like clock (12=up, 3=right, 6=bottom, 9=left) self.direction=3 # Like clock (12=up, 3=right, 6=bottom, 9=left)
self.new_apple() self.new_apple()
self.score=0 self.score=0
@ -57,8 +57,8 @@ class Snake:
Create a new apple Create a new apple
""" """
self.apple=(random.randint(0,self.grid_width-1),random.randint(0,self.grid_height-1)) self.apple=(random.randint(0,self.grid_width-1),random.randint(0,self.grid_height-1))
while self.apple in self.snake: if self.apple in self.snake:
self.apple=(random.randint(0,self.grid_width),random.randint(0,self.grid_height)) self.new_apple()
def move(self): def move(self):
""" """
@ -124,7 +124,7 @@ class Snake:
clock = pygame.time.Clock() clock = pygame.time.Clock()
ignore_has_loose=True ignore_has_loose=True
self.new_game() self.new_game()
event=0 # 0 is nothing, 1 is eat an apple and -1 loose last_event=0 # 0 is nothing, 1 is eat an apple and -1 loose
while True: while True:
self.screen.fill((0,0,0)) self.screen.fill((0,0,0))
self.draw_snake() self.draw_snake()
@ -156,15 +156,15 @@ class Snake:
break break
# Check if an event handler is available # Check if an event handler is available
if event_handler!=None: if event_handler!=None:
event_handler(self,event) event_handler(self,last_event)
event=0 last_event=0
self.move() self.move()
# Check for eating apple # Check for eating apple
if self.apple==self.snake[0]: if self.apple==self.snake[0]:
self.snake.append(self.snake[len(self.snake)-1]) self.snake.append(self.snake[len(self.snake)-1])
self.new_apple() self.new_apple()
self.score+=1 self.score+=1
event=1 last_event=1
pygame.display.flip() pygame.display.flip()
clock.tick(self.fps) clock.tick(self.fps)
return(self.score) return(self.score)