Minor changes
This commit is contained in:
parent
69c5d709a4
commit
451856be1b
1 changed files with 24 additions and 3 deletions
27
qlearning.py
27
qlearning.py
|
@ -38,7 +38,12 @@ def isWall(h,game):
|
||||||
return(True)
|
return(True)
|
||||||
return(False)
|
return(False)
|
||||||
|
|
||||||
|
|
||||||
|
last_state=None
|
||||||
|
last_action=None
|
||||||
def event_handler(game,event):
|
def event_handler(game,event):
|
||||||
|
global last_state,last_action
|
||||||
|
|
||||||
h=game.snake[0]
|
h=game.snake[0]
|
||||||
left=(h[0]-1,h[1])
|
left=(h[0]-1,h[1])
|
||||||
right=(h[0]+1,h[1])
|
right=(h[0]+1,h[1])
|
||||||
|
@ -70,14 +75,30 @@ def event_handler(game,event):
|
||||||
# This come from me I do not now if it is the best way to identify a state
|
# This come from me I do not now if it is the best way to identify a state
|
||||||
state=2**11*snake_go_up+2**10*snake_go_right+2**9*snake_go_down+2**8*snake_go_left+2**7*apple_up+2**6*apple_right+2**5*apple_down+2**4*apple_left+2**3*obstacle_up+2**2*obstacle_right+2**1*obstacle_down+obstacle_left
|
state=2**11*snake_go_up+2**10*snake_go_right+2**9*snake_go_down+2**8*snake_go_left+2**7*apple_up+2**6*apple_right+2**5*apple_down+2**4*apple_left+2**3*obstacle_up+2**2*obstacle_right+2**1*obstacle_down+obstacle_left
|
||||||
|
|
||||||
|
# Choose an action
|
||||||
if np.max(qtable[state]) > 0:
|
if np.max(qtable[state]) > 0:
|
||||||
action = np.argmax(qtable[state])
|
action = np.argmax(qtable[state])
|
||||||
else:
|
else:
|
||||||
action=random.choice((12,3,6,9))
|
action=random.choice((0,1,2,3))
|
||||||
|
|
||||||
game.direction=action
|
# Update current state Q
|
||||||
|
if last_state != None:
|
||||||
|
qtable[last_state,last_action]=qtable[last_state,last_action]+0.5*(reward+0.5*qtable[state])
|
||||||
|
last_state=state
|
||||||
|
last_action=action
|
||||||
|
|
||||||
|
# Apply the action
|
||||||
|
snake_action=12
|
||||||
|
if action==1:
|
||||||
|
snake_action=3
|
||||||
|
elif action==2:
|
||||||
|
snake_action=6
|
||||||
|
elif action==3:
|
||||||
|
snake_action=9
|
||||||
|
game.direction=snake_action
|
||||||
|
|
||||||
for i in range(0,10):
|
for i in range(0,10):
|
||||||
|
last_state=None
|
||||||
|
last_action=None
|
||||||
score=game.run(event_handler=event_handler)
|
score=game.run(event_handler=event_handler)
|
||||||
print("Game ended with "+str(score))
|
print("Game ended with "+str(score))
|
Loading…
Add table
Reference in a new issue