Return to Question

Notice removed Draw attention by rookie

occurred Jun 10, 2015 at 2:25

Bounty Ended with janos's answer chosen by rookie

occurred Jun 10, 2015 at 2:25

adding link to 2048 game

Source Link

edit approved Jun 7, 2015 at 3:01

Community Bot

edit approved Jun 7, 2015 at 3:01

Community Bot

A few weeks ago, I wrote a Python implementation of 20482048. Since then, I've been working on a simple AI to play the game for me. The code uses expectimax search to evaluate each move, and chooses the move that maximizes the search as the next move to execute.

A few weeks ago, I wrote a Python implementation of 2048. Since then, I've been working on a simple AI to play the game for me. The code uses expectimax search to evaluate each move, and chooses the move that maximizes the search as the next move to execute.

Tweeted twitter.com/#!/StackCodeReview/status/606650881329774594

occurred Jun 5, 2015 at 2:36

Notice added Draw attention by rookie

occurred Jun 4, 2015 at 17:54

Bounty Started worth 50 reputation by rookie

occurred Jun 4, 2015 at 17:54

deleted 74 characters in body

Source Link

edited Jun 2, 2015 at 18:06

rookie

edited Jun 2, 2015 at 18:06

rookie

1.2k
3
14
32

The code for the game and the AI can be found here. ToYou can run: b = Game().baiplay; now play the board with a aiplay(b)Game instance.

from game import *
import math
def aimove(b):
 """
 Returns a list of possible moves ("left", "right", "up", "down")
 and each corresponding fitness
 """
 def fitness(b):
 """
 Returns the heuristic value of b
 Snake refers to the "snake line pattern" (http://tinyurl.com/l9bstk6)
 Here we only evaluate one direction; we award more points if high valued tiles
 occur along this path. We penalize the board for not having
 the highest valued tile in the lower left corner
 """
 if Game.over(b):
 return -float("inf")
 
 snake = []
 for i, col in enumerate(zip(*b)):
 snake.extend(reversed(col) if i % 2 == 0 else col)
 m = max(snake)
 return sum(x/10**n for n, x in enumerate(snake)) - \
 math.pow((b[3][0] != m)*abs(b[3][0] - m), 2)
 def search(b, d, move=False):
 """
 Performs expectimax search on a given configuration to
 specified depth (d).
 Algorithm details:
 - if the AI needs to move, make each child move,
 recurse, return the maximum fitness value
 - if it is not the AI's turn, form all
 possible child spawns, and return their weighted average 
 as that node's evaluation
 """
 if d == 0 or (move and Game.over(b)):
 return fitness(b)
 alpha = fitness(b)
 if move:
 for _, child in Game.actions(b):
 return max(alpha, search(child, d-1))
 else:
 alpha = 0
 zeros = [(i,j) for i,j in itertools.product(range(4), range(4)) if b[i][j] == 0]
 for i, j in zeros:
 c1 = [[x for x in row] for row in b]
 c2 = [[x for x in row] for row in b]
 c1[i][j] = 2
 c2[i][j] = 4
 alpha += .9*search(c1, d-1, True)/len(zeros) + \
 .1*search(c2, d-1, True)/len(zeros)
 return alpha
 return [(action, search(child, 5)) for action ,child in Game.actions(b)]
 
def aiplay(bgame):
 """
 Runs thea game instance playing the move determined
 by aimove.
 To run, get a board"""
 from Game first (b = Game()game.b). 
 You can then play that board with aiplay(b)
 """
 while True:
 print(Game.string(b) + "\n")
 action = max(aimove(b), key = lambda x: x[1])[0]
 
 if action == "left" : b = Game.left(b)
 if action == "right": b = Game.right(b)
 if action == "up" : b = Game.up(b)
 if action == "down" : b = Game.down(b)
 b = Game.spawn(b, 1)
 if Game.over(b):
 m = max(x for row in b for x in row)
 print("game over...best was %s" %m)
 print(Game.string(b))
 break

The code for the game and the AI can be found here. To run: b = Game().b; now play the board with aiplay(b)

from game import *
import math
def aimove(b):
 """
 Returns a list of possible moves ("left", "right", "up", "down")
 and each corresponding fitness
 """
 def fitness(b):
 """
 Returns the heuristic value of b
 Snake refers to the "snake line pattern" (http://tinyurl.com/l9bstk6)
 Here we only evaluate one direction; we award more points if high valued tiles
 occur along this path. We penalize the board for not having
 the highest valued tile in the lower left corner
 """
 if Game.over(b):
 return -float("inf")
 
 snake = []
 for i, col in enumerate(zip(*b)):
 snake.extend(reversed(col) if i % 2 == 0 else col)
 m = max(snake)
 return sum(x/10**n for n, x in enumerate(snake)) - \
 math.pow((b[3][0] != m)*abs(b[3][0] - m), 2)
 def search(b, d, move=False):
 """
 Performs expectimax search on a given configuration to
 specified depth (d).
 Algorithm details:
 - if the AI needs to move, make each child move,
 recurse, return the maximum fitness value
 - if it is not the AI's turn, form all
 possible child spawns, and return their weighted average 
 as that node's evaluation
 """
 if d == 0 or (move and Game.over(b)):
 return fitness(b)
 alpha = fitness(b)
 if move:
 for _, child in Game.actions(b):
 return max(alpha, search(child, d-1))
 else:
 alpha = 0
 zeros = [(i,j) for i,j in itertools.product(range(4), range(4)) if b[i][j] == 0]
 for i, j in zeros:
 c1 = [[x for x in row] for row in b]
 c2 = [[x for x in row] for row in b]
 c1[i][j] = 2
 c2[i][j] = 4
 alpha += .9*search(c1, d-1, True)/len(zeros) + \
 .1*search(c2, d-1, True)/len(zeros)
 return alpha
 return [(action, search(child, 5)) for action ,child in Game.actions(b)]
 
def aiplay(b):
 """
 Runs the game playing the move determined
 by aimove.
 To run, get a board from Game first (b = Game().b). 
 You can then play that board with aiplay(b)
 """
 while True:
 print(Game.string(b) + "\n")
 action = max(aimove(b), key = lambda x: x[1])[0]
 
 if action == "left" : b = Game.left(b)
 if action == "right": b = Game.right(b)
 if action == "up" : b = Game.up(b)
 if action == "down" : b = Game.down(b)
 b = Game.spawn(b, 1)
 if Game.over(b):
 m = max(x for row in b for x in row)
 print("game over...best was %s" %m)
 print(Game.string(b))
 break

The code for the game and the AI can be found here. You can run aiplay with a Game instance.

from game import *
import math
def aimove(b):
 """
 Returns a list of possible moves ("left", "right", "up", "down")
 and each corresponding fitness
 """
 def fitness(b):
 """
 Returns the heuristic value of b
 Snake refers to the "snake line pattern" (http://tinyurl.com/l9bstk6)
 Here we only evaluate one direction; we award more points if high valued tiles
 occur along this path. We penalize the board for not having
 the highest valued tile in the lower left corner
 """
 if Game.over(b):
 return -float("inf")
 
 snake = []
 for i, col in enumerate(zip(*b)):
 snake.extend(reversed(col) if i % 2 == 0 else col)
 m = max(snake)
 return sum(x/10**n for n, x in enumerate(snake)) - \
 math.pow((b[3][0] != m)*abs(b[3][0] - m), 2)
 def search(b, d, move=False):
 """
 Performs expectimax search on a given configuration to
 specified depth (d).
 Algorithm details:
 - if the AI needs to move, make each child move,
 recurse, return the maximum fitness value
 - if it is not the AI's turn, form all
 possible child spawns, and return their weighted average 
 as that node's evaluation
 """
 if d == 0 or (move and Game.over(b)):
 return fitness(b)
 alpha = fitness(b)
 if move:
 for _, child in Game.actions(b):
 return max(alpha, search(child, d-1))
 else:
 alpha = 0
 zeros = [(i,j) for i,j in itertools.product(range(4), range(4)) if b[i][j] == 0]
 for i, j in zeros:
 c1 = [[x for x in row] for row in b]
 c2 = [[x for x in row] for row in b]
 c1[i][j] = 2
 c2[i][j] = 4
 alpha += .9*search(c1, d-1, True)/len(zeros) + \
 .1*search(c2, d-1, True)/len(zeros)
 return alpha
 return [(action, search(child, 5)) for action ,child in Game.actions(b)]
 
def aiplay(game):
 """
 Runs a game instance playing the move determined
 by aimove.
 """
 b = game.b
 while True:
 print(Game.string(b) + "\n")
 action = max(aimove(b), key = lambda x: x[1])[0]
 
 if action == "left" : b = Game.left(b)
 if action == "right": b = Game.right(b)
 if action == "up" : b = Game.up(b)
 if action == "down" : b = Game.down(b)
 b = Game.spawn(b, 1)
 if Game.over(b):
 m = max(x for row in b for x in row)
 print("game over...best was %s" %m)
 print(Game.string(b))
 break

added 37 characters in body

Source Link

edited Jun 2, 2015 at 17:56

rookie

edited Jun 2, 2015 at 17:56

rookie

1.2k
3
14
32

The code for the game and the AI can be found here. To run: b = Game().b; now play the board with aiplay(b)

Below is the relevant AI code:

from game import *
import math
def aimove(b):
 """
 Returns a list of possible moves ("left", "right", "up", "down")
 and each corresponding fitness
 """
 def fitness(b):
 """
 Returns the heuristic value of b
 Snake refers to the "snake line pattern" (http://tinyurl.com/l9bstk6)
 Here we only evaluate one direction; we award more points if high valued tiles
 occur along this path. We penalize the board for not having
 the highest valued tile in the lower left corner
 """
 if Game.over(b):
 return -float("inf")
 
 snake = []
 for i, col in enumerate(zip(*b)):
 snake.extend(reversed(col) if i % 2 == 0 else col)
 m = max(snake)
 return sum(x/10**n for n, x in enumerate(snake)) - \
 math.pow((b[3][0] != m)*abs(b[3][0] - m), 2)
 def search(b, d, move=False):
 """
 Performs expectimax search on a given configuration to
 specified depth (d).
 Algorithm details:
 - if the AI needs to move, make each child move,
 recurse, return the maximum fitness value
 - if it is not the AI's turn, form all
 possible child spawns, and return their weighted average 
 as that node's evaluation
 """
 if d == 0 or (move and Game.over(b)):
 return fitness(b)
 alpha = fitness(b)
 if move:
 for _, child in Game.actions(b):
 return max(alpha, search(child, d-1, False))
 else:
 alpha = 0
 zeros = [(i,j) for i,j in itertools.product(range(4), range(4)) if b[i][j] == 0]
 for i, j in zeros:
 c1 = [[x for x in row] for row in b]
 c2 = [[x for x in row] for row in b]
 c1[i][j] = 2
 c2[i][j] = 4
 alpha += .9*search(c1, d-1, True)/len(zeros) + \
 .1*search(c2, d-1, True)/len(zeros)
 return alpha
 return [(action, search(child, 5)) for action ,child in Game.actions(b)]
 
def aiplay(b):
 """
 Runs the game playing the move determined
 by aimove.
 To run, get a board from Game first (b = Game().b). 
 You can then play that board with aiplay(b)
 """
 while True:
 print(Game.string(b) + "\n")
 action = max(aimove(b), key = lambda x: x[1])[0]
 
 if action == "left" : b = Game.left(b)
 if action == "right": b = Game.right(b)
 if action == "up" : b = Game.up(b)
 if action == "down" : b = Game.down(b)
 b = Game.spawn(b, 1)
 if Game.over(b):
 m = max(x for row in b for x in row)
 print("game over...best was %s" %m)
 print(Game.string(b))
 break

The code for the game and the AI can be found here. Below is the relevant AI code:

from game import *
import math
def aimove(b):
 """
 Returns a list of possible moves ("left", "right", "up", "down")
 and each corresponding fitness
 """
 def fitness(b):
 """
 Returns the heuristic value of b
 Snake refers to the "snake line pattern" (http://tinyurl.com/l9bstk6)
 Here we only evaluate one direction; we award more points if high valued tiles
 occur along this path. We penalize the board for not having
 the highest valued tile in the lower left corner
 """
 if Game.over(b):
 return -float("inf")
 
 snake = []
 for i, col in enumerate(zip(*b)):
 snake.extend(reversed(col) if i % 2 == 0 else col)
 m = max(snake)
 return sum(x/10**n for n, x in enumerate(snake)) - \
 math.pow((b[3][0] != m)*abs(b[3][0] - m), 2)
 def search(b, d, move=False):
 """
 Performs expectimax search on a given configuration to
 specified depth (d).
 Algorithm details:
 - if the AI needs to move, make each child move,
 recurse, return the maximum fitness value
 - if it is not the AI's turn, form all
 possible child spawns, and return their weighted average 
 as that node's evaluation
 """
 if d == 0 or (move and Game.over(b)):
 return fitness(b)
 alpha = fitness(b)
 if move:
 for _, child in Game.actions(b):
 return max(alpha, search(child, d-1, False))
 else:
 alpha = 0
 zeros = [(i,j) for i,j in itertools.product(range(4), range(4)) if b[i][j] == 0]
 for i, j in zeros:
 c1 = [[x for x in row] for row in b]
 c2 = [[x for x in row] for row in b]
 c1[i][j] = 2
 c2[i][j] = 4
 alpha += .9*search(c1, d-1, True)/len(zeros) + \
 .1*search(c2, d-1, True)/len(zeros)
 return alpha
 return [(action, search(child, 5)) for action ,child in Game.actions(b)]
 
def aiplay(b):
 """
 Runs the game playing the move determined
 by aimove.
 """
 while True:
 print(Game.string(b) + "\n")
 action = max(aimove(b), key = lambda x: x[1])[0]
 
 if action == "left" : b = Game.left(b)
 if action == "right": b = Game.right(b)
 if action == "up" : b = Game.up(b)
 if action == "down" : b = Game.down(b)
 b = Game.spawn(b, 1)
 if Game.over(b):
 m = max(x for row in b for x in row)
 print("game over...best was %s" %m)
 print(Game.string(b))
 break

The code for the game and the AI can be found here. To run: b = Game().b; now play the board with aiplay(b)

Below is the relevant AI code:

from game import *
import math
def aimove(b):
 """
 Returns a list of possible moves ("left", "right", "up", "down")
 and each corresponding fitness
 """
 def fitness(b):
 """
 Returns the heuristic value of b
 Snake refers to the "snake line pattern" (http://tinyurl.com/l9bstk6)
 Here we only evaluate one direction; we award more points if high valued tiles
 occur along this path. We penalize the board for not having
 the highest valued tile in the lower left corner
 """
 if Game.over(b):
 return -float("inf")
 
 snake = []
 for i, col in enumerate(zip(*b)):
 snake.extend(reversed(col) if i % 2 == 0 else col)
 m = max(snake)
 return sum(x/10**n for n, x in enumerate(snake)) - \
 math.pow((b[3][0] != m)*abs(b[3][0] - m), 2)
 def search(b, d, move=False):
 """
 Performs expectimax search on a given configuration to
 specified depth (d).
 Algorithm details:
 - if the AI needs to move, make each child move,
 recurse, return the maximum fitness value
 - if it is not the AI's turn, form all
 possible child spawns, and return their weighted average 
 as that node's evaluation
 """
 if d == 0 or (move and Game.over(b)):
 return fitness(b)
 alpha = fitness(b)
 if move:
 for _, child in Game.actions(b):
 return max(alpha, search(child, d-1))
 else:
 alpha = 0
 zeros = [(i,j) for i,j in itertools.product(range(4), range(4)) if b[i][j] == 0]
 for i, j in zeros:
 c1 = [[x for x in row] for row in b]
 c2 = [[x for x in row] for row in b]
 c1[i][j] = 2
 c2[i][j] = 4
 alpha += .9*search(c1, d-1, True)/len(zeros) + \
 .1*search(c2, d-1, True)/len(zeros)
 return alpha
 return [(action, search(child, 5)) for action ,child in Game.actions(b)]
 
def aiplay(b):
 """
 Runs the game playing the move determined
 by aimove.
 To run, get a board from Game first (b = Game().b). 
 You can then play that board with aiplay(b)
 """
 while True:
 print(Game.string(b) + "\n")
 action = max(aimove(b), key = lambda x: x[1])[0]
 
 if action == "left" : b = Game.left(b)
 if action == "right": b = Game.right(b)
 if action == "up" : b = Game.up(b)
 if action == "down" : b = Game.down(b)
 b = Game.spawn(b, 1)
 if Game.over(b):
 m = max(x for row in b for x in row)
 print("game over...best was %s" %m)
 print(Game.string(b))
 break