Minimax算法研究（TicTacToe）

全部 Linux 数据库敏捷编程数据结构软件测试项目管理 Oracle 编程综合互联网 Erlang MySQL

浏览 7290 次

锁定老帖子主题：Minimax算法研究（TicTacToe）精华帖 (0) :: 良好帖 (0) :: 新手帖 (0) :: 隐藏帖 (0)
作者	正文
univasity 等级: 性别: 文章: 35 积分: 160 来自: 广州	发表时间：2011-09-11 最后修改：2011-09-12 相关推荐: TicTacToe：实现了minimax算法的TicTacToe 有一个农场公司，专门向市场销售各类水果，主要包括下列水果：葡萄 Grape，草莓 Stuawberry，苹果 Apple；有一个Fruit接口，包含grow生长，harvest收获和plant方法， Minimax-TicTacToe：一个Minimax算法实现项目 TicTacToe:使用Winmaxs和minimax算法开发的TicTacToe游戏 tictactoe:Minimax算法更多相关推荐数据结构极小极大的定义 Minimax算法又名极小化极大算法，是一种找出失败的最大可能性中的最小值的算法（即最小化对手的最大得益）。通常以递归形式来实现。 Minimax算法常用于棋类等由两方较量的游戏和程序。该算法是一个零总和算法，即一方要在可选的选项中选择将其优势最大化的选择，另一方则选择令对手优势最小化的一个，其输赢的总和为0（有点像能量守恒，就像本身两个玩家都有1点，最后输家要将他的1点给赢家，但整体上还是总共有2点）。很多棋类游戏可以采取此算法，例如tic-tac-toe。关于极小极大，更多的信息可参考以下文章： Minimax(wikipedia) Understanding The MiniMax Algorithm Minimax Explained 最小最大原理与搜索方法以TIC-TAC-TOE为例 tic-tac-toe就是我们小时候玩的井字棋（我这边习惯叫“井字过三关”），不熟悉的可以参考wiki 。一般X的玩家先下。设定X玩家的最大利益为正无穷（+∞），O玩家的最大利益为负无穷（-∞），这样我们称X玩家为MAX（因为他总是追求更大的值），成O玩家为MIN（她总是追求更小的值），各自都为争取自己的最大获益而努力。现在，让我们站在MAX的立场来分析局势（这是必须的，应为你总不能两边倒吧，你喜欢的话也可以选择MIN）。由于MAX是先下的（习惯上X的玩家先下），于是构建出来的博弈树如下(前面两层)： MAX总是会选择MIN最大获利中的最小值（对MAX最有利），同样MIN也会一样，选择对自己最有利的（即MAX有可能获得的最大值）。有点难理解，其实就是自己得不到也不给你得到这样的意思啦，抢先把对对手有利的位置抢占了。你会看出，这是不断往下深钻的，直到最底层（即叶节点）你才能网上回溯，确定那个是对你最有利的。具体过程会像是这么一个样子的：但实际情况下，完全遍历一颗博弈树是不现实的，因为层级的节点数是指数级递增的：层数节点数 0 1 1 9 2 72 3 504 4 3024 5 15120 6 60480 7 181440 8 362880 完全遍历会很耗时...一般情况下需要限制深钻的层数，在达到限定的层数时就返回一个估算值（通过一个启发式的函数对当前博弈位置进行估值），这样获得的值就不是精确的了（遍历的层数越深越精确，当然和估算函数也有一定关系），但该值依然是足够帮助我们做出决策的。于是，对耗时和精确度需要做一个权衡。一般我们限定其遍历的深度为6（目前多数的象棋游戏也是这么设定的）。于是，我们站在MAX的角度，评估函数会是这样子的： static final int INFINITY = 100 ; // 表示无穷的值 static final int WIN = +INFINITY ; // MAX的最大利益为正无穷 static final int LOSE = -INFINITY ; // MAX的最小得益（即MIN的最大得益）为负无穷 static final int DOUBLE_LINK = INFINITY / 2 ; // 如果同一行、列或对角上连续有两个，赛点 static final int INPROGRESS = 1 ; // 仍可继续下（没有胜出或和局） static final int DRAW = 0 ; // 和局 static final int [][] WIN_STATUS = { { 0, 1, 2 }, { 3, 4, 5 }, { 6, 7, 8 }, { 0, 3, 6 }, { 1, 4, 7 }, { 2, 5, 8 }, { 0, 4, 8 }, { 2, 4, 6 } }; /** * 估值函数，提供一个启发式的值，决定了游戏AI的高低 / public int gameState( char [] board ) { int result = INPROGRESS; boolean isFull = true ; // is game over? for ( int pos = 0; pos < 9; pos++) { char chess = board[pos]; if ( empty == chess) { isFull = false ; break ; } } // is Max win/lose? for ( int [] status : WIN_STATUS) { char chess = board[status[0]]; if (chess == empty ) { break ; } int i = 1; for (; i < status.length; i++) { if (board[status[i]] != chess) { break ; } } if (i == status.length) { result = chess == x ? WIN : LOSE; break ; } } if (result != WIN & result != LOSE) { if (isFull) { // is draw result = DRAW; } else { // check double link // finds[0]->'x', finds[1]->'o' int [] finds = new int [2]; for ( int [] status : WIN_STATUS) { char chess = empty ; boolean hasEmpty = false ; int count = 0; for ( int i = 0; i < status.length; i++) { if (board[status[i]] == empty ) { hasEmpty = true ; } else { if (chess == empty ) { chess = board[status[i]]; } if (board[status[i]] == chess) { count++; } } } if (hasEmpty && count > 1) { if (chess == x ) { finds[0]++; } else { finds[1]++; } } } // check if two in one line if (finds[1] > 0) { result = -DOUBLE_LINK; } else if (finds[0] > 0) { result = DOUBLE_LINK; } } } return result; } 基于这些，一个限定层数的实现是这样的： /* * 以'x'的角度来考虑的极小极大算法 / public int minimax( char [] board, int depth){ int [] bestMoves = new int [9]; int index = 0; int bestValue = - INFINITY ; for ( int pos=0; pos<9; pos++){ if (board[pos]== empty ){ board[pos] = x ; int value = min(board, depth); if (value>bestValue){ bestValue = value; index = 0; bestMoves[index] = pos; } else if (value==bestValue){ index++; bestMoves[index] = pos; } board[pos] = empty ; } } if (index>1){ index = ( new Random (System. currentTimeMillis ()).nextInt()>>>1)%index; } return bestMoves[index]; } /* * 对于'x'，估值越大对其越有利 / public int max( char [] board, int depth){ int evalValue = gameState (board); boolean isGameOver = (evalValue== WIN \|\| evalValue== LOSE \|\| evalValue== DRAW ); if (depth==0 \|\| isGameOver){ return evalValue; } int bestValue = - INFINITY ; for ( int pos=0; pos<9; pos++){ if (board[pos]== empty ){ // try board[pos] = x ; // maximixing bestValue = Math. max (bestValue, min(board, depth-1)); // reset board[pos] = empty ; } } return evalValue; } /* * 对于'o'，估值越小对其越有利 / public int min( char [] board, int depth){ int evalValue = gameState (board); boolean isGameOver = (evalValue== WIN \|\| evalValue== LOSE \|\| evalValue== DRAW ); if (depth==0 \|\| isGameOver){ return evalValue; } int bestValue = + INFINITY ; for ( int pos=0; pos<9; pos++){ if (board[pos]== empty ){ // try board[pos] = o ; // minimixing bestValue = Math.min(bestValue, max(board, depth-1)); // reset board[pos] = empty ; } } return evalValue; } Alpha-beta剪枝* 另外，通过结合Alpha-beta剪枝能进一步优化效率。Alpha-beta剪枝顾名思义就是裁剪掉一些不必要的分支，以减少遍历的节点数。实际上是通过传递两个参数alpha和beta到递归的极小极大函数中，alpha表示了MAX的最坏情况，beta表示了MIN的最坏情况，因此他们的初始值为负无穷和正无穷。在递归的过程中，在轮到MAX的回合，如果极小极大的值比alpha大，则更新alpha；在MIN的回合中，如果极小极大值比beta小，则更新beta。当alpha和beta相交时（即alpha>=beta），这时该节点的所有子节点对于MAX和MIN双方都不会带来好的获益，所以可以忽略掉（裁剪掉）以该节点为父节点的整棵子树。根据这一定义，可以很轻易地在上面程序的基础上进行改进： /** * 以'x'的角度来考虑的极小极大算法 / public int minimax( char [] board, int depth){ int [] bestMoves = new int [9]; int index = 0; int bestValue = - INFINITY ; for ( int pos=0; pos<9; pos++){ if (board[pos]== empty ){ board[pos] = x ; int value = min(board, depth, - INFINITY , + INFINITY ); if (value>bestValue){ bestValue = value; index = 0; bestMoves[index] = pos; } else if (value==bestValue){ index++; bestMoves[index] = pos; } board[pos] = empty ; } } if (index>1){ index = ( new Random (System. currentTimeMillis ()).nextInt()>>>1)%index; } return bestMoves[index]; } /* * 对于'x'，估值越大对其越有利 / public int max( char [] board, int depth, int alpha, int beta){ int evalValue = gameState (board); boolean isGameOver = (evalValue== WIN \|\| evalValue== LOSE \|\| evalValue== DRAW ); if (beta<=alpha){ return evalValue; } if (depth==0 \|\| isGameOver){ return evalValue; } int bestValue = - INFINITY ; for ( int pos=0; pos<9; pos++){ if (board[pos]== empty ){ // try board[pos] = x ; // maximixing bestValue = Math. max (bestValue, min(board, depth-1, Math. max (bestValue, alpha), beta)); // reset board[pos] = empty ; } } return evalValue; } /* * 对于'o'，估值越小对其越有利 / public int min( char [] board, int depth, int alpha, int beta){ int evalValue = gameState (board); boolean isGameOver = (evalValue== WIN \|\| evalValue== LOSE \|\| evalValue== DRAW ); if (alpha>=beta){ return evalValue; } // try if (depth==0 \|\| isGameOver \|\| alpha>=beta){ return evalValue; } int bestValue = + INFINITY ; for ( int pos=0; pos<9; pos++){ if (board[pos]== empty ){ // try board[pos] = o ; // minimixing bestValue = Math.min(bestValue, max(board, depth-1, alpha, Math.min(bestValue, beta))); // reset board[pos] = empty ; } } return evalValue; } 这里对极小极大算法的实现只是其中一种可行性，实际上可能会看到很多种不同的实现方式，但道理是一样的。使用开局库同时，你会发现，这样做视乎还不够，特别在一开局。我们都知道，中心的位置是最好的，但是按照我们上面的算法，第一步确实随机的...这在深度受限制的情况下就更显得重要了。于是就引申出了开局库的概念，这是我在某个讲象棋AI的网上看到的，就是给初始的棋盘设定一些格局。针对上面的例子，我们只要判断是否第一步棋，如果是则想办法让他选择中心的位置（4）。在WIKI百科中找到一幅图也能作为TIC-TAC-TOE开局库的参考：于是，估算函数会变成这样的（当然也可以在别的地方修改，只要合理）： //开局时，每个位置的估值 static final int [] INITIAL_POS_VALUE = { 3, 2, 3, 2, 4, 2, 3, 2, 3 }; /** * 估值函数，提供一个启发式的值，决定了游戏AI的高低 / public int gameState ( char [] board ) { int result = INPROGRESS ; boolean isFull = true ; int sum = 0; int index = 0; // is game over? for ( int pos=0; pos<9; pos++){ char chess = board[pos]; if ( empty ==chess){ isFull = false ; } else { sum += chess; index = pos; } } // 如果是初始状态，则使用开局库 boolean isInitial = (sum== x \|\|sum== o ); if (isInitial){ return (sum== x ?1:-1)INITIAL_POS_VALUE[index]; } // is Max win/lose? for ( int [] status : WIN_STATUS ){ char chess = board[status[0]]; if (chess== empty ){ break ; } int i = 1; for (; i<status.length; i++){ if (board[status[i]]!=chess){ break ; } } if (i==status.length){ result = chess== x ? WIN : LOSE ; break ; } } if (result!= WIN & result!= LOSE ){ if (isFull){ // is draw result = DRAW ; } else { // check double link // finds[0]->'x', finds[1]->'o' int [] finds = new int [2]; for ( int [] status : WIN_STATUS ){ char chess = empty ; boolean hasEmpty = false ; int count = 0; for ( int i=0; i<status.length; i++){ if (board[status[i]]== empty ){ hasEmpty = true ; } else { if (chess== empty ){ chess = board[status[i]]; } if (board[status[i]]==chess){ count++; } } } if (hasEmpty && count>1){ if (chess== x ){ finds[0]++; } else { finds[1]++; } } } // check if two in one line if (finds[1]>0){ result = - DOUBLE_LINK ; } else if (finds[0]>0){ result = DOUBLE_LINK ; } } } return result; } ---------------------------------------------------------------------------------------------------- 参考资料极大极小博弈树的简洁（附Tic-Tac-Toe源码） Tic-Tac-Toe算法笔记(一)：Minimax算法大小: 9.3 KB 大小: 35.1 KB 大小: 671 KB MinimaxDemos_TicTacToe-Java_.rar (4.3 KB) 描述: 分别是使用了深度限制和使用了Alpha-beta剪枝的例子（能直接编译运行）下载次数: 97 查看图片附件声明：ITeye文章版权属于作者，受法律保护。没有作者书面许可不得转载。推荐链接
返回顶楼

苍山洱海等级: 初级会员性别: 文章: 95 积分: 0 来自: 北京	发表时间：2011-09-12 我想知道你这个代码是怎么着色的？
返回顶楼	回帖地址 0 0 请登录后投票

univasity 等级: 性别: 文章: 35 积分: 160 来自: 广州	发表时间：2011-09-12 从Eclipse中粘贴出来就能带上颜色了，或者你用论坛提供的代码显示工具。额，论坛居然显示不完整... 苍山洱海写道我想知道你这个代码是怎么着色的？
返回顶楼	回帖地址 0 0 请登录后投票

论坛首页 → 综合技术版

跳转论坛: