emacs: lisp/play/landmark.el comparison

comparison lisp/play/landmark.el @ 111206:56f4300fbd9f

* lisp/play/landmark.el: Adjust commenting convention. (lm-nil-score): Rename from nil-score. (Xscore, XXscore, XXXscore, XXXXscore, Oscore, OOscore, OOOscore) (OOOOscore): Move into a let in lm-score-trans-table. (lm-winning-threshold, lm-loosing-threshold): Use lm-score-trans-table.

author	Stefan Monnier <monnier@iro.umontreal.ca>
date	Wed, 27 Oct 2010 10:31:44 -0400
parents	cc035ccb9275
children	029e4783cbae

comparison

equal deleted inserted replaced

-:e6399f46aefa
+:56f4300fbd9f
 ;; You should have received a copy of the GNU General Public License
 ;; along with GNU Emacs.  If not, see <http://www.gnu.org/licenses/>.
 ;;; Commentary:
-;;; Lm is a relatively non-participatory game in which a robot
+;; Lm is a relatively non-participatory game in which a robot
-;;; attempts to maneuver towards a tree at the center of the window
+;; attempts to maneuver towards a tree at the center of the window
-;;; based on unique olfactory cues from each of the 4 directions. If
+;; based on unique olfactory cues from each of the 4 directions. If
-;;; the smell of the tree increases, then the weights in the robot's
+;; the smell of the tree increases, then the weights in the robot's
-;;; brain are adjusted to encourage this odor-driven behavior in the
+;; brain are adjusted to encourage this odor-driven behavior in the
-;;; future. If the smell of the tree decreases, the robot's weights are
+;; future. If the smell of the tree decreases, the robot's weights are
-;;; adjusted to discourage a correct move.
+;; adjusted to discourage a correct move.
-;;; In layman's terms, the search space is initially flat. The point
+;; In layman's terms, the search space is initially flat. The point
-;;; of training is to "turn up the edges of the search space" so that
+;; of training is to "turn up the edges of the search space" so that
-;;; the robot rolls toward the center.
+;; the robot rolls toward the center.
-;;; Further, do not become alarmed if the robot appears to oscillate
+;; Further, do not become alarmed if the robot appears to oscillate
-;;; back and forth between two or a few positions. This simply means
+;; back and forth between two or a few positions. This simply means
-;;; it is currently caught in a local minimum and is doing its best to
+;; it is currently caught in a local minimum and is doing its best to
-;;; work its way out.
+;; work its way out.
-;;; The version of this program as described has a small problem. A
+;; The version of this program as described has a small problem. A
-;;; move in a net direction can produce gross credit assignment. For
+;; move in a net direction can produce gross credit assignment. For
-;;; example, if moving south will produce positive payoff, then, if in
+;; example, if moving south will produce positive payoff, then, if in
-;;; a single move, one moves east, west and south, then both east and
+;; a single move, one moves east, west and south, then both east and
-;;; west will be improved when they shouldn't.
+;; west will be improved when they shouldn't.
-;;; Many thanks to Yuri Pryadkin (yuri@rana.usc.edu) for this
+;; Many thanks to Yuri Pryadkin (yuri@rana.usc.edu) for this
-;;; concise problem description.
+;; concise problem description.
 ;;;_* Require
 (eval-when-compile (require 'cl))
 ;;;_* From Gomoku
 ;; Here are the scores of the nine "non-polluted" configurations.  Tuning
 ;; these values will change (hopefully improve) the strength of the program
 ;; and may change its style (rather aggressive here).
-(defconst nil-score	  7  "Score of an empty qtuple.")
+(defconst lm-nil-score	  7  "Score of an empty qtuple.")
-(defconst Xscore	 15  "Score of a qtuple containing one X.")
-(defconst XXscore	400  "Score of a qtuple containing two X's.")
-(defconst XXXscore     1800  "Score of a qtuple containing three X's.")
-(defconst XXXXscore  100000  "Score of a qtuple containing four X's.")
-(defconst Oscore	 35  "Score of a qtuple containing one O.")
-(defconst OOscore	800  "Score of a qtuple containing two O's.")
-(defconst OOOscore    15000  "Score of a qtuple containing three O's.")
-(defconst OOOOscore  800000  "Score of a qtuple containing four O's.")
-;; These values are not just random: if, given the following situation:
-;;
-;;			  . . . . . . . O .
-;;			  . X X a . . . X .
-;;			  . . . X . . . X .
-;;			  . . . X . . . X .
-;;			  . . . . . . . b .
-;;
-;; you want Emacs to play in "a" and not in "b", then the parameters must
-;; satisfy the inequality:
-;;
-;;		   6 * XXscore > XXXscore + XXscore
-;;
-;; because "a" mainly belongs to six "XX" qtuples (the others are less
-;; important) while "b" belongs to one "XXX" and one "XX" qtuples.  Other
-;; conditions are required to obtain sensible moves, but the previous example
-;; should illustrate the point. If you manage to improve on these values,
-;; please send me a note. Thanks.
-;; As we chose values 0, 1 and 6 to denote empty, X and O squares, the
-;; contents of a qtuple are uniquely determined by the sum of its elements and
-;; we just have to set up a translation table.
 (defconst lm-score-trans-table
-(vector nil-score Xscore XXscore XXXscore XXXXscore 0
+(let ((Xscore		15)  ; Score of a qtuple containing one X.
-	  Oscore    0	   0	   0	    0	      0
+(XXscore       400)  ; Score of a qtuple containing two X's.
-	  OOscore   0	   0	   0	    0	      0
+(XXXscore     1800)  ; Score of a qtuple containing three X's.
-	  OOOscore  0	   0	   0	    0	      0
+(XXXXscore  100000)  ; Score of a qtuple containing four X's.
-	  OOOOscore 0	   0	   0	    0	      0
+(Oscore		35)  ; Score of a qtuple containing one O.
-	  0)
+(OOscore       800)  ; Score of a qtuple containing two O's.
+(OOOscore    15000)  ; Score of a qtuple containing three O's.
+(OOOOscore  800000)) ; Score of a qtuple containing four O's.
+;; These values are not just random: if, given the following situation:
+;;
+;;			  . . . . . . . O .
+;;			  . X X a . . . X .
+;;			  . . . X . . . X .
+;;			  . . . X . . . X .
+;;			  . . . . . . . b .
+;;
+;; you want Emacs to play in "a" and not in "b", then the parameters must
+;; satisfy the inequality:
+;;
+;;		   6 * XXscore > XXXscore + XXscore
+;;
+;; because "a" mainly belongs to six "XX" qtuples (the others are less
+;; important) while "b" belongs to one "XXX" and one "XX" qtuples.
+;; Other conditions are required to obtain sensible moves, but the
+;; previous example should illustrate the point.  If you manage to
+;; improve on these values, please send me a note.  Thanks.
+;; As we chose values 0, 1 and 6 to denote empty, X and O squares,
+;; the contents of a qtuple are uniquely determined by the sum of
+;; its elements and we just have to set up a translation table.
+(vector lm-nil-score Xscore XXscore XXXscore XXXXscore 0
+Oscore       0	0	0	 0	   0
+OOscore      0	0	0	 0	   0
+OOOscore     0	0	0	 0	   0
+OOOOscore    0	0	0	 0	   0
+0))
 "Vector associating qtuple contents to their score.")
 ;; If you do not drastically modify the previous constants, the only way for a
 ;; square to have a score higher than OOOOscore is to belong to a "OOOO"
 ;; qtuple, thus to be a winning move. Similarly, the only way for a square to
 ;; have a score between XXXXscore and OOOOscore is to belong to a "XXXX"
 ;; qtuple. We may use these considerations to detect when a given move is
 ;; winning or losing.
-(defconst lm-winning-threshold OOOOscore
+(defconst lm-winning-threshold
+(aref lm-score-trans-table (+ 6 6 6 6)) ;; OOOOscore
 "Threshold score beyond which an Emacs move is winning.")
-(defconst lm-loosing-threshold XXXXscore
+(defconst lm-loosing-threshold
+(aref lm-score-trans-table (+ 1 1 1 1)) ;; XXXXscore
 "Threshold score beyond which a human move is winning.")
 (defun lm-strongest-square ()
 "Compute index of free square with highest score, or nil if none."
 	   (= lm-board-width  lm-saved-board-width)
 	   (= lm-board-height lm-saved-board-height))
 (setq lm-score-table (copy-sequence lm-saved-score-table))
 ;; No, compute it:
 (setq lm-score-table
-	    (make-vector lm-vector-length (* 20 nil-score)))
+	    (make-vector lm-vector-length (* 20 lm-nil-score)))
 (let (i j maxi maxj maxi2 maxj2)
 	(setq maxi  (/ (1+ lm-board-width) 2)
 	      maxj  (/ (1+ lm-board-height) 2)
 	      maxi2 (min 4 maxi)
 	      maxj2 (min 4 maxj))

Mercurial > emacs

comparison lisp/play/landmark.el @ 111206:56f4300fbd9f