/**
 * This applet demonstrates learning in a simple game. It isn't designed to be general or reusable.
<p>
 * Copyright (C) 2008  <A HREF="http://www.cs.ubc.ca/spider/poole/">David Poole</A>.
<p>
 * This program implements the learning agent. The GUI is in <A
   HREF="MASLearningGUI.java">MASLearningGUI.java</A>.  The controller that runs the game is in <A
   HREF="SGameController.java">SGameController.java</A>.
<p>
 This program is free software; you can redistribute it and/or
 modify it under the terms of the GNU General Public License
 as published by the Free Software Foundation; either version 2
 of the License, or (at your option) any later version.
<p>
 This program is distributed in the hope that it will be useful,
 but WITHOUT ANY WARRANTY; without even the implied warranty of
 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 GNU General Public License for more details.
<p>
 You should have received a copy of the GNU General Public License
 along with this program; if not, write to the Free Software
 Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.


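<p>
 A minimal usage sketch (hypothetical driver code, not part of the applet; in the
 applet the agent is driven from the controller):
<pre>
    WolfLearningAgent agent = new WolfLearningAgent(2); // an agent with two actions
    int act = agent.getAction();      // agent samples an action from its mixed strategy
    double payoff = (act == 0) ? 1.0 : 0.0;  // stand-in payoff, for illustration only
    agent.tellReward(payoff);         // agent updates its value estimates and strategy
</pre>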
 * @author David Poole  poole@cs.ubc.ca
 * @version 0.01 2008-04-17 */

public class WolfLearningAgent
{
    int numActions;        // number of available actions
    double[] prob;         // prob[i] is the probability of choosing action i (the mixed strategy)
    double[] value;        // value[i] is the estimated value of action i
    int visits = 0;        // number of payoffs received (reset by randomizeStrategy)
    double aveValue = 0.0; // running average of the payoffs received

    double actRandomlyWithProbability=0.05;  // probability of exploring with a random action
    int action=0; // the last action
    // Parameters: the learning rate alpha and the WoLF step sizes
    // (deltaWin < deltaLose, so the agent adjusts its strategy faster when losing)
    Parameter[] parameter = {
	    new Parameter("alpha",0.1),
	    new Parameter("deltaWin",0.0001),
	    new Parameter("deltaLose",0.001)
	};
    // indices into the parameter array
    static final int alpha=0;
    static final int deltaWin=1;
    static final int deltaLose=2;

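    // Constructs an agent with numActions actions, a uniform initial mixed
    // strategy, and zero initial value estimates.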
    WolfLearningAgent(int numActions) {
	this.numActions = numActions;
	prob = new double[numActions];
	value = new double[numActions];
// 	visits = new int[numActions];
// 	aveValue = new double[numActions];

	for (int i=0; i<numActions; i++) {
	    prob[i]=1.0/numActions;
	    value[i]=0.0;
// 	    visits[i]=0;
// 	    aveValue[i]=0.0;
	}
    }

    // resets to a random mixed strategy and clears the value estimates
    void randomizeStrategy() {
	double probMass = 0.0;
	for (int i=0; i<numActions; i++) {
	    prob[i] = Math.random();
	    probMass += prob[i];
	}
	for (int i=0; i<numActions; i++) {
	    prob[i] = prob[i]/probMass;
	    value[i]=0.0;
	}

	visits=0;
    }

	

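    // Returns an action: with probability actRandomlyWithProbability it explores
    // uniformly at random; otherwise it samples from the current mixed strategy prob[].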
    int getAction() {
	if (Math.random()<actRandomlyWithProbability) {
	    action =  (int) (Math.random()*numActions);  //act randomly
	    return action;
	}
	else { // follow the policy
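	    // roulette-wheel sampling: subtract each action's probability from
	    // rand until rand falls within some action's share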
	    double rand = Math.random();
	    for (action=0; action<numActions; action++) {
		if(rand < prob[action])
		    return action;
		else
		    rand = rand- prob[action];
	    }
	}
	System.out.println("getAction() error. Prob dist is ["+prob[0]+", "+prob[1]+"].");
	return 0; //should never occur
    }


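    // WoLF ("Win or Learn Fast") style policy hill-climbing update: the mixed
    // strategy is nudged towards the action with the highest estimated value,
    // using the small step deltaWin when the agent is "winning" (the best value
    // exceeds the average payoff) and the larger step deltaLose otherwise.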
    void tellReward(double payoff) {
	// update value
	value[action] = value[action]+parameter[alpha].value*(payoff-value[action]);
	// find the average payoff
	visits++;
	aveValue = aveValue+(1.0/visits)*(payoff-aveValue);
	// find the best action, scanning from a random start so ties are broken randomly
	int start = (int)(Math.random()*numActions);
	int abest= start;
	for (int i=1; i<numActions; i++)
	    if (value[(i+start)%numActions] > value[abest])
		abest=(i+start)%numActions;
	double delta;
	if (value[abest]>aveValue)
	    delta = parameter[deltaWin].value;
	else
	    delta = parameter[deltaLose].value;
		
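	// shift delta of probability mass from every other action to the best one;
	// an action whose probability would go negative only gives up the mass it has
	// (the shortfall is taken back out of the best action's share)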
	prob[abest] += numActions*delta;
	for (int i=0; i<numActions; i++) {
	    prob[i] -= delta;
	    if(prob[i]<0) {
		prob[abest]+=prob[i];
		prob[i]=0.0;
	    }
	}
    }
}