add multiple food scenario
This commit is contained in:
parent
7d3d097599
commit
19d5a87ce0
|
@ -86,8 +86,10 @@ public class OpeningDialog {
|
||||||
rl = new RLControllerGUI<DinoAction>(new DinoWorld(), (Method) algorithmSelection.getSelectedItem(), DinoAction.values());
|
rl = new RLControllerGUI<DinoAction>(new DinoWorld(), (Method) algorithmSelection.getSelectedItem(), DinoAction.values());
|
||||||
} else if(selectedScenario == Scenario.JUMPING_DINO_ADVANCED) {
|
} else if(selectedScenario == Scenario.JUMPING_DINO_ADVANCED) {
|
||||||
rl = new RLControllerGUI<DinoAction>(new DinoWorldAdvanced(), (Method) algorithmSelection.getSelectedItem(), DinoAction.values());
|
rl = new RLControllerGUI<DinoAction>(new DinoWorldAdvanced(), (Method) algorithmSelection.getSelectedItem(), DinoAction.values());
|
||||||
} else if(selectedScenario == Scenario.ANTGAME) {
|
} else if(selectedScenario == Scenario.ANTGAME_ONE_FOOD) {
|
||||||
rl = new RLControllerGUI<AntAction>(new AntWorldContinuous(Constants.DEFAULT_GRID_WIDTH, Constants.DEFAULT_GRID_HEIGHT), (Method) algorithmSelection.getSelectedItem(), AntAction.values());
|
rl = new RLControllerGUI<AntAction>(new AntWorldContinuous(Constants.DEFAULT_GRID_WIDTH, Constants.DEFAULT_GRID_HEIGHT, 1), (Method) algorithmSelection.getSelectedItem(), AntAction.values());
|
||||||
|
} else if(selectedScenario == Scenario.ANTGAME_TWO_FOOD) {
|
||||||
|
rl = new RLControllerGUI<AntAction>(new AntWorldContinuous(Constants.DEFAULT_GRID_WIDTH, Constants.DEFAULT_GRID_HEIGHT, 2), (Method) algorithmSelection.getSelectedItem(), AntAction.values());
|
||||||
} else if(selectedScenario == Scenario.BLACKJACK) {
|
} else if(selectedScenario == Scenario.BLACKJACK) {
|
||||||
rl = new RLControllerGUI<PlayerAction>(new BlackJackTable(), (Method) algorithmSelection.getSelectedItem(), PlayerAction.values());
|
rl = new RLControllerGUI<PlayerAction>(new BlackJackTable(), (Method) algorithmSelection.getSelectedItem(), PlayerAction.values());
|
||||||
} else {
|
} else {
|
||||||
|
@ -107,7 +109,8 @@ public class OpeningDialog {
|
||||||
private enum Scenario {
|
private enum Scenario {
|
||||||
JUMPING_DINO_SIMPLE,
|
JUMPING_DINO_SIMPLE,
|
||||||
JUMPING_DINO_ADVANCED,
|
JUMPING_DINO_ADVANCED,
|
||||||
ANTGAME,
|
ANTGAME_ONE_FOOD,
|
||||||
|
ANTGAME_TWO_FOOD,
|
||||||
BLACKJACK
|
BLACKJACK
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -36,12 +36,14 @@ public class AntWorld implements Environment<AntAction>, Visualizable {
|
||||||
* various lectures could be possible as well.
|
* various lectures could be possible as well.
|
||||||
*/
|
*/
|
||||||
protected AntAgent antAgent;
|
protected AntAgent antAgent;
|
||||||
|
protected int numberOfConcurrentFood;
|
||||||
|
|
||||||
protected int tick;
|
protected int tick;
|
||||||
private int maxEpisodeTicks;
|
private int maxEpisodeTicks;
|
||||||
|
|
||||||
public AntWorld(int width, int height) {
|
public AntWorld(int width, int height, int numberOfConcurrentFood) {
|
||||||
grid = new Grid(width, height);
|
this.numberOfConcurrentFood = numberOfConcurrentFood;
|
||||||
|
grid = new Grid(width, height, numberOfConcurrentFood);
|
||||||
antAgent = new AntAgent(width, height);
|
antAgent = new AntAgent(width, height);
|
||||||
myAnt = new Ant();
|
myAnt = new Ant();
|
||||||
maxEpisodeTicks = 1000;
|
maxEpisodeTicks = 1000;
|
||||||
|
@ -49,7 +51,7 @@ public class AntWorld implements Environment<AntAction>, Visualizable {
|
||||||
}
|
}
|
||||||
|
|
||||||
public AntWorld(){
|
public AntWorld(){
|
||||||
this(Constants.DEFAULT_GRID_WIDTH, Constants.DEFAULT_GRID_HEIGHT);
|
this(Constants.DEFAULT_GRID_WIDTH, Constants.DEFAULT_GRID_HEIGHT, Constants.DEFAULT_CONCURRENT_FOOD);
|
||||||
}
|
}
|
||||||
|
|
||||||
protected StepCalculation processStep(AntAction action) {
|
protected StepCalculation processStep(AntAction action) {
|
||||||
|
@ -62,7 +64,7 @@ public class AntWorld implements Environment<AntAction>, Visualizable {
|
||||||
sc.stayOnCell = true;
|
sc.stayOnCell = true;
|
||||||
// flag to enable a check if all food has been collected only fired if food was dropped
|
// flag to enable a check if all food has been collected only fired if food was dropped
|
||||||
// on the starting position
|
// on the starting position
|
||||||
sc.checkCompletion = false;
|
sc.foodCollected = false;
|
||||||
|
|
||||||
switch(action) {
|
switch(action) {
|
||||||
case MOVE_UP:
|
case MOVE_UP:
|
||||||
|
@ -110,7 +112,7 @@ public class AntWorld implements Environment<AntAction>, Visualizable {
|
||||||
} else {
|
} else {
|
||||||
sc.reward = Reward.FOOD_DROP_DOWN_SUCCESS;
|
sc.reward = Reward.FOOD_DROP_DOWN_SUCCESS;
|
||||||
myAnt.setPoints(myAnt.getPoints() + 1);
|
myAnt.setPoints(myAnt.getPoints() + 1);
|
||||||
sc.checkCompletion = true;
|
sc.foodCollected = true;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
break;
|
break;
|
||||||
|
@ -140,13 +142,9 @@ public class AntWorld implements Environment<AntAction>, Visualizable {
|
||||||
if(!sc.stayOnCell) {
|
if(!sc.stayOnCell) {
|
||||||
myAnt.getPos().setLocation(sc.potentialNextPos);
|
myAnt.getPos().setLocation(sc.potentialNextPos);
|
||||||
antAgent.getCell(myAnt.getPos());// the ant will move to a cell that was previously unknown
|
antAgent.getCell(myAnt.getPos());// the ant will move to a cell that was previously unknown
|
||||||
// TODO: not optimal for going straight for food
|
|
||||||
// sc.reward = Reward.UNKNOWN_FIELD_EXPLORED;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if(sc.foodCollected) {
|
||||||
|
|
||||||
if(sc.checkCompletion) {
|
|
||||||
sc.done = grid.isAllFoodCollected();
|
sc.done = grid.isAllFoodCollected();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -181,7 +179,7 @@ public class AntWorld implements Environment<AntAction>, Visualizable {
|
||||||
boolean stayOnCell = true;
|
boolean stayOnCell = true;
|
||||||
// flag to enable a check if all food has been collected only fired if food was dropped
|
// flag to enable a check if all food has been collected only fired if food was dropped
|
||||||
// on the starting position
|
// on the starting position
|
||||||
boolean checkCompletion = false;
|
boolean foodCollected = false;
|
||||||
}
|
}
|
||||||
|
|
||||||
public State reset() {
|
public State reset() {
|
||||||
|
|
|
@ -4,8 +4,8 @@ import core.State;
|
||||||
import core.StepResultEnvironment;
|
import core.StepResultEnvironment;
|
||||||
|
|
||||||
public class AntWorldContinuous extends AntWorld {
|
public class AntWorldContinuous extends AntWorld {
|
||||||
public AntWorldContinuous(int width, int height) {
|
public AntWorldContinuous(int width, int height, int numberOfConcurrentFood) {
|
||||||
super(width, height);
|
super(width, height, numberOfConcurrentFood);
|
||||||
}
|
}
|
||||||
|
|
||||||
public AntWorldContinuous() {
|
public AntWorldContinuous() {
|
||||||
|
@ -14,13 +14,15 @@ public class AntWorldContinuous extends AntWorld {
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public StepResultEnvironment step(AntAction action) {
|
public StepResultEnvironment step(AntAction action) {
|
||||||
Cell currentCell = grid.getCell(myAnt.getPos());
|
|
||||||
|
|
||||||
StepCalculation sc = processStep(action);
|
StepCalculation sc = processStep(action);
|
||||||
|
|
||||||
// flag is set to true if food gets dropped onto starts
|
// flag is set to true if food gets dropped onto starts
|
||||||
if(sc.checkCompletion) {
|
if(sc.foodCollected) {
|
||||||
grid.spawnNewFood();
|
grid.removeAllFood();
|
||||||
|
System.out.println(numberOfConcurrentFood);
|
||||||
|
for(int i = 0; i < numberOfConcurrentFood; ++i) {
|
||||||
|
grid.spawnNewFood();
|
||||||
|
}
|
||||||
}
|
}
|
||||||
// valid movement
|
// valid movement
|
||||||
if(!sc.stayOnCell) {
|
if(!sc.stayOnCell) {
|
||||||
|
|
|
@ -3,8 +3,8 @@ package evironment.antGame;
|
||||||
import core.State;
|
import core.State;
|
||||||
|
|
||||||
public class AntWorldContinuousOriginalState extends AntWorldContinuous {
|
public class AntWorldContinuousOriginalState extends AntWorldContinuous {
|
||||||
public AntWorldContinuousOriginalState(int width, int height) {
|
public AntWorldContinuousOriginalState(int width, int height, int numberOfConcurrentFood) {
|
||||||
super(width, height);
|
super(width, height, numberOfConcurrentFood);
|
||||||
}
|
}
|
||||||
|
|
||||||
public AntWorldContinuousOriginalState() {
|
public AntWorldContinuousOriginalState() {
|
||||||
|
|
|
@ -1,6 +1,7 @@
|
||||||
package evironment.antGame;
|
package evironment.antGame;
|
||||||
|
|
||||||
public class Constants {
|
public class Constants {
|
||||||
|
public static final int DEFAULT_CONCURRENT_FOOD = 1;
|
||||||
public static final int DEFAULT_GRID_WIDTH = 8;
|
public static final int DEFAULT_GRID_WIDTH = 8;
|
||||||
public static final int DEFAULT_GRID_HEIGHT = 8;
|
public static final int DEFAULT_GRID_HEIGHT = 8;
|
||||||
public static final int START_X = 5;
|
public static final int START_X = 5;
|
||||||
|
|
|
@ -10,10 +10,12 @@ public class Grid {
|
||||||
private Point start;
|
private Point start;
|
||||||
private Cell[][] grid;
|
private Cell[][] grid;
|
||||||
private Cell[][] initialGrid;
|
private Cell[][] initialGrid;
|
||||||
|
private int numberOfConcurrentFood;
|
||||||
|
|
||||||
public Grid(int width, int height) {
|
public Grid(int width, int height, int numberOfConcurrentFood) {
|
||||||
this.width = width;
|
this.width = width;
|
||||||
this.height = height;
|
this.height = height;
|
||||||
|
this.numberOfConcurrentFood = numberOfConcurrentFood;
|
||||||
grid = new Cell[width][height];
|
grid = new Cell[width][height];
|
||||||
initialGrid = new Cell[width][height];
|
initialGrid = new Cell[width][height];
|
||||||
start = new Point(Constants.START_X, Constants.START_Y);
|
start = new Point(Constants.START_X, Constants.START_Y);
|
||||||
|
@ -32,7 +34,9 @@ public class Grid {
|
||||||
}
|
}
|
||||||
spawnObstacles();
|
spawnObstacles();
|
||||||
initialGrid[start.x][start.y] = new Cell(new Point(start.x, start.y), CellType.START);
|
initialGrid[start.x][start.y] = new Cell(new Point(start.x, start.y), CellType.START);
|
||||||
spawnNewFood(initialGrid);
|
for(int i = 0; i < numberOfConcurrentFood; ++i) {
|
||||||
|
spawnNewFood(initialGrid);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
//TODO
|
//TODO
|
||||||
|
@ -70,6 +74,14 @@ public class Grid {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public void removeAllFood() {
|
||||||
|
for(int x = 0; x < width; ++x) {
|
||||||
|
for(int y = 0; y < height; ++y) {
|
||||||
|
grid[x][y].setFood(0);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
public void spawnNewFood() {
|
public void spawnNewFood() {
|
||||||
spawnNewFood(grid);
|
spawnNewFood(grid);
|
||||||
}
|
}
|
||||||
|
|
|
@ -11,7 +11,7 @@ public class ContinuousAnt {
|
||||||
public static void main(String[] args) {
|
public static void main(String[] args) {
|
||||||
RNG.setSeed(13, true);
|
RNG.setSeed(13, true);
|
||||||
RLController<AntAction> rl = new RLControllerGUI<>(
|
RLController<AntAction> rl = new RLControllerGUI<>(
|
||||||
new AntWorldContinuous(8, 8),
|
new AntWorldContinuous(8, 8, 1),
|
||||||
Method.Q_LEARNING_OFF_POLICY_CONTROL,
|
Method.Q_LEARNING_OFF_POLICY_CONTROL,
|
||||||
AntAction.values());
|
AntAction.values());
|
||||||
rl.setDelay(200);
|
rl.setDelay(200);
|
||||||
|
|
|
@ -12,7 +12,7 @@ public class RunningAnt {
|
||||||
RNG.setSeed(56);
|
RNG.setSeed(56);
|
||||||
|
|
||||||
RLController<AntAction> rl = new RLControllerGUI<>(
|
RLController<AntAction> rl = new RLControllerGUI<>(
|
||||||
new AntWorld(8, 8),
|
new AntWorld(8, 8, 1),
|
||||||
Method.Q_LEARNING_OFF_POLICY_CONTROL,
|
Method.Q_LEARNING_OFF_POLICY_CONTROL,
|
||||||
AntAction.values());
|
AntAction.values());
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue