1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
/* *****************************************************************************
* A.L.E (Arcade Learning Environment)
* Copyright (c) 2009-2013 by Yavar Naddaf, Joel Veness, Marc G. Bellemare and
* the Reinforcement Learning and Artificial Intelligence Laboratory
* Released under the GNU General Public License; see License.txt for details.
*
* Based on: Stella -- "An Atari 2600 VCS Emulator"
* Copyright (c) 1995-2007 by Bradford W. Mott and the Stella team
*
* *****************************************************************************
*/
#include "Pong.hpp"
#include "../RomUtils.hpp"
namespace ale {
/* Build the settings object and put it into its reset state. */
PongSettings::PongSettings() {
  reset();
}
/*
 * Create a new instance of the rom settings that is a copy of this one.
 *
 * The copy is made with the PongSettings copy constructor so that the
 * derived-class state (m_reward, m_score, m_terminal) is carried over.
 * Default-constructing and then assigning through a RomSettings reference
 * would run only the base-class assignment operator and leave those members
 * at their reset values.
 *
 * The returned object is allocated with `new` and is not released here.
 */
RomSettings* PongSettings::clone() const {
  return new PongSettings(*this);
}
/* process the latest information from ALE */
void PongSettings::step(const System& system) {
// update the reward
int x = readRam(&system, 13); // cpu score
int y = readRam(&system, 14); // player score
reward_t score = y - x;
m_reward = score - m_score;
m_score = score;
// update terminal status
// (game over when a player reaches 21)
m_terminal = x == 21 || y == 21;
}
/* Report whether the game has ended, as recorded in m_terminal. */
bool PongSettings::isTerminal() const { return m_terminal; }
/* Return the reward currently stored in m_reward. */
reward_t PongSettings::getReward() const {
  return m_reward;
}
/* Tell whether an action belongs to the minimal action set for this game.
 * Only the six player-A actions listed below qualify; everything else is
 * rejected. */
bool PongSettings::isMinimal(const Action& a) const {
  return a == PLAYER_A_NOOP ||
         a == PLAYER_A_FIRE ||
         a == PLAYER_A_RIGHT ||
         a == PLAYER_A_LEFT ||
         a == PLAYER_A_RIGHTFIRE ||
         a == PLAYER_A_LEFTFIRE;
}
/* Return the tracked game state to its initial values: not terminal,
 * zero score and zero reward. */
void PongSettings::reset() {
  m_terminal = false;
  m_score = 0;
  m_reward = 0;
}
/* Write the rom-settings state to the serializer.
 * The fields are emitted as reward, score, terminal flag; loadState reads
 * them back in the same order. */
void PongSettings::saveState(Serializer& ser) {
  // Two integers first ...
  ser.putInt(m_reward);
  ser.putInt(m_score);
  // ... followed by the end-of-game flag.
  ser.putBool(m_terminal);
}
// Restore the rom-settings state from the deserializer.
// The fields are consumed in the order saveState writes them:
// reward, score, terminal flag.
void PongSettings::loadState(Deserializer& ser) {
  // Two integers first ...
  m_reward = ser.getInt();
  m_score = ser.getInt();
  // ... followed by the end-of-game flag.
  m_terminal = ser.getBool();
}
// Return the list of modes the game can be played in.
// The list holds the consecutive values 0 .. getNumModes() - 1.
ModeVect PongSettings::getAvailableModes() {
  ModeVect modes(getNumModes());
  // Fill each slot with its own position in the list.
  unsigned int index = 0;
  for (auto& slot : modes) {
    slot = index++;
  }
  return modes;
}
// Switch the game to mode `m`.
// `m` must be one of the values returned by getAvailableModes(); any value
// not below getNumModes() is rejected with std::runtime_error.
// `environment` is taken by value, so the wrapper is owned by this call.
void PongSettings::setMode(
    game_mode_t m, System& system,
    std::unique_ptr<StellaEnvironmentWrapper> environment) {
  // Reject unknown modes before touching the emulator.
  if (m >= getNumModes()) {
    throw std::runtime_error("This mode doesn't currently exist for this game");
  }

  // The current mode is read from RAM address 0x96; keep pressing select
  // and re-reading until it matches the requested one.
  for (unsigned char current = readRam(&system, 0x96); current != m;
       current = readRam(&system, 0x96)) {
    environment->pressSelect(2);
  }

  // Reset the environment to apply the change.
  environment->softReset();
}
// Return the difficulty settings available for this game: 0 and 1.
DifficultyVect PongSettings::getAvailableDifficulties() {
  return {0, 1};
}
} // namespace ale