atari_py/ale_interface/src/games/supported/Gopher.cpp (87 lines of code) (raw):

/* *****************************************************************************
 * The method lives() is based on Xitari's code, from Google Inc.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License version 2
 * as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 * *****************************************************************************
 * A.L.E (Arcade Learning Environment)
 * Copyright (c) 2009-2013 by Yavar Naddaf, Joel Veness, Marc G. Bellemare and
 * the Reinforcement Learning and Artificial Intelligence Laboratory
 * Released under the GNU General Public License; see License.txt for details.
 *
 * Based on: Stella -- "An Atari 2600 VCS Emulator"
 * Copyright (c) 1995-2007 by Bradford W. Mott and the Stella team
 *
 * *****************************************************************************
 */
#include "Gopher.hpp"

#include "../RomUtils.hpp"

/* construct the settings in their initial (reset) state */
GopherSettings::GopherSettings() {
    reset();
}

/* create a new instance of the rom
 *
 * Returns a heap-allocated copy of this object; the caller receives a raw
 * owning pointer.
 *
 * The copy is made with the GopherSettings copy constructor. Assigning
 * through a RomSettings reference (`*rval = *this` with `rval` typed as
 * RomSettings*) would only run the base-class assignment and leave the
 * Gopher-specific fields (reward, score, terminal flag, lives) at their
 * freshly reset values. */
RomSettings* GopherSettings::clone() const {
    return new GopherSettings(*this);
}

/* process the latest information from ALE
 *
 * Reads the score and the carrot bits from console RAM and refreshes the
 * reward, score, terminal flag and lives counter accordingly. */
void GopherSettings::step(const System& system) {
    // update the reward: difference between the new and the previous score
    int score = getDecimalScore(0xB2, 0xB1, 0xB0, &system);
    m_reward = score - m_score;
    m_score = score;

    // update terminal status: the low three bits of RAM 0xB4 are the carrot
    // bits; the episode ends once none of them is set
    int carrot_bits = readRam(&system, 0xB4) & 0x7;
    m_terminal = carrot_bits == 0;

    // A very crude popcount: entry i is the number of set bits in i (0..7),
    // so the index is always in range thanks to the 0x7 mask above
    static const int livesFromCarrots[] = {0, 1, 1, 2, 1, 2, 2, 3};
    m_lives = livesFromCarrots[carrot_bits];
}

/* is end of game */
bool GopherSettings::isTerminal() const {
    return m_terminal;
}

/* get the most recently observed reward */
reward_t GopherSettings::getReward() const {
    return m_reward;
}

/* is an action part of the minimal set? */
bool GopherSettings::isMinimal(const Action &a) const {
    switch (a) {
        case PLAYER_A_NOOP:
        case PLAYER_A_FIRE:
        case PLAYER_A_UP:
        case PLAYER_A_RIGHT:
        case PLAYER_A_LEFT:
        case PLAYER_A_UPFIRE:
        case PLAYER_A_RIGHTFIRE:
        case PLAYER_A_LEFTFIRE:
            return true;
        default:
            return false;
    }
}

/* reset the state of the game */
void GopherSettings::reset() {
    m_reward = 0;
    m_score = 0;
    m_terminal = false;
    m_lives = 3;
}

/* saves the state of the rom settings
 *
 * Field order must match loadState(): reward, score, terminal, lives. */
void GopherSettings::saveState(Serializer & ser) {
    ser.putInt(m_reward);
    ser.putInt(m_score);
    ser.putBool(m_terminal);
    ser.putInt(m_lives);
}

/* loads the state of the rom settings
 *
 * Reads the fields in the order saveState() wrote them. */
void GopherSettings::loadState(Deserializer & ser) {
    m_reward = ser.getInt();
    m_score = ser.getInt();
    m_terminal = ser.getBool();
    m_lives = ser.getInt();
}

/* returns the actions to apply at the start of a game: a single FIRE */
ActionVect GopherSettings::getStartingActions() {
    ActionVect startingActions;
    startingActions.push_back(PLAYER_A_FIRE);
    return startingActions;
}

/* returns a list of mode that the game can be played in */
ModeVect GopherSettings::getAvailableModes() {
    ModeVect modes = {0, 2};
    return modes;
}

/* set the mode of the game
 * the given mode must be one returned by getAvailableModes()
 *
 * Throws std::runtime_error when `m` is neither 0 nor 2. */
void GopherSettings::setMode(game_mode_t m, System &system,
                             std::unique_ptr<StellaEnvironmentWrapper> environment) {
    if (m != 0 && m != 2) {
        throw std::runtime_error("This mode doesn't currently exist for this game");
    }

    environment->softReset();

    // read the mode we are currently in
    unsigned char mode = readRam(&system, 0xD3);

    // press select until the correct mode is reached
    // NOTE(review): the loop has no iteration bound; it relies on RAM 0xD3
    // eventually reporting the requested mode -- confirm against the ROM.
    while (mode != m) {
        environment->pressSelect(5);
        mode = readRam(&system, 0xD3);
    }

    // reset the environment to apply changes.
    environment->softReset();
}

/* returns the list of difficulties the game can be played at */
DifficultyVect GopherSettings::getAvailableDifficulties() {
    DifficultyVect diff = {0, 1};
    return diff;
}