Context Navigation

← Previous Changeset
Next Changeset →

Changeset 24962

Timestamp:

Feb 28, 2021, 1:16:32 PM (3 years ago)

Author:

wraitii

Message:

Add an 'Evaluate' RL endpoint, intended for dynamic game balancing

This adds a new endpoint to the RL interface for evaluating custom JavaScript. When combined with the ability to create arbitrary modifiers, this provides the required functionality for exploring quantitative game balancing.

Patch By: irishninja

Fixes #5981

Differential Revision: https://code.wildfiregames.com/D3479

Location:

ps/trunk/source

Files:

: 2 added
: 5 edited

rlinterface/RLInterface.cpp (modified) (7 diffs)
rlinterface/RLInterface.h (modified) (8 diffs)
tools/rlclient/python/tests/fastactions.js (added)
tools/rlclient/python/tests/test_actions.py (modified) (1 diff)
tools/rlclient/python/tests/test_evaluate.py (added)
tools/rlclient/python/zero_ad/api.py (modified) (1 diff)
tools/rlclient/python/zero_ad/environment.py (modified) (1 diff)

Legend:

: Unmodified
: Added
: Removed

ps/trunk/source/rlinterface/RLInterface.cpp

-              r24844
+              r24962
     m_GameMessage = std::move(msg);
     m_MsgApplied.wait(msgLock, [this]() { return m_GameMessage.type == GameMessageType::None; });
     return m_GameState;
+    return m_ReturnValue;
+}
 …
     m_ScenarioConfig = std::move(scenario);
     return SendGameMessage({ GameMessageType::Reset });
+}
 …
                 stream << gameState.c_str();
+        }
         else if (uri == "/templates")
+        {
 …
     if (m_NeedsGameState && isGameStarted)
+    {
         m_GameState = GetGameState();
+        m_ReturnValue = GetGameState();
         m_MsgApplied.notify_one();
         m_MsgLock.unlock();
 …
                 LDR_NonprogressiveLoad();
                 ENSURE(g_Game->ReallyStartGame() == PSRETURN_OK);
                 m_GameState = GetGameState();
+                m_ReturnValue = GetGameState();
                 m_MsgApplied.notify_one();
                 m_MsgLock.unlock();
 …
             if (!g_Game)
+            {
                 m_GameState = EMPTY_STATE;
+                m_ReturnValue = EMPTY_STATE;
                 m_MsgApplied.notify_one();
                 m_MsgLock.unlock();
 …
                 g_Game->Update(deltaRealTime);
             m_GameState = GetGameState();
+            m_ReturnValue = GetGameState();
             m_MsgApplied.notify_one();
             m_MsgLock.unlock();
             break;
+        }
         default:
         break;

ps/trunk/source/rlinterface/RLInterface.h

-              r24839
+              r24962
 /* Copyright (C) 2020 Wildfire Games.
+/* Copyright (C) 2021 Wildfire Games.
  * This file is part of 0 A.D.
+ *
 …
     Reset,
     Commands,
 };
 …
  *  0. The game/main thread calls TryApplyMessage()
  *    - If no messages are pending, GOTO 0 (the simulation is not advanced).
  *  1. TryApplyMessage locks m_MsgLock, pulls the message, processes it, advances the simulation, and sets m_GameState.
+ *  1. TryApplyMessage locks m_MsgLock, pulls the message, processes it, advances the simulation, and sets m_ReturnValue.
  *  2. TryApplyMessage notifies the RL thread that it can carry on and unlocks m_MsgLock. The main thread carries on frame rendering and goes back to 0.
  *  3. The RL thread locks m_MsgLock, reads m_GameState, unlocks m_MsgLock, and sends the gamestate as HTTP Response to the RL client.
+ *  3. The RL thread locks m_MsgLock, reads m_ReturnValue, unlocks m_MsgLock, and sends the gamestate as HTTP Response to the RL client.
  *  4. The client processes the response and ultimately sends a new HTTP message to the RL Interface.
  *  5. The RL thread locks m_MsgLock, pushes the message, and starts waiting on the game/main thread to notify it (step 2).
 …
     /**
      * Non-blocking call to process any pending messages from the RL client.
      * Updates m_GameState to the gamestate after messages have been processed.
+     * Updates m_ReturnValue to the gamestate after messages have been processed.
      */
     void TryApplyMessage();
 …
      */
     std::string Reset(ScenarioConfig&& scenario);
     /**
 …
     /**
      * Process any pending messages from the RL client.
      * Updates m_GameState to the gamestate after messages have been processed.
+     * Updates m_ReturnValue to the gamestate after messages have been processed.
      */
     void ApplyMessage(const GameMessage& msg);
 …
     GameMessage m_GameMessage;
     ScenarioConfig m_ScenarioConfig;
     std::string m_GameState;
+    std::string m_ReturnValue;
     bool m_NeedsGameState = false;
 …
     std::mutex m_MsgLock;
     std::condition_variable m_MsgApplied;
 };

ps/trunk/source/tools/rlclient/python/tests/test_actions.py

-              r24816
+              r24962
 def test_attack():
     state = game.reset(config)
     units = state.units(owner=1, type='cavalry')
+    unit = state.units(owner=1, type='cavalry')[0]
     target = state.units(owner=2, type='female_citizen')[0]
+    initial_health = target.health()
+    initial_health_target = target.health()
+    initial_health_unit = unit.health()
     state = game.step([zero_ad.actions.reveal_map()])
     attack = zero_ad.actions.attack(units, target)
+    attack = zero_ad.actions.attack([unit], target)
     state = game.step([attack])
+    while state.unit(target.id()).health() >= initial_health:
+    while (state.unit(target.id()).health() >= initial_health_target
+        ) and (state.unit(unit.id()).health() >= initial_health_unit):
         state = game.step()

ps/trunk/source/tools/rlclient/python/zero_ad/api.py

r23917	r24962
28	28	response = self.post('templates', post_data)
29	29	return zip(names, response.decode().split('\n'))
	30
	31
	32
	33

ps/trunk/source/tools/rlclient/python/zero_ad/environment.py

-              r23917
+              r24962
         self.current_state = GameState(json.loads(state_json), self)
         return self.current_state
     def get_template(self, name):

Note: See TracChangeset for help on using the changeset viewer.