Kinds-of-Intelligence-CFI · benaslater · Apr 16, 2024 · Mar 22, 2024 · Apr 11, 2024 · Apr 15, 2024
diff --git a/Assets/Scripts/AAI3EnvironmentManager.cs b/Assets/Scripts/AAI3EnvironmentManager.cs
@@ -214,11 +214,6 @@ public void TriggerArenaChangeEvent(int currentArenaIndex, int totalArenas)
 		OnArenaChanged?.Invoke(currentArenaIndex, totalArenas);
 	}
 
-	public int getMaxArenaID()
-	{
-		return _arenasConfigurations.configurations.Count;
-	}
-
 	public bool GetRandomizeArenasStatus()
 	{
 		return _arenasConfigurations.randomizeArenas;
@@ -314,9 +309,14 @@ private Dictionary<string, int> RetrieveEnvironmentParameters()
 
 	#region Configuration Management Methods
 
-	public bool GetConfiguration(int arenaID, out ArenaConfiguration arenaConfiguration)
+	public ArenaConfiguration GetConfiguration(int arenaID)
 	{
-		return _arenasConfigurations.configurations.TryGetValue(arenaID, out arenaConfiguration);
+		ArenaConfiguration returnConfiguration;
+		if (!_arenasConfigurations.configurations.TryGetValue(arenaID, out returnConfiguration))
+		{
+			throw new KeyNotFoundException($"Tried to load arena {arenaID} but it did not exist");
+		}
+		return returnConfiguration;
 	}
 
 	public void AddConfiguration(int arenaID, ArenaConfiguration arenaConfiguration)

diff --git a/Assets/Scripts/ArenasParameters.cs b/Assets/Scripts/ArenasParameters.cs
@@ -141,6 +141,7 @@ public class ArenaConfiguration
 		public bool toUpdate = false;
 		public string protoString = "";
 		public int randomSeed = 0;
+		public bool mergeNextArena = false;
 
 		public ArenaConfiguration() { }
 
@@ -175,6 +176,7 @@ internal ArenaConfiguration(YAMLDefs.Arena yamlArena)
 			toUpdate = true;
 			protoString = yamlArena.ToString();
 			randomSeed = yamlArena.randomSeed;
+			this.mergeNextArena = yamlArena.mergeNextArena;
 		}
 
 		/// <summary>

diff --git a/Assets/Scripts/TrainingAgent.cs b/Assets/Scripts/TrainingAgent.cs
@@ -47,7 +47,7 @@ public class TrainingAgent : Agent, IPrefab
     private float _freezeDelay = 0f;
     private bool _isFrozen = false;
 
-    private bool _nextUpdateEpisodeEnd = false;
+    private bool _nextUpdateCompleteArena = false;
 
     [Header("Agent Notification")]
     public bool showNotification = false;
@@ -214,20 +214,20 @@ public override void Heuristic(in ActionBuffers actionsOut)
 
     #region Agent Health Methods
 
-    public void UpdateHealthNextStep(float updateAmount, bool andEndEpisode = false)
+    public void UpdateHealthNextStep(float updateAmount, bool andCompleteArena = false)
     {
         /// <summary>
         /// ML-Agents doesn't guarantee behaviour if an episode ends outside of OnActionReceived
         /// Therefore we queue any health updates to happen on the next action step.
         /// </summary>
         _nextUpdateHealth += updateAmount;
-        if (andEndEpisode)
+        if (andCompleteArena)
         {
-            _nextUpdateEpisodeEnd = true;
+            _nextUpdateCompleteArena = true;
         }
     }
 
-    public void UpdateHealth(float updateAmount, bool andEndEpisode = false)
+    public void UpdateHealth(float updateAmount, bool andCompleteArena = false)
     {
         if (NotificationManager.Instance == null && showNotification == true)
         {
@@ -260,12 +260,19 @@ public void UpdateHealth(float updateAmount, bool andEndEpisode = false)
             StartCoroutine(EndEpisodeAfterDelay());
             return;
         }
-        if (andEndEpisode || _nextUpdateEpisodeEnd)
+        if (andCompleteArena || _nextUpdateCompleteArena)
         {
+            _nextUpdateCompleteArena = false;
             float cumulativeReward = this.GetCumulativeReward();
 
             if (cumulativeReward >= Arena.CurrentPassMark)
             {
+                // If the agent passed and the next arena is merged, load it without ending the episode
+                if (_arena.mergeNextArena)
+                {
+                    _arena.LoadNextArena();
+                    return;
+                }
                 if (showNotification)
                 {
                     NotificationManager.Instance.ShowSuccessNotification();
@@ -278,7 +285,6 @@ public void UpdateHealth(float updateAmount, bool andEndEpisode = false)
                     NotificationManager.Instance.ShowFailureNotification();
                 }
             }
-            _nextUpdateEpisodeEnd = false;
             StartCoroutine(EndEpisodeAfterDelay());
         }
     }

diff --git a/Assets/Scripts/TrainingArena.cs b/Assets/Scripts/TrainingArena.cs
@@ -1,3 +1,4 @@
+using System;
 using System.Collections.Generic;
 using UnityEngine;
 using Unity.MLAgents;
@@ -40,8 +41,15 @@ public class TrainingArena : MonoBehaviour
 	private bool isFirstArenaReset = true;
 	private List<GameObject> spawnedRewards = new List<GameObject>();
 	private List<int> playedArenas = new List<int>();
+	private List<int> _mergedArenas = null;
 
 	public bool showNotification { get; set; }
+	public bool mergeNextArena
+	{
+		get {
+			return _arenaConfiguration.mergeNextArena;
+		}
+	}
 
 	public ArenaBuilder Builder
 	{
@@ -87,6 +95,25 @@ private void InitializeArenaComponents()
 		Spawner_InteractiveButton.RewardSpawned += OnRewardSpawned;
 	}
 
+	/// <summary>
+	/// Provides a list of the arenas in the current config file that are preceded by an arena with
+	/// the mergeNextArena property, so that we can avoid loading them when arenas are randomised.
+	/// </summary>
+	private List<int> GetMergedArenas()
+	{
+		List<int> mergedArenas = new List<int>();
+		int totalArenas = _environmentManager.GetTotalArenas();
+		ArenaConfiguration currentArena = _environmentManager.GetConfiguration(0);
+		bool currentlyMerged = currentArena.mergeNextArena;
+		for (int i = 1; i < totalArenas; i++)
+		{
+			if (currentlyMerged) { mergedArenas.Add(i); }
+			currentArena = _environmentManager.GetConfiguration(i);
+			currentlyMerged = currentArena.mergeNextArena;
+		}
+		return mergedArenas;
+	}
+
 	#region Arena Handling Methods
 
 	/// <summary>
@@ -99,20 +126,39 @@ public void ResetArena()
 
 		CleanUpSpawnedObjects();
 
-		DetermineNextArenaID();
+		SetNextArenaID();
+
+		// Load the new configuration
+		ArenaConfiguration newConfiguration = _environmentManager.GetConfiguration(arenaID);
+
+		ApplyNewArenaConfiguration(newConfiguration);
+
+		CleanupRewards();
+
+		NotifyArenaChange();
+	}
 
-		if (!TryLoadArenaConfiguration(out ArenaConfiguration newConfiguration))
+	public void LoadNextArena()
+	{
+		// ResetArena() must have been called at least once first, to initialise arenaID
+		if (isFirstArenaReset)
 		{
-			Debug.LogError("Failed to load arena configuration");
-			return;
+			throw new InvalidOperationException("LoadNextArena called before first reset");
 		}
 
+		Debug.Log($"Loading next arena. Previous: {arenaID}, next: {arenaID + 1}");
+		CleanUpSpawnedObjects();
+
+		arenaID += 1;
+		// Load the new configuration
+		// TODO: If mergeNextArena is set on the final arena, GetConfiguration throws KeyNotFoundException here. Validate the configuration earlier so this fails sooner in execution
+		ArenaConfiguration newConfiguration = _environmentManager.GetConfiguration(arenaID);
+
 		ApplyNewArenaConfiguration(newConfiguration);
 
 		CleanupRewards();
 
 		NotifyArenaChange();
-
 	}
 
 	private void CleanUpSpawnedObjects()
@@ -124,39 +170,55 @@ private void CleanUpSpawnedObjects()
 		}
 	}
 
-	private void DetermineNextArenaID()
+	private void SetNextArenaID()
 	{
-		int totalArenas = _environmentManager.getMaxArenaID();
+		int totalArenas = _environmentManager.GetTotalArenas();
 		bool randomizeArenas = _environmentManager.GetRandomizeArenasStatus();
 
 		if (isFirstArenaReset)
 		{
 			isFirstArenaReset = false;
-			arenaID = randomizeArenas ? Random.Range(0, totalArenas) : 0;
+			arenaID = randomizeArenas ? ChooseRandomArenaID(totalArenas) : 0;
 		}
 		else
 		{
-			arenaID = randomizeArenas ? ChooseRandomArenaID(totalArenas) : (arenaID + 1) % totalArenas;
+			if (randomizeArenas)
+			{
+				arenaID = ChooseRandomArenaID(totalArenas);
+			}
+			else
+			{
+				// If the next arena is merged, sequentially search for the next unmerged one
+				ArenaConfiguration preceedingArena = _arenaConfiguration;
+				arenaID = (arenaID + 1) % totalArenas;
+				while (preceedingArena.mergeNextArena)
+				{
+					preceedingArena = _environmentManager.GetConfiguration(arenaID);
+					arenaID = (arenaID + 1) % totalArenas;
+				}
+			}
 		}
 	}
 
 	private int ChooseRandomArenaID(int totalArenas)
 	{
+		// Populate the list of merged arenas if needed
+		if (_mergedArenas == null){ _mergedArenas = GetMergedArenas(); }
+
 		playedArenas.Add(arenaID);
 		if (playedArenas.Count >= totalArenas)
 		{
 			playedArenas = new List<int> { arenaID };
 		}
 
-		var availableArenas = Enumerable.Range(0, totalArenas).Except(playedArenas).ToList();
+		var availableArenas = Enumerable.Range(0, totalArenas).Except(playedArenas).Except(_mergedArenas).ToList();
 		return availableArenas[Random.Range(0, availableArenas.Count)];
-	}
 
-	private bool TryLoadArenaConfiguration(out ArenaConfiguration newConfiguration)
-	{
-		return _environmentManager.GetConfiguration(arenaID, out newConfiguration);
 	}
 
+	/* Note: to update the active arena to a new ID the following must be called in sequence
+	   GetConfiguration, ApplyNewArenaConfiguration, CleanupRewards, NotifyArenaChange
+	*/
 	private void ApplyNewArenaConfiguration(ArenaConfiguration newConfiguration)
 	{
 		_arenaConfiguration = newConfiguration;
@@ -175,7 +237,6 @@ private void ApplyNewArenaConfiguration(ArenaConfiguration newConfiguration)
 		{
 			Random.InitState(_arenaConfiguration.randomSeed);
 		}
-
 		Debug.Log($"TimeLimit set to: {_arenaConfiguration.TimeLimit}");
 	}
 

diff --git a/Assets/Scripts/YAMLclasses.cs b/Assets/Scripts/YAMLclasses.cs
@@ -51,6 +51,7 @@ public void SetCurrentPassMark()
 
 		public List<int> blackouts { get; set; } = new List<int>();
 		public int randomSeed { get; set; } = 0;
+		public bool mergeNextArena { get; set; } = false;
 	}
 
 	/// <summary>