123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819 |
- using UnityEngine;
- using NUnit.Framework;
- using System.Reflection;
-
- namespace MLAgents.Tests
- {
- public class TestAcademy : Academy
- {
- public int initializeAcademyCalls;
- public int academyResetCalls;
- public int AcademyStepCalls;
-
- public override void InitializeAcademy()
- {
- initializeAcademyCalls += 1;
- }
- public override void AcademyReset()
- {
- academyResetCalls += 1;
- }
-
- public override void AcademyStep()
- {
- AcademyStepCalls += 1;
- }
- }
- public class TestAgent : Agent
- {
- public int initializeAgentCalls;
- public int collectObservationsCalls;
- public int agentActionCalls;
- public int agentResetCalls;
- public int agentOnDoneCalls;
- public override void InitializeAgent()
- {
- initializeAgentCalls += 1;
- }
- public override void CollectObservations()
- {
- collectObservationsCalls += 1;
- }
-
- public override void AgentAction(float[] vectorAction, string textAction)
- {
- agentActionCalls += 1;
- AddReward(0.1f);
- }
-
- public override void AgentReset()
- {
- agentResetCalls += 1;
- }
-
- public override void AgentOnDone()
- {
- agentOnDoneCalls += 1;
- }
- }
-
- // This is an empty class for testing the behavior of agents and academy
- // It is left empty because we are not testing any brain behavior
- public class TestBrain : Brain
- {
- public int numberOfCallsToInitialize = 0;
- public int numberOfCallsToDecideAction = 0;
- public static TestBrain Instantiate()
- {
- return CreateInstance<TestBrain>();
- }
-
- protected override void Initialize()
- {
- numberOfCallsToInitialize++;
- }
-
- protected override void DecideAction()
- {
- numberOfCallsToDecideAction++;
- agentInfos.Clear();
- }
- }
-
-
- public class EditModeTestGeneration
- {
- [Test]
- public void TestAcademy()
- {
- // Use the Assert class to test conditions.
- GameObject acaGO = new GameObject("TestAcademy");
- acaGO.AddComponent<TestAcademy>();
- TestAcademy aca = acaGO.GetComponent<TestAcademy>();
- Assert.AreNotEqual(null, aca);
- Assert.AreEqual(0, aca.initializeAcademyCalls);
- Assert.AreEqual(0, aca.GetEpisodeCount());
- Assert.AreEqual(0, aca.GetStepCount());
- }
-
- [Test]
- public void TestAgent()
- {
- GameObject agentGO = new GameObject("TestAgent");
- agentGO.AddComponent<TestAgent>();
- TestAgent agent = agentGO.GetComponent<TestAgent>();
- Assert.AreNotEqual(null, agent);
- Assert.AreEqual(0, agent.initializeAgentCalls);
- }
- }
-
- public class EditModeTestInitialization
- {
-
- private Brain GenerateTestBrain()
- {
- return ScriptableObject.CreateInstance<TestBrain>();
- }
-
- [Test]
- public void TestAcademy()
- {
- GameObject acaGO = new GameObject("TestAcademy");
- acaGO.AddComponent<TestAcademy>();
- TestAcademy aca = acaGO.GetComponent<TestAcademy>();
- Assert.AreEqual(0, aca.initializeAcademyCalls);
- Assert.AreEqual(0, aca.GetStepCount());
- Assert.AreEqual(0, aca.GetEpisodeCount());
- Assert.AreEqual(false, aca.IsDone());
- //This will call the method even though it is private
- MethodInfo AcademyInitializeMethod = typeof(Academy).GetMethod("InitializeEnvironment",
- BindingFlags.Instance | BindingFlags.NonPublic);
- AcademyInitializeMethod.Invoke(aca, new object[] { });
- Assert.AreEqual(1, aca.initializeAcademyCalls);
- Assert.AreEqual(0, aca.GetEpisodeCount());
- Assert.AreEqual(0, aca.GetStepCount());
- Assert.AreEqual(false, aca.IsDone());
- Assert.AreEqual(0, aca.academyResetCalls);
- Assert.AreEqual(0, aca.AcademyStepCalls);
- }
-
- [Test]
- public void TestAgent()
- {
- GameObject agentGO1 = new GameObject("TestAgent");
- agentGO1.AddComponent<TestAgent>();
- TestAgent agent1 = agentGO1.GetComponent<TestAgent>();
- GameObject agentGO2 = new GameObject("TestAgent");
- agentGO2.AddComponent<TestAgent>();
- TestAgent agent2 = agentGO2.GetComponent<TestAgent>();
- GameObject acaGO = new GameObject("TestAcademy");
- acaGO.AddComponent<TestAcademy>();
- TestAcademy aca = acaGO.GetComponent<TestAcademy>();
- TestBrain brain = TestBrain.Instantiate();
- brain.brainParameters = new BrainParameters();
- brain.brainParameters.vectorObservationSize = 0;
- agent1.GiveBrain(brain);
- agent2.GiveBrain(brain);
-
- Assert.AreEqual(false, agent1.IsDone());
- Assert.AreEqual(false, agent2.IsDone());
- Assert.AreEqual(0, agent1.agentResetCalls);
- Assert.AreEqual(0, agent2.agentResetCalls);
- Assert.AreEqual(0, agent1.initializeAgentCalls);
- Assert.AreEqual(0, agent2.initializeAgentCalls);
- Assert.AreEqual(0, agent1.agentActionCalls);
- Assert.AreEqual(0, agent2.agentActionCalls);
-
- MethodInfo AgentEnableMethod = typeof(Agent).GetMethod("OnEnableHelper",
- BindingFlags.Instance | BindingFlags.NonPublic);
- MethodInfo AcademyInitializeMethod = typeof(Academy).GetMethod("InitializeEnvironment",
- BindingFlags.Instance | BindingFlags.NonPublic);
-
-
- AgentEnableMethod.Invoke(agent2, new object[] { aca });
- AcademyInitializeMethod.Invoke(aca, new object[] { });
- AgentEnableMethod.Invoke(agent1, new object[] { aca });
-
- Assert.AreEqual(false, agent1.IsDone());
- Assert.AreEqual(false, agent2.IsDone());
- // agent1 was not enabled when the academy started
- // The agents have been initialized
- Assert.AreEqual(0, agent1.agentResetCalls);
- Assert.AreEqual(0, agent2.agentResetCalls);
- Assert.AreEqual(1, agent1.initializeAgentCalls);
- Assert.AreEqual(1, agent2.initializeAgentCalls);
- Assert.AreEqual(0, agent1.agentActionCalls);
- Assert.AreEqual(0, agent2.agentActionCalls);
- }
-
- }
-
- public class EditModeTestStep
- {
- [Test]
- public void TestAcademy()
- {
- GameObject acaGO = new GameObject("TestAcademy");
- acaGO.AddComponent<TestAcademy>();
- TestAcademy aca = acaGO.GetComponent<TestAcademy>();
- MethodInfo AcademyInitializeMethod = typeof(Academy).GetMethod("InitializeEnvironment",
- BindingFlags.Instance | BindingFlags.NonPublic);
- AcademyInitializeMethod.Invoke(aca, new object[] { });
-
- MethodInfo AcademyStepMethod = typeof(Academy).GetMethod("EnvironmentStep",
- BindingFlags.Instance | BindingFlags.NonPublic);
-
- int numberReset = 0;
- for (int i = 0; i < 10; i++)
- {
- Assert.AreEqual(1, aca.initializeAcademyCalls);
- Assert.AreEqual(numberReset, aca.GetEpisodeCount());
- Assert.AreEqual(i, aca.GetStepCount());
- Assert.AreEqual(false, aca.IsDone());
- Assert.AreEqual(numberReset, aca.academyResetCalls);
- Assert.AreEqual(i, aca.AcademyStepCalls);
-
- // The reset happens at the begining of the first step
- if (i == 0)
- {
- numberReset += 1;
- }
- AcademyStepMethod.Invoke((object)aca, new object[] { });
- }
- }
-
- [Test]
- public void TestAgent()
- {
- GameObject agentGO1 = new GameObject("TestAgent");
- agentGO1.AddComponent<TestAgent>();
- TestAgent agent1 = agentGO1.GetComponent<TestAgent>();
- GameObject agentGO2 = new GameObject("TestAgent");
- agentGO2.AddComponent<TestAgent>();
- TestAgent agent2 = agentGO2.GetComponent<TestAgent>();
- GameObject acaGO = new GameObject("TestAcademy");
- acaGO.AddComponent<TestAcademy>();
- TestAcademy aca = acaGO.GetComponent<TestAcademy>();
- TestBrain brain = TestBrain.Instantiate();
-
-
- MethodInfo AgentEnableMethod = typeof(Agent).GetMethod(
- "OnEnableHelper", BindingFlags.Instance | BindingFlags.NonPublic);
- MethodInfo AcademyInitializeMethod = typeof(Academy).GetMethod(
- "InitializeEnvironment", BindingFlags.Instance | BindingFlags.NonPublic);
-
- agent1.agentParameters = new AgentParameters();
- agent2.agentParameters = new AgentParameters();
- brain.brainParameters = new BrainParameters();
- // We use event based so the agent will now try to send anything to the brain
- agent1.agentParameters.onDemandDecision = false;
- agent1.agentParameters.numberOfActionsBetweenDecisions = 2;
- // agent1 will take an action at every step and request a decision every 2 steps
- agent2.agentParameters.onDemandDecision = true;
- // agent2 will request decisions only when RequestDecision is called
- brain.brainParameters.vectorObservationSize = 0;
- brain.brainParameters.cameraResolutions = new Resolution[0];
- agent1.GiveBrain(brain);
- agent2.GiveBrain(brain);
-
- AgentEnableMethod.Invoke(agent1, new object[] { aca });
- AcademyInitializeMethod.Invoke(aca, new object[] { });
-
- MethodInfo AcademyStepMethod = typeof(Academy).GetMethod(
- "EnvironmentStep", BindingFlags.Instance | BindingFlags.NonPublic);
-
- int numberAgent1Reset = 0;
- int numberAgent2Initialization = 0;
- int requestDecision = 0;
- int requestAction = 0;
- for (int i = 0; i < 50; i++)
- {
- Assert.AreEqual(numberAgent1Reset, agent1.agentResetCalls);
- // Agent2 is never reset since intialized after academy
- Assert.AreEqual(0, agent2.agentResetCalls);
- Assert.AreEqual(1, agent1.initializeAgentCalls);
- Assert.AreEqual(numberAgent2Initialization, agent2.initializeAgentCalls);
- Assert.AreEqual(i, agent1.agentActionCalls);
- Assert.AreEqual(requestAction, agent2.agentActionCalls);
- Assert.AreEqual((i + 1) / 2, agent1.collectObservationsCalls);
- Assert.AreEqual(requestDecision, agent2.collectObservationsCalls);
- // Agent 1 resets at the first step
- if (i == 0)
- {
- numberAgent1Reset += 1;
- }
- //Agent 2 is only initialized at step 2
- if (i == 2)
- {
- AgentEnableMethod.Invoke(agent2, new object[] { aca });
- numberAgent2Initialization += 1;
- }
-
- // We are testing request decision and request actions when called
- // at different intervals
- if ((i % 3 == 0) && (i > 2))
- {
- //Every 3 steps after agent 2 is initialized, request decision
- requestDecision += 1;
- requestAction += 1;
- agent2.RequestDecision();
- }
- else if ((i % 5 == 0) && (i > 2))
- {
- // Every 5 steps after agent 2 is initialized, request action
- requestAction += 1;
- agent2.RequestAction();
- }
- AcademyStepMethod.Invoke(aca, new object[] { });
- }
- }
- }
-
- public class EditModeTestReset
- {
- [Test]
- public void TestAcademy()
- {
- GameObject acaGO = new GameObject("TestAcademy");
- acaGO.AddComponent<TestAcademy>();
- TestAcademy aca = acaGO.GetComponent<TestAcademy>();
- MethodInfo AcademyInitializeMethod = typeof(Academy).GetMethod(
- "InitializeEnvironment", BindingFlags.Instance | BindingFlags.NonPublic);
- AcademyInitializeMethod.Invoke(aca, new object[] { });
-
- MethodInfo AcademyStepMethod = typeof(Academy).GetMethod(
- "EnvironmentStep", BindingFlags.Instance | BindingFlags.NonPublic);
-
- int numberReset = 0;
- int stepsSinceReset = 0;
- for (int i = 0; i < 50; i++)
- {
-
- Assert.AreEqual(stepsSinceReset, aca.GetStepCount());
- Assert.AreEqual(1, aca.initializeAcademyCalls);
- Assert.AreEqual(numberReset, aca.GetEpisodeCount());
-
- Assert.AreEqual(false, aca.IsDone());
- Assert.AreEqual(numberReset, aca.academyResetCalls);
- Assert.AreEqual(i, aca.AcademyStepCalls);
- // Academy resets at the first step
- if (i == 0)
- {
- numberReset += 1;
- }
-
- stepsSinceReset += 1;
- // Regularly set the academy to done to check behavior
- if (i % 5 == 3)
- {
- aca.Done();
- numberReset += 1;
- stepsSinceReset = 1;
- Assert.AreEqual(true, aca.IsDone());
- }
- AcademyStepMethod.Invoke((object)aca, new object[] { });
-
-
- }
- }
-
- [Test]
- public void TestAgent()
- {
- GameObject agentGO1 = new GameObject("TestAgent");
- agentGO1.AddComponent<TestAgent>();
- TestAgent agent1 = agentGO1.GetComponent<TestAgent>();
- GameObject agentGO2 = new GameObject("TestAgent");
- agentGO2.AddComponent<TestAgent>();
- TestAgent agent2 = agentGO2.GetComponent<TestAgent>();
- GameObject acaGO = new GameObject("TestAcademy");
- acaGO.AddComponent<TestAcademy>();
- TestAcademy aca = acaGO.GetComponent<TestAcademy>();
- TestBrain brain = TestBrain.Instantiate();
-
-
- MethodInfo AgentEnableMethod = typeof(Agent).GetMethod(
- "OnEnableHelper", BindingFlags.Instance | BindingFlags.NonPublic);
- MethodInfo AcademyInitializeMethod = typeof(Academy).GetMethod(
- "InitializeEnvironment", BindingFlags.Instance | BindingFlags.NonPublic);
-
- MethodInfo AcademyStepMethod = typeof(Academy).GetMethod(
- "EnvironmentStep", BindingFlags.Instance | BindingFlags.NonPublic);
-
- agent1.agentParameters = new AgentParameters();
- agent2.agentParameters = new AgentParameters();
- brain.brainParameters = new BrainParameters();
- // We use event based so the agent will now try to send anything to the brain
- agent1.agentParameters.onDemandDecision = false;
- agent1.agentParameters.numberOfActionsBetweenDecisions = 2;
- // agent1 will take an action at every step and request a decision every 2 steps
- agent2.agentParameters.onDemandDecision = true;
- // agent2 will request decisions only when RequestDecision is called
- brain.brainParameters.vectorObservationSize = 0;
- brain.brainParameters.cameraResolutions = new Resolution[0];
- agent1.GiveBrain(brain);
- agent2.GiveBrain(brain);
-
- AgentEnableMethod.Invoke(agent2, new object[] { aca });
- AcademyInitializeMethod.Invoke(aca, new object[] { });
-
- int numberAgent1Reset = 0;
- int numberAgent2Reset = 0;
- int numberAcaReset = 0;
- int acaStepsSinceReset = 0;
- int agent1StepSinceReset = 0;
- int agent2StepSinceReset = 0;
- int requestDecision = 0;
- int requestAction = 0;
- for (int i = 0; i < 5000; i++)
- {
- Assert.AreEqual(acaStepsSinceReset, aca.GetStepCount());
- Assert.AreEqual(1, aca.initializeAcademyCalls);
- Assert.AreEqual(numberAcaReset, aca.GetEpisodeCount());
-
- Assert.AreEqual(false, aca.IsDone());
- Assert.AreEqual(numberAcaReset, aca.academyResetCalls);
- Assert.AreEqual(i, aca.AcademyStepCalls);
-
- Assert.AreEqual(agent2StepSinceReset, agent2.GetStepCount());
- Assert.AreEqual(numberAgent1Reset, agent1.agentResetCalls);
- Assert.AreEqual(numberAgent2Reset, agent2.agentResetCalls);
-
- // Agent 2 and academy reset at the first step
- if (i == 0)
- {
- numberAcaReset += 1;
- numberAgent2Reset += 1;
- }
- //Agent 1 is only initialized at step 2
- if (i == 2)
- {
- AgentEnableMethod.Invoke(agent1, new object[] { aca });
-
- }
- // Reset Academy every 100 steps
- if (i % 100 == 3)
- {
- aca.Done();
- numberAcaReset += 1;
- acaStepsSinceReset = 0;
- }
- // Set agent 1 to done every 11 steps to test behavior
- if (i % 11 == 5)
- {
- agent1.Done();
- }
- // Reseting agent 2 regularly
- if (i % 13 == 3)
- {
- if (!(agent2.IsDone() || aca.IsDone()))
- {
- // If the agent was already reset before the request decision
- // We should not reset again
- agent2.Done();
- numberAgent2Reset += 1;
- agent2StepSinceReset = 0;
- }
- }
- // Request a decision for agent 2 regularly
- if (i % 3 == 2)
- {
- requestDecision += 1;
- requestAction += 1;
- agent2.RequestDecision();
- }
- else if (i % 5 == 1)
- {
- // Request an action without decision regularly
- requestAction += 1;
- agent2.RequestAction();
- }
- if (agent1.IsDone() && (((acaStepsSinceReset) % agent1.agentParameters.numberOfActionsBetweenDecisions == 0)) || aca.IsDone())
- {
- numberAgent1Reset += 1;
- agent1StepSinceReset = 0;
- }
- if (aca.IsDone())
- {
- numberAgent2Reset += 1;
- agent2StepSinceReset = 0;
- }
-
- acaStepsSinceReset += 1;
- agent1StepSinceReset += 1;
- agent2StepSinceReset += 1;
- //Agent 1 is only initialized at step 2
- if (i < 2)
- {
- agent1StepSinceReset = 0;
- }
- AcademyStepMethod.Invoke((object)aca, new object[] { });
-
-
- }
- }
- }
-
- public class EditModeTestMaxStep
- {
- [Test]
- public void TestAcademy()
- {
- GameObject acaGO = new GameObject("TestAcademy");
- acaGO.AddComponent<TestAcademy>();
- TestAcademy aca = acaGO.GetComponent<TestAcademy>();
- MethodInfo AcademyInitializeMethod = typeof(Academy).GetMethod(
- "InitializeEnvironment", BindingFlags.Instance | BindingFlags.NonPublic);
- AcademyInitializeMethod.Invoke(aca, new object[] { });
-
- MethodInfo AcademyStepMethod = typeof(Academy).GetMethod(
- "EnvironmentStep", BindingFlags.Instance | BindingFlags.NonPublic);
-
- FieldInfo maxStep = typeof(Academy).GetField(
- "maxSteps", BindingFlags.Instance | BindingFlags.NonPublic);
- maxStep.SetValue((object)aca, 20);
-
- int numberReset = 0;
- int stepsSinceReset = 0;
- for (int i = 0; i < 50; i++)
- {
- Assert.AreEqual(stepsSinceReset, aca.GetStepCount());
- Assert.AreEqual(1, aca.initializeAcademyCalls);
- Assert.AreEqual(false, aca.IsDone());
-
- Assert.AreEqual(i, aca.AcademyStepCalls);
- Assert.AreEqual(numberReset, aca.GetEpisodeCount());
- Assert.AreEqual(numberReset, aca.academyResetCalls);
- stepsSinceReset += 1;
- // Make sure max step is reached every 20 steps
- if (i % 20 == 0)
- {
- numberReset += 1;
- stepsSinceReset = 1;
-
- }
- AcademyStepMethod.Invoke((object)aca, new object[] { });
- }
- }
-
- [Test]
- public void TestAgent()
- {
- GameObject agentGO1 = new GameObject("TestAgent");
- agentGO1.AddComponent<TestAgent>();
- TestAgent agent1 = agentGO1.GetComponent<TestAgent>();
- GameObject agentGO2 = new GameObject("TestAgent");
- agentGO2.AddComponent<TestAgent>();
- TestAgent agent2 = agentGO2.GetComponent<TestAgent>();
- GameObject acaGO = new GameObject("TestAcademy");
- acaGO.AddComponent<TestAcademy>();
- TestAcademy aca = acaGO.GetComponent<TestAcademy>();
- TestBrain brain = TestBrain.Instantiate();
-
-
- MethodInfo AgentEnableMethod = typeof(Agent).GetMethod(
- "OnEnableHelper", BindingFlags.Instance | BindingFlags.NonPublic);
- MethodInfo AcademyInitializeMethod = typeof(Academy).GetMethod(
- "InitializeEnvironment", BindingFlags.Instance | BindingFlags.NonPublic);
-
- MethodInfo AcademyStepMethod = typeof(Academy).GetMethod(
- "EnvironmentStep", BindingFlags.Instance | BindingFlags.NonPublic);
-
- FieldInfo maxStep = typeof(Academy).GetField(
- "maxSteps", BindingFlags.Instance | BindingFlags.NonPublic);
- maxStep.SetValue((object)aca, 100);
-
- agent1.agentParameters = new AgentParameters();
- agent2.agentParameters = new AgentParameters();
- brain.brainParameters = new BrainParameters();
- // We use event based so the agent will now try to send anything to the brain
- agent1.agentParameters.onDemandDecision = false;
- agent1.agentParameters.numberOfActionsBetweenDecisions = 1;
- // agent1 will take an action at every step and request a decision every 2 steps
- agent2.agentParameters.onDemandDecision = true;
- // agent2 will request decisions only when RequestDecision is called
- agent1.agentParameters.maxStep = 20;
- agent2.agentParameters.maxStep = 30;
- brain.brainParameters.vectorObservationSize = 0;
- brain.brainParameters.cameraResolutions = new Resolution[0];
- agent1.GiveBrain(brain);
- agent2.GiveBrain(brain);
-
- AgentEnableMethod.Invoke(agent2, new object[] { aca });
- AcademyInitializeMethod.Invoke(aca, new object[] { });
-
-
- int numberAgent1Reset = 0;
- int numberAgent2Reset = 0;
- int numberAcaReset = 0;
- int acaStepsSinceReset = 0;
- int agent1StepSinceReset = 0;
- int agent2StepSinceReset = 0;
-
- for (int i = 0; i < 500; i++)
- {
- Assert.AreEqual(acaStepsSinceReset, aca.GetStepCount());
- Assert.AreEqual(1, aca.initializeAcademyCalls);
-
- Assert.AreEqual(i, aca.AcademyStepCalls);
-
- Assert.AreEqual(agent1StepSinceReset, agent1.GetStepCount());
- Assert.AreEqual(agent2StepSinceReset, agent2.GetStepCount());
-
-
- Assert.AreEqual(numberAcaReset, aca.GetEpisodeCount());
- Assert.AreEqual(numberAcaReset, aca.academyResetCalls);
- Assert.AreEqual(numberAgent1Reset, agent1.agentResetCalls);
- Assert.AreEqual(numberAgent2Reset, agent2.agentResetCalls);
-
- //At the first step, Academy and agent 2 reset
- if (i == 0)
- {
- numberAcaReset += 1;
- numberAgent2Reset += 1;
- }
- //Agent 1 is only initialized at step 2
- if (i == 2)
- {
- AgentEnableMethod.Invoke(agent1, new object[] { aca });
- }
-
- // we request a decision at each step
- agent2.RequestDecision();
-
- if (i > 3)
- {
- // Make sure the academy max steps at 100
- if (i % 100 == 0)
- {
- acaStepsSinceReset = 0;
- agent1StepSinceReset = 0;
- agent2StepSinceReset = 0;
- numberAcaReset += 1;
- numberAgent1Reset += 1;
- numberAgent2Reset += 1;
- }
- else
- {
- //Make sure the agents reset when their max steps is reached
- if (agent1StepSinceReset % 21 == 0)
- {
- agent1StepSinceReset = 0;
- numberAgent1Reset += 1;
- }
- if (agent2StepSinceReset % 31 == 0)
- {
- agent2StepSinceReset = 0;
- numberAgent2Reset += 1;
- }
- }
- }
-
- acaStepsSinceReset += 1;
- agent1StepSinceReset += 1;
- agent2StepSinceReset += 1;
-
- //Agent 1 is only initialized at step 2
- if (i < 2)
- {
- agent1StepSinceReset = 0;
- }
-
- AcademyStepMethod.Invoke((object)aca, new object[] { });
-
- }
-
- }
- }
-
- public class EditModeTestMiscellaneous
- {
- [Test]
- public void TestResetOnDone()
- {
- GameObject agentGO1 = new GameObject("TestAgent");
- agentGO1.AddComponent<TestAgent>();
- TestAgent agent1 = agentGO1.GetComponent<TestAgent>();
- GameObject agentGO2 = new GameObject("TestAgent");
- agentGO2.AddComponent<TestAgent>();
- TestAgent agent2 = agentGO2.GetComponent<TestAgent>();
- GameObject acaGO = new GameObject("TestAcademy");
- acaGO.AddComponent<TestAcademy>();
- TestAcademy aca = acaGO.GetComponent<TestAcademy>();
- TestBrain brain = TestBrain.Instantiate();
-
-
- MethodInfo AgentEnableMethod = typeof(Agent).GetMethod(
- "OnEnableHelper", BindingFlags.Instance | BindingFlags.NonPublic);
- MethodInfo AcademyInitializeMethod = typeof(Academy).GetMethod(
- "InitializeEnvironment", BindingFlags.Instance | BindingFlags.NonPublic);
-
- MethodInfo AcademyStepMethod = typeof(Academy).GetMethod(
- "EnvironmentStep", BindingFlags.Instance | BindingFlags.NonPublic);
-
- agent1.agentParameters = new AgentParameters();
- agent2.agentParameters = new AgentParameters();
- brain.brainParameters = new BrainParameters();
- // We use event based so the agent will now try to send anything to the brain
- agent1.agentParameters.onDemandDecision = false;
- // agent1 will take an action at every step and request a decision every steps
- agent1.agentParameters.numberOfActionsBetweenDecisions = 1;
- // agent2 will request decisions only when RequestDecision is called
- agent2.agentParameters.onDemandDecision = true;
- agent1.agentParameters.maxStep = 20;
- //Here we specify that the agent does not reset when done
- agent1.agentParameters.resetOnDone = false;
- agent2.agentParameters.resetOnDone = false;
- brain.brainParameters.vectorObservationSize = 0;
- brain.brainParameters.cameraResolutions = new Resolution[0];
- agent1.GiveBrain(brain);
- agent2.GiveBrain(brain);
-
- AgentEnableMethod.Invoke(agent2, new object[] { aca });
- AcademyInitializeMethod.Invoke(aca, new object[] { });
- AgentEnableMethod.Invoke(agent1, new object[] { aca });
-
- int agent1ResetOnDone = 0;
- int agent2ResetOnDone = 0;
- int acaStepsSinceReset = 0;
- int agent1StepSinceReset = 0;
- int agent2StepSinceReset = 0;
-
- for (int i = 0; i < 50; i++)
- {
- Assert.AreEqual(i, aca.AcademyStepCalls);
-
- Assert.AreEqual(agent1StepSinceReset, agent1.GetStepCount());
- Assert.AreEqual(agent2StepSinceReset, agent2.GetStepCount());
- Assert.AreEqual(agent1ResetOnDone, agent1.agentOnDoneCalls);
- Assert.AreEqual(agent2ResetOnDone, agent2.agentOnDoneCalls);
-
- // we request a decision at each step
- agent2.RequestDecision();
- acaStepsSinceReset += 1;
- if (agent1ResetOnDone == 0)
- agent1StepSinceReset += 1;
- if (agent2ResetOnDone == 0)
- agent2StepSinceReset += 1;
-
- if ((i > 2) && (i % 21 == 0))
- {
- agent1ResetOnDone = 1;
- }
-
- if (i == 31)
- {
- agent2ResetOnDone = 1;
- agent2.Done();
- }
-
-
- AcademyStepMethod.Invoke((object)aca, new object[] { });
- }
-
- }
-
- [Test]
- public void TestCumulativeReward()
- {
- GameObject agentGO1 = new GameObject("TestAgent");
- agentGO1.AddComponent<TestAgent>();
- TestAgent agent1 = agentGO1.GetComponent<TestAgent>();
- GameObject agentGO2 = new GameObject("TestAgent");
- agentGO2.AddComponent<TestAgent>();
- TestAgent agent2 = agentGO2.GetComponent<TestAgent>();
- GameObject acaGO = new GameObject("TestAcademy");
- acaGO.AddComponent<TestAcademy>();
- TestAcademy aca = acaGO.GetComponent<TestAcademy>();
- TestBrain brain = TestBrain.Instantiate();
-
-
- MethodInfo AgentEnableMethod = typeof(Agent).GetMethod(
- "OnEnableHelper", BindingFlags.Instance | BindingFlags.NonPublic);
- MethodInfo AcademyInitializeMethod = typeof(Academy).GetMethod(
- "InitializeEnvironment", BindingFlags.Instance | BindingFlags.NonPublic);
-
- MethodInfo AcademyStepMethod = typeof(Academy).GetMethod(
- "EnvironmentStep", BindingFlags.Instance | BindingFlags.NonPublic);
-
- agent1.agentParameters = new AgentParameters();
- agent2.agentParameters = new AgentParameters();
- brain.brainParameters = new BrainParameters();
- // We use event based so the agent will now try to send anything to the brain
- agent1.agentParameters.onDemandDecision = false;
- agent1.agentParameters.numberOfActionsBetweenDecisions = 3;
- // agent1 will take an action at every step and request a decision every 2 steps
- agent2.agentParameters.onDemandDecision = true;
- // agent2 will request decisions only when RequestDecision is called
- agent1.agentParameters.maxStep = 20;
- brain.brainParameters.vectorObservationSize = 0;
- brain.brainParameters.cameraResolutions = new Resolution[0];
- agent1.GiveBrain(brain);
- agent2.GiveBrain(brain);
-
- AgentEnableMethod.Invoke(agent2, new object[] { aca });
- AcademyInitializeMethod.Invoke(aca, new object[] { });
- AgentEnableMethod.Invoke(agent1, new object[] { aca });
-
-
- int j = 0;
- for (int i = 0; i < 500; i++)
- {
- agent2.RequestAction();
- Assert.LessOrEqual(Mathf.Abs(j * 0.1f + j * 10f - agent1.GetCumulativeReward()), 0.05f);
- Assert.LessOrEqual(Mathf.Abs(i * 0.1f - agent2.GetCumulativeReward()), 0.05f);
-
-
- AcademyStepMethod.Invoke((object)aca, new object[] { });
- agent1.AddReward(10f);
-
- if ((i % 21 == 0) && (i > 0))
- {
- j = 0;
- }
- j++;
- }
- }
- }
-
- }
|