partial work for #63

author: Luong Hoang <lhoang@live.com> 2014-10-17 01:16:39 +0400
committer: Luong Hoang <lhoang@live.com> 2014-10-17 01:16:39 +0400
commit: c1a759d4e35d1f07bcd4549b60030ddea2d4ed3b (patch)
tree: c9f463618831a53af12ac56398fa694c58b5acad /cs_test
parent: 689666754894b1c011f163801cb083182156f125 (diff)
2 files changed, 219 insertions, 211 deletions
diff --git a/cs_test/ExploreSample.cs b/cs_test/ExploreSample.cs
index a2f05947..b0f3f7e8 100644
--- a/cs_test/ExploreSample.cs
+++ b/cs_test/ExploreSample.cs
@@ -1,214 +1,222 @@
-using System;
-using System.Collections.Generic;
-using System.Linq;
-using System.Text;
-using MultiWorldTesting;
-
-namespace cs_test
-{
-    class ExploreSample
-    {
-        private static UInt32 SampleStatefulPolicyFunc(int parameters, CONTEXT context)
-        {
-            return (uint)((parameters + context.Features.Length) % 10 + 1);
-        }
-
-        private static UInt32 SampleStatefulPolicyFunc2(int parameters, CONTEXT context)
-        {
-            return (uint)((parameters + context.Features.Length) % 10 + 2);
-        }
-
-        private static UInt32 SampleStatefulPolicyFunc(CustomParams parameters, CONTEXT context)
-        {
-            return (uint)((parameters.Value1 + parameters.Value2 + context.Features.Length) % 10 + 1);
-        }
-
-        private static UInt32 SampleStatelessPolicyFunc(CONTEXT applicationContext)
-        {
-            return (UInt32)applicationContext.Features.Length;
-        }
-
-        private static UInt32 SampleStatelessPolicyFunc2(CONTEXT applicationContext)
-        {
-            return (UInt32)applicationContext.Features.Length + 1;
-        }
-
-        private static void SampleStatefulScorerFunc(int parameters, CONTEXT applicationContext, float[] scores)
-        {
-            for (uint i = 0; i < scores.Length; i++)
-            {
-                scores[i] = (int)parameters + i;
-            }
-        }
-
-        private static void SampleStatelessScorerFunc(CONTEXT applicationContext, float[] scores)
-        {
-            for (uint i = 0; i < scores.Length; i++)
-            {
-                scores[i] = applicationContext.Features.Length + i;
-            }
-        }
-
-        class CustomParams
-        {
-            public int Value1;
-            public int Value2;
-        }
-
-        public static void Run()
-        {
-            MwtExplorer mwt = new MwtExplorer();
-
-            uint numActions = 10;
-            
-            float epsilon = 0.2f;
-            uint tau = 0;
-            uint bags = 2;
-            float lambda = 0.5f;
-
-            int policyParams = 1003;
-            CustomParams customParams = new CustomParams() { Value1 = policyParams, Value2 = policyParams + 1 };
-
-            /*** Initialize Epsilon-Greedy explore algorithm using a default policy function that accepts parameters ***/
-            //mwt.InitializeEpsilonGreedy<int>(epsilon, new StatefulPolicyDelegate<int>(SampleStatefulPolicyFunc), policyParams, numActions);
-
-            /*** Initialize Epsilon-Greedy explore algorithm using a stateless default policy function ***/
-            //mwt.InitializeEpsilonGreedy(epsilon, new StatelessPolicyDelegate(SampleStatelessPolicyFunc), numActions);
-
-            /*** Initialize Tau-First explore algorithm using a default policy function that accepts parameters ***/
-            //mwt.InitializeTauFirst<CustomParams>(tau, new StatefulPolicyDelegate<CustomParams>(SampleStatefulPolicyFunc), customParams, numActions);
-
-            /*** Initialize Tau-First explore algorithm using a stateless default policy function ***/
-            //mwt.InitializeTauFirst(tau, new StatelessPolicyDelegate(SampleStatelessPolicyFunc), numActions);
-
-            /*** Initialize Bagging explore algorithm using a default policy function that accepts parameters ***/
-            //StatefulPolicyDelegate<int>[] funcs = 
-            //{
-            //    new StatefulPolicyDelegate<int>(SampleStatefulPolicyFunc), 
-            //    new StatefulPolicyDelegate<int>(SampleStatefulPolicyFunc2) 
-            //};
-            //int[] parameters = { policyParams, policyParams };
-            //mwt.InitializeBagging<int>(bags, funcs, parameters, numActions);
-
-            /*** Initialize Bagging explore algorithm using a stateless default policy function ***/
-            //StatelessPolicyDelegate[] funcs = 
-            //{
-            //    new StatelessPolicyDelegate(SampleStatelessPolicyFunc), 
-            //    new StatelessPolicyDelegate(SampleStatelessPolicyFunc2) 
-            //};
-            //mwt.InitializeBagging(bags, funcs, numActions);
-
-            /*** Initialize Softmax explore algorithm using a default policy function that accepts parameters ***/
-            //mwt.InitializeSoftmax<int>(lambda, new StatefulScorerDelegate<int>(SampleStatefulScorerFunc), policyParams, numActions);
-
-            /*** Initialize Softmax explore algorithm using a stateless default policy function ***/
-            mwt.InitializeSoftmax(lambda, new StatelessScorerDelegate(SampleStatelessScorerFunc), numActions);
-
-            FEATURE[] f = new FEATURE[2];
-            f[0].X = 0.5f;
-            f[0].WeightIndex = 1;
-            f[1].X = 0.9f;
-            f[1].WeightIndex = 2;
-
-            string otherContext = "Some other context data that might be helpful to log";
-            CONTEXT context = new CONTEXT(f, otherContext);
-
-            UInt32 chosenAction = mwt.ChooseAction(context, "myId");
-
-            INTERACTION[] interactions = mwt.GetAllInteractions();
-
-            mwt.Unintialize();
-
-            MwtRewardReporter mrr = new MwtRewardReporter(interactions);
-
-            string joinKey = "myId";
-            float reward = 0.5f;
-            if (!mrr.ReportReward(joinKey, reward))
-            {
-                throw new Exception();
-            }
-
-            MwtOptimizer mot = new MwtOptimizer(interactions, numActions);
-            
-            float eval1 = mot.EvaluatePolicy(new StatefulPolicyDelegate<int>(SampleStatefulPolicyFunc), policyParams);
-
-            mot.OptimizePolicyVWCSOAA("model_file");
-            float eval2 = mot.EvaluatePolicyVWCSOAA("model_file");
-
-            Console.WriteLine(chosenAction);
-            Console.WriteLine(interactions);
-        }
-
-        public static void Clock()
-        {
-            float epsilon = .2f;
-            int policyParams = 1003;
-            string uniqueKey = "clock";
-            int numFeatures = 1000;
-            int numIter = 1000;
-            int numWarmup = 100;
-            int numInteractions = 1;
-            uint numActions = 10;
-            string otherContext = null;
-            
-            double timeInit = 0, timeChoose = 0, timeSerializedLog = 0, timeTypedLog = 0;
-
-            System.Diagnostics.Stopwatch watch = new System.Diagnostics.Stopwatch();
-            for (int iter = 0; iter < numIter + numWarmup; iter++)
-            {
-                watch.Restart();
-                
-                MwtExplorer mwt = new MwtExplorer();
-                mwt.InitializeEpsilonGreedy<int>(epsilon, new StatefulPolicyDelegate<int>(SampleStatefulPolicyFunc), policyParams, numActions);
-
-                timeInit += (iter < numWarmup) ? 0 : watch.Elapsed.TotalMilliseconds;
-
-                FEATURE[] f = new FEATURE[numFeatures];
-                for (int i = 0; i < numFeatures; i++)
-                {
-                    f[i].WeightIndex = (uint)i + 1;
-                    f[i].X = 0.5f;
-                }
-                
-                watch.Restart();
-
-                CONTEXT context = new CONTEXT(f, otherContext);
-
-                for (int i = 0; i < numInteractions; i++)
-                {
-                    mwt.ChooseAction(context, uniqueKey);
-                }
-
-                timeChoose += (iter < numWarmup) ? 0 : watch.Elapsed.TotalMilliseconds;
-
-                watch.Restart();
-
-                string interactions = mwt.GetAllInteractionsAsString();
-
-                timeSerializedLog += (iter < numWarmup) ? 0 : watch.Elapsed.TotalMilliseconds;
-
-                for (int i = 0; i < numInteractions; i++)
-                {
-                    mwt.ChooseAction(context, uniqueKey);
-                }
-
-                watch.Restart();
-
-                mwt.GetAllInteractions();
-
-                timeTypedLog += (iter < numWarmup) ? 0 : watch.Elapsed.TotalMilliseconds;
-            }
-            Console.WriteLine("--- PER ITERATION ---");
-            Console.WriteLine("# iterations: {0}, # interactions: {1}, # context features {2}", numIter, numInteractions, numFeatures);
-            Console.WriteLine("Init: {0} micro", timeInit * 1000 / numIter);
-            Console.WriteLine("Choose Action: {0} micro", timeChoose * 1000 / (numIter * numInteractions));
-            Console.WriteLine("Get Serialized Log: {0} micro", timeSerializedLog * 1000 / numIter);
-            Console.WriteLine("Get Typed Log: {0} micro", timeTypedLog * 1000 / numIter);
-            Console.WriteLine("--- TOTAL TIME: {0} micro", (timeInit + timeChoose + timeSerializedLog + timeTypedLog) * 1000);
+using System;
+using System.Collections.Generic;
+using System.Linq;
+using System.Text;
+using MultiWorldTesting;
+
+namespace cs_test
+{
+    class ExploreSample
+    {
+        private static UInt32 SampleStatefulPolicyFunc(int parameters, CONTEXT context)
+        {
+            return (uint)((parameters + context.Features.Length) % 10 + 1);
+        }
+
+        private static UInt32 SampleStatefulPolicyFunc2(int parameters, CONTEXT context)
+        {
+            return (uint)((parameters + context.Features.Length) % 10 + 2);
+        }
+
+        private static UInt32 SampleStatefulPolicyFunc(CustomParams parameters, CONTEXT context)
+        {
+            return (uint)((parameters.Value1 + parameters.Value2 + context.Features.Length) % 10 + 1);
+        }
+
+        private static UInt32 SampleStatelessPolicyFunc(CONTEXT applicationContext)
+        {
+            return (UInt32)applicationContext.Features.Length;
+        }
+
+        private static UInt32 SampleStatelessPolicyFunc2(CONTEXT applicationContext)
+        {
+            return (UInt32)applicationContext.Features.Length + 1;
+        }
+
+        private static void SampleStatefulScorerFunc(int parameters, CONTEXT applicationContext, float[] scores)
+        {
+            for (uint i = 0; i < scores.Length; i++)
+            {
+                scores[i] = (int)parameters + i;
+            }
+        }
+
+        private static void SampleStatelessScorerFunc(CONTEXT applicationContext, float[] scores)
+        {
+            for (uint i = 0; i < scores.Length; i++)
+            {
+                scores[i] = applicationContext.Features.Length + i;
+            }
+        }
+
+        class CustomParams
+        {
+            public int Value1;
+            public int Value2;
+        }
+
+        public static void Run()
+        {
+            MwtExplorer mwt = new MwtExplorer();
+
+            uint numActions = 10;
+            
+            float epsilon = 0.2f;
+            uint tau = 0;
+            uint bags = 2;
+            float lambda = 0.5f;
+
+            int policyParams = 1003;
+            CustomParams customParams = new CustomParams() { Value1 = policyParams, Value2 = policyParams + 1 };
+
+            /*** Initialize Epsilon-Greedy explore algorithm using a default policy function that accepts parameters ***/
+            mwt.InitializeEpsilonGreedy<int>(epsilon, new StatefulPolicyDelegate<int>(SampleStatefulPolicyFunc), policyParams, numActions);
+
+            /*** Initialize Epsilon-Greedy explore algorithm using a stateless default policy function ***/
+            //mwt.InitializeEpsilonGreedy(epsilon, new StatelessPolicyDelegate(SampleStatelessPolicyFunc), numActions);
+
+            /*** Initialize Tau-First explore algorithm using a default policy function that accepts parameters ***/
+            //mwt.InitializeTauFirst<CustomParams>(tau, new StatefulPolicyDelegate<CustomParams>(SampleStatefulPolicyFunc), customParams, numActions);
+
+            /*** Initialize Tau-First explore algorithm using a stateless default policy function ***/
+            //mwt.InitializeTauFirst(tau, new StatelessPolicyDelegate(SampleStatelessPolicyFunc), numActions);
+
+            /*** Initialize Bagging explore algorithm using a default policy function that accepts parameters ***/
+            //StatefulPolicyDelegate<int>[] funcs = 
+            //{
+            //    new StatefulPolicyDelegate<int>(SampleStatefulPolicyFunc), 
+            //    new StatefulPolicyDelegate<int>(SampleStatefulPolicyFunc2) 
+            //};
+            //int[] parameters = { policyParams, policyParams };
+            //mwt.InitializeBagging<int>(bags, funcs, parameters, numActions);
+
+            /*** Initialize Bagging explore algorithm using a stateless default policy function ***/
+            //StatelessPolicyDelegate[] funcs = 
+            //{
+            //    new StatelessPolicyDelegate(SampleStatelessPolicyFunc), 
+            //    new StatelessPolicyDelegate(SampleStatelessPolicyFunc2) 
+            //};
+            //mwt.InitializeBagging(bags, funcs, numActions);
+
+            /*** Initialize Softmax explore algorithm using a default policy function that accepts parameters ***/
+            //mwt.InitializeSoftmax<int>(lambda, new StatefulScorerDelegate<int>(SampleStatefulScorerFunc), policyParams, numActions);
+
+            /*** Initialize Softmax explore algorithm using a stateless default policy function ***/
+            //mwt.InitializeSoftmax(lambda, new StatelessScorerDelegate(SampleStatelessScorerFunc), numActions);
+
+            FEATURE[] f = new FEATURE[2];
+            f[0].X = 0.5f;
+            f[0].WeightIndex = 1;
+            f[1].X = 0.9f;
+            f[1].WeightIndex = 2;
+
+            string otherContext = "Some other context data that might be helpful to log";
+            CONTEXT context = new CONTEXT(f, otherContext);
+
+            UInt32 chosenAction = mwt.ChooseAction(context, "myId");
+
+            INTERACTION[] interactions = mwt.GetAllInteractions();
+
+            mwt.Unintialize();
+
+            MwtRewardReporter mrr = new MwtRewardReporter(interactions);
+
+            string joinKey = "myId";
+            float reward = 0.5f;
+            if (!mrr.ReportReward(joinKey, reward))
+            {
+                throw new Exception();
+            }
+
+            MwtOptimizer mot = new MwtOptimizer(interactions, numActions);
+            
+            float eval1 = mot.EvaluatePolicy(new StatefulPolicyDelegate<int>(SampleStatefulPolicyFunc), policyParams);
+
+            mot.OptimizePolicyVWCSOAA("model_file");
+            float eval2 = mot.EvaluatePolicyVWCSOAA("model_file");
+
+            Console.WriteLine(chosenAction);
+            Console.WriteLine(interactions);
+
+            string file = "serialized.txt";
+            MwtLogger logger = new MwtLogger(file);
+            logger.Initialize(interactions);
+            logger.Flush();
+
+            logger = new MwtLogger(file);
+            INTERACTION[] inters = logger.GetAllInteractions();
+        }
+
+        public static void Clock()
+        {
+            float epsilon = .2f;
+            int policyParams = 1003;
+            string uniqueKey = "clock";
+            int numFeatures = 1000;
+            int numIter = 1000;
+            int numWarmup = 100;
+            int numInteractions = 1;
+            uint numActions = 10;
+            string otherContext = null;
+            
+            double timeInit = 0, timeChoose = 0, timeSerializedLog = 0, timeTypedLog = 0;
+
+            System.Diagnostics.Stopwatch watch = new System.Diagnostics.Stopwatch();
+            for (int iter = 0; iter < numIter + numWarmup; iter++)
+            {
+                watch.Restart();
+                
+                MwtExplorer mwt = new MwtExplorer();
+                mwt.InitializeEpsilonGreedy<int>(epsilon, new StatefulPolicyDelegate<int>(SampleStatefulPolicyFunc), policyParams, numActions);
+
+                timeInit += (iter < numWarmup) ? 0 : watch.Elapsed.TotalMilliseconds;
+
+                FEATURE[] f = new FEATURE[numFeatures];
+                for (int i = 0; i < numFeatures; i++)
+                {
+                    f[i].WeightIndex = (uint)i + 1;
+                    f[i].X = 0.5f;
+                }
+                
+                watch.Restart();
+
+                CONTEXT context = new CONTEXT(f, otherContext);
+
+                for (int i = 0; i < numInteractions; i++)
+                {
+                    mwt.ChooseAction(context, uniqueKey);
+                }
+
+                timeChoose += (iter < numWarmup) ? 0 : watch.Elapsed.TotalMilliseconds;
+
+                watch.Restart();
+
+                string interactions = mwt.GetAllInteractionsAsString();
+
+                timeSerializedLog += (iter < numWarmup) ? 0 : watch.Elapsed.TotalMilliseconds;
+
+                for (int i = 0; i < numInteractions; i++)
+                {
+                    mwt.ChooseAction(context, uniqueKey);
+                }
+
+                watch.Restart();
+
+                mwt.GetAllInteractions();
+
+                timeTypedLog += (iter < numWarmup) ? 0 : watch.Elapsed.TotalMilliseconds;
+            }
+            Console.WriteLine("--- PER ITERATION ---");
+            Console.WriteLine("# iterations: {0}, # interactions: {1}, # context features {2}", numIter, numInteractions, numFeatures);
+            Console.WriteLine("Init: {0} micro", timeInit * 1000 / numIter);
+            Console.WriteLine("Choose Action: {0} micro", timeChoose * 1000 / (numIter * numInteractions));
+            Console.WriteLine("Get Serialized Log: {0} micro", timeSerializedLog * 1000 / numIter);
+            Console.WriteLine("Get Typed Log: {0} micro", timeTypedLog * 1000 / numIter);
+            Console.WriteLine("--- TOTAL TIME: {0} micro", (timeInit + timeChoose + timeSerializedLog + timeTypedLog) * 1000);
         }
 
         /************************ LAB CODE ************************/
 
-		
-    }
-}
+		
+    }
+}
diff --git a/cs_test/LabDemo.cs b/cs_test/LabDemo.cs
index b2956fda..02daf1d4 100755
--- a/cs_test/LabDemo.cs
+++ b/cs_test/LabDemo.cs
@@ -3,7 +3,7 @@ using System.Collections.Generic;
 using System.Linq;
 using System.Text;
 using System.IO;
-using MultiWorldTesting;
+using MultiWorldTesting;
 
 
 public class LabDemo
author	Luong Hoang <lhoang@live.com>	2014-10-17 01:16:39 +0400
committer	Luong Hoang <lhoang@live.com>	2014-10-17 01:16:39 +0400
commit	c1a759d4e35d1f07bcd4549b60030ddea2d4ed3b (patch)
tree	c9f463618831a53af12ac56398fa694c58b5acad /cs_test
parent	689666754894b1c011f163801cb083182156f125 (diff)