/
MainWindow.xaml.cs
75 lines (64 loc) · 2.16 KB
/
MainWindow.xaml.cs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
using System;
using System.Collections.Generic;
using System.Windows;
using MachineLearningQLearning.Logic;
namespace MachineLearningQLearning
{
/// <summary>
/// Interaction logic for MainWindow.xaml.
/// Wires the window's buttons and text boxes to a <see cref="StateActionTableManager"/>:
/// building the example table, running training steps, applying the goal state and
/// discount rate, and displaying the best route from a start state.
/// </summary>
public partial class MainWindow : Window
{
    /// <summary>
    /// Divisor applied to the number typed into the gamma text box before it is
    /// handed to the manager as the discount rate (e.g. an input of 8 becomes 0.8).
    /// </summary>
    private const double GammaInputDivisor = 10;

    /// <summary>Manager that owns the state/action table and performs the training.</summary>
    private readonly StateActionTableManager _manager;

    /// <summary>Most recent list representation returned by the manager, bound to <c>lst</c>.</summary>
    private List<List<string>> _qList;

    /// <summary>
    /// Creates the window, instantiates the manager and fills the grids with the example table.
    /// </summary>
    public MainWindow()
    {
        InitializeComponent();
        _manager = new StateActionTableManager();
        InitTestTable();
    }

    /// <summary>
    /// Gets or sets a state/action table associated with this window.
    /// The window itself does not read or write it anywhere in this class.
    /// </summary>
    public StateActionTable StateRewardTable { get; set; }

    /// <summary>
    /// Binds the example table to <c>StateGrid</c>, lets the manager build its
    /// state/action matrix and Q matrix, and binds the converted Q matrix to <c>lst</c>.
    /// </summary>
    private void InitTestTable()
    {
        StateGrid.ItemsSource = _manager.CreateRoomExampleTable();
        _manager.CreateStateActionMatrix();
        _manager.InitQMatrix();
        _qList = _manager.ConvertQMatrixToList();
        lst.ItemsSource = _qList;
    }

    /// <summary>
    /// Runs a single training step and shows the resulting list.
    /// </summary>
    /// <param name="sender">The button that raised the event.</param>
    /// <param name="e">Event data (unused).</param>
    private void Button_Click_1(object sender, RoutedEventArgs e)
    {
        _qList = _manager.PerformTrainStep();
        // Rebind so the result of the step becomes visible, matching the multi-step handler.
        lst.ItemsSource = _qList;
    }

    /// <summary>
    /// Runs as many training steps as entered in <c>cycleTB</c>, then shows the final
    /// list and the number of cycles performed.
    /// </summary>
    /// <param name="sender">The button that raised the event.</param>
    /// <param name="e">Event data (unused).</param>
    private void Button_Click_2(object sender, RoutedEventArgs e)
    {
        int cycles;
        if (!int.TryParse(cycleTB.Text, out cycles) || cycles < 0)
        {
            MessageBox.Show("Please enter a non-negative whole number of cycles.");
            return;
        }

        if (cycles == 0)
        {
            // Nothing to train; leave the current display untouched.
            return;
        }

        for (int i = 0; i < cycles; i++)
        {
            _qList = _manager.PerformTrainStep();
        }

        // The handler runs synchronously on the UI thread, so intermediate values
        // could never be rendered; updating once after the loop shows the same end state.
        lst.ItemsSource = _qList;
        currentCycleLabel.Content = cycles.ToString();
    }

    /// <summary>
    /// Applies the goal state from <c>goalTB</c> and the discount rate from <c>gammaTB</c>
    /// (divided by <see cref="GammaInputDivisor"/>) to the manager.
    /// </summary>
    /// <param name="sender">The button that raised the event.</param>
    /// <param name="e">Event data (unused).</param>
    private void initB_Click(object sender, RoutedEventArgs e)
    {
        // Validate before touching the manager so a bad gamma does not leave it half-updated.
        double gammaInput;
        if (!double.TryParse(gammaTB.Text, out gammaInput)
            || double.IsNaN(gammaInput)
            || double.IsInfinity(gammaInput))
        {
            MessageBox.Show("Please enter a valid number for gamma.");
            return;
        }

        _manager.GoalState = goalTB.Text;
        _manager.DiscountRate = gammaInput / GammaInputDivisor;
    }

    /// <summary>
    /// Asks the manager for the best route starting at the state entered in
    /// <c>StartStateTB</c> and shows it in <c>RouteLabel</c> as a dash-separated
    /// sequence beginning with the start state.
    /// </summary>
    /// <param name="sender">The button that raised the event.</param>
    /// <param name="e">Event data (unused).</param>
    private void Button_Click_3(object sender, RoutedEventArgs e)
    {
        string startState = StartStateTB.Text;
        var route = new System.Text.StringBuilder(startState);

        foreach (var state in _manager.GetBestRouteOfState(startState))
        {
            route.Append('-').Append(state);
        }

        RouteLabel.Content = route.ToString();
    }
}
}