// Optimizers.hpp
/*******************************************************
* Copyright (c) 2017, ArrayFire
* All rights reserved.
*
* This file is distributed under 3-clause BSD license.
* The complete license agreement can be obtained at:
* http://arrayfire.com/licenses/BSD-3-Clause
********************************************************/
#pragma once
#include <af/autograd/Variable.hpp>
#include <arrayfire.h>
#include <vector>
namespace af
{
namespace optim
{
class Optimizer
{
protected:
std::vector<autograd::Variable> m_parameters;
public:
Optimizer(const std::vector<autograd::Variable> ¶meters);
virtual void update() = 0;
void zeroGrad();
};
class SGDOptimizer : public Optimizer
{
bool m_use_nesterov;
double m_lr;
double m_mu;
double m_wd;
std::vector<af::array> m_velocities;
public:
SGDOptimizer(const std::vector<autograd::Variable> ¶meters,
double learning_rate, double momentum = 0,
double weight_decay = 0,
bool use_nesterov = false);
void update();
};
class AdamOptimizer : public Optimizer
{
double m_lr;
double m_beta1;
double m_beta2;
double m_eps;
double m_wd;
int m_count;
std::vector<af::array> m_biased_first;
std::vector<af::array> m_biased_second;
public:
AdamOptimizer(const std::vector<autograd::Variable> ¶meters,
double learning_rate,
double beta1 = 0.9,
double beta2 = 0.999,
double epsilon = 1E-8,
double weight_decay = 0);
void update();
};
class RMSPropOptimizer : public Optimizer
{
bool m_use_first;
double m_lr;
double m_rho;
double m_eps;
double m_wd;
std::vector<af::array> m_first;
std::vector<af::array> m_second;
public:
RMSPropOptimizer(const std::vector<autograd::Variable> ¶meters,
double learning_rate,
double rho = 0.99,
double epsilon = 1E-8,
double weight_decay = 0,
bool use_first = false);
void update();
};
}
}