-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathAF_ANN.hpp
136 lines (125 loc) · 3.68 KB
/
AF_ANN.hpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
// *************************************************************
// Author: Abhirup Das
// Github: https://github.com/codebuddha
// LinkedIn: https://www.linkedin.com/in/abhirup-das-5a174212a/
// *************************************************************
#include <iostream>
#include <arrayfire.h>
#include <af/util.h>
#include <af/gfor.h>
#include <cmath>
#include <cassert>
#include <vector>
#include <unordered_map>
#include <string>
#include "Layer.hpp"
using std::vector;
using std::string;
class Net{
public:
int num_layers;
vector<Layer> network;
vector<af::array> weights;
vector<int> topology;
vector<string> activations;
Net();
Net(const vector<int> &topo, const vector<string> activs, double range);
void setNetwork(const af::array &inputVals);
void feedForward();
void backProp(float lr_rate);
void getLoss(const af::array &targetVals);
void L1loss(const af::array &targetVals);
void BCEloss(const af::array &targetVals);
af::array getOutput();
void print_all_layers();
void weight_dims();
af::array net_loss;
float alpha;
};
void Net::print_all_layers()
{
for(auto &i: network)
af_print(i.layer);
}
void Net::weight_dims()
{
std::cout << "Weights:\n";
for(auto &w: weights)
std::cout << w.dims() << "\n";
}
Net::Net(const vector<int> &topo, const vector<string> activs, double range)
{
topology = topo;
activations = activs;
num_layers = topology.size();
network.resize(topology.size());
weights.resize(topology.size() - 1);
for(int i=0; i<topo.size()-1; i++)
weights[i] = range * af::randu(topo[i]+1, topo[i+1]) - range/2;
net_loss = 0;
}
void Net::setNetwork(const af::array &inputVals)
{
assert ((inputVals.dims(1) == topology[0]) && "Invalid inputVals dimensions.");
int b_size = inputVals.dims(0);
for(int i=0; i<num_layers; i++)
if(i != num_layers-1){
network[i] = Layer(b_size, topology[i]+1, activations[i]);
network[i].layer(af::span, topology[i]) = 1.0;
}
else
network[i] = Layer(b_size, topology[i], activations[i]);
network[0].layer(af::span, af::seq(inputVals.dims(1))) = inputVals;
}
void Net::feedForward()
{
for(int i=0; i<num_layers-1; i++)
{
Layer &ll = network[i+1];
af::array tmp = af::matmul(network[i].layer, weights[i]);
ll.layer(af::span, af::seq(tmp.dims(1))) = ll.activ_fn(tmp);
}
}
void Net::L1loss(const af::array &targetVals)
{
af::array &out = network.back().layer;
assert (targetVals.dims(0) == out.dims(0) && targetVals.dims(1) == out.dims(1) && "Invalid targetVals dimensions.");
net_loss = (out - targetVals);
}
void Net::BCEloss(const af::array &targetVals)
{
af::array &out = network.back().layer;
assert (targetVals.dims(0) == out.dims(0) && targetVals.dims(1) == out.dims(1) && "Invalid targetVals dimensions.");
net_loss = (-targetVals*af::log2(out));
}
void Net::backProp(float lr_rate)
{
alpha = lr_rate;//learning rate
af::array out = network.back().layer;
int batch_size = out.dims(0);
//func.pointer 'deriv' points to appropriate activation fn.
//... for respective layers
af::array (*deriv)(const af::array&) = network.back().activ_deriv_fn;
af::array err = net_loss;
for(int i=num_layers-2; i>=0; i--)
{
Layer curr = network[i];
af::array delta = (deriv(out)*err).T();
//adjusting Weights
af::array grad = -(alpha * af::matmul(delta, curr.layer)) / batch_size;
weights[i] += grad.T();
//'out' will denote current layer in next step of backprop
//'out' excludes bias of current layer
out = curr.layer(af::span, af::seq(curr.layer.dims(1)-1));
// //updating the activation function for 'out'
deriv = curr.activ_deriv_fn;
//
err = af::matmulTT(delta, weights[i]);
// //Removing error bias
err = err(af::span, af::seq(out.dims(1)));
}
}
af::array Net::getOutput()
{
return network.back().layer;
}