This repository has been archived by the owner on Mar 3, 2020. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 94
/
Copy pathNonlinearity.h
executable file
·85 lines (67 loc) · 1.88 KB
/
Nonlinearity.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
/*
* Copyright (c) 2015-present, Facebook, Inc.
* All rights reserved.
*
* This source code is licensed under the BSD-style license found in the
* LICENSE file in the root directory of this source tree. An additional grant
* of patent rights can be found in the PATENTS file in the same directory.
*
*/
#ifndef _NONLINEARITY_
#define _NONLINEARITY_
#include <algorithm>
#include <vector>
#include "common.h"
#include "Vec.h"
namespace rnn{
struct Softmax{
void static forward(Vec& v, my_int b = 0, my_int e = -1){
if(e == -1) e = v.size();
my_real max=v[b], denom = 0;
for(my_int i = b; i < e; i++)
if(v[i] > max) max = v[i];
for(my_int i = b; i < e; i++){
v[i] = exp(v[i]-max);
denom += v[i];
}
for(my_int i = b; i < e; i++)
v[i] = v[i] / denom;
}
void static backward(Vec& err, const Vec& v, my_int b = 0, my_int e = -1){
if(e == -1) e = v.size();
Vec grad = err;
for(my_int i = b; i < e; i++){
grad[i] = err[i] * v[i];
for(my_int j = b; j < e; j++)
grad[i] -= err[j] * v[j] * v[i];
}
err = grad;
}
};
struct Sigmoid{
void static forward(my_real& v){
if(v > 50 ) v = 50;
if(v < -50 ) v = -50;
v = 1 / (1 + exp(-v));
}
void static forward(Vec& v, my_int b = -1, my_int e = -1){
if(b == - 1) b =0;
if(e == -1 ) e = v.size();
for (my_int i = b; i < e; i++)
{
if(v[i] > 50 ) v[i] = 50;
if(v[i] < -50 ) v[i] = -50;
v[i] = 1 / (1 + exp(-v[i]));
}
}
void static backward(my_real& err, const my_real& v){
err = err * v * (1 - v);
}
void static backward(Vec& err, const Vec& v, my_int b = 0, my_int e = -1){
if(e == -1) e = err.size();
for(my_int i = b; i < e; i++)
err[i] = err[i] * (v[i] * (1 - v[i]));
}
};
}
#endif