forked from pytorch/pytorch
-
Notifications
You must be signed in to change notification settings - Fork 0
/
gather_ranges_to_dense_op.cc
102 lines (92 loc) · 3.22 KB
/
gather_ranges_to_dense_op.cc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
#include "caffe2/operators/gather_ranges_to_dense_op.h"
namespace caffe2 {
namespace {
// Schema for the GatherRangesToDense operator: declares its input/output
// arity, the user-facing documentation, its arguments, and the function used
// to infer output shapes from the input shapes and the `lengths` argument.
OPERATOR_SCHEMA(GatherRangesToDense)
    // Inputs: DATA, RANGES, and the optional KEY.
    .NumInputs(2, 3)
    // One output per entry of `lengths`, hence no fixed upper bound.
    .NumOutputs(1, INT_MAX)
    .SetDoc(R"DOC(
Given DATA tensor of rank 1, and RANGES tensor of rank 3, gather values
corresponding to each range into a separate output tensor. If the optional input
KEY tensor is also given, the output will be sorted by KEY for each example.
RANGES dimensions description:
1: represents list of examples within a batch
2: represents list features
3: two values which are start and length of a range (to be applied on DATA)
Each feature has fixed lengths which are passed as lengths argument and a
separate tensor will be produced for each feature.
i.e. RANGES.dim(1) = len(lengths) = NumOutputs.
Missing features (represented by empty ranges) filled with default_value.
Example 1:
DATA = [1, 2, 3, 4, 5, 6, 7, 8]
RANGES = [
[
[2, 4],
[0, 2],
],
[
[0, 0],
[6, 2],
]
]
lengths = [4, 2]
OUTPUT[0] = [[3, 4, 5, 6], [0, 0, 0, 0]]
OUTPUT[1] = [[1, 2], [7, 8]]
Example 2 (with KEY):
DATA = [1, 2, 3, 4, 5, 6, 7, 8]
KEY = [0, 1, 3, 2, 1, 0, 1, 0]
RANGES = [
[
[2, 4],
[0, 2],
],
[
[0, 0],
[6, 2],
]
]
lengths = [4, 2]
OUTPUT[0] = [[6, 5, 4, 3], [0, 0, 0, 0]]
OUTPUT[1] = [[1, 2], [8, 7]]
Contrast Example 2 with Example 1. For each data point per feature, the values
are sorted by the corresponding KEY.
)DOC")
    .Input(0, "DATA", "Tensor of rank 1.")
    .Input(
        1,
        "RANGES",
        "Tensor of int32/int64 ranges, of dims (N, M, 2). "
        "Where N is number of examples and M is a size of each example. "
        "Last dimension represents a range in the format (start, length)")
    .Input(2, "KEY", "Tensor of rank 1 and type int64.")
    .Output(
        0,
        "OUTPUT",
        "One 2-D tensor per feature: output i has shape (N, lengths[i]) and "
        "holds the values gathered for feature i")
    .Arg("lengths", "Expected lengths for ranges")
    .Arg(
        "min_observation",
        "The number of observations needed before deciding that the ratio of "
        "mismatched ranges is alarming, also determines whether an info "
        "summarizing the empty and mismatch ratio will be printed at the end.")
    .Arg(
        "max_mismatched_ratio",
        "An error is raised when ratio of mismatched ranges exceeds this.")
    // Shape inference: validates the ranks of the inputs and produces one
    // output shape per entry of `lengths`.
    .TensorInferenceFunction([](const OperatorDef& def,
                                const vector<TensorShape>& in) {
      ArgumentHelper helper(def);
      const auto lengths = helper.GetRepeatedArgument<int>("lengths");
      CAFFE_ENFORCE_EQ(in[0].dims_size(), 1, "DATA should be 1-D tensor.");
      CAFFE_ENFORCE_EQ(in[1].dims_size(), 3, "RANGES should be 3-D tensor.");
      // KEY is optional; only check it when a third input is present.
      if (in.size() > 2) {
        CAFFE_ENFORCE_EQ(in[2].dims_size(), 1, "KEY should be 1-D tensor.");
      }
      CAFFE_ENFORCE_GT(lengths.size(), 0, "lengths should be non-empty.");
      std::vector<TensorShape> out(lengths.size());
      // Index with size_t so the comparison against lengths.size() does not
      // mix signed and unsigned operands.
      for (size_t i = 0; i < lengths.size(); ++i) {
        // Output i takes DATA's element type and has shape
        // (RANGES.dim(0), lengths[i]).
        out[i].set_data_type(in[0].data_type());
        out[i].add_dims(in[1].dims(0));
        out[i].add_dims(lengths[i]);
      }
      return out;
    });
// Register GatherRangesToDenseOp<CPUContext> as the CPU implementation of the
// GatherRangesToDense operator.
REGISTER_CPU_OPERATOR(GatherRangesToDense, GatherRangesToDenseOp<CPUContext>);
// Mark GatherRangesToDense as having no gradient operator.
NO_GRADIENT(GatherRangesToDense);
} // namespace
} // namespace caffe2