forked from pytorch/pytorch
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathLinear.cpp
64 lines (50 loc) · 1.77 KB
/
Linear.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
#include <ATen/ATen.h>
#include <ATen/Config.h>
#include <ATen/NativeFunctions.h>
#if !AT_MKLDNN_ENABLED()
namespace at {
namespace native {
// Fallback definition used when ATen is built without MKL-DNN support
// (AT_MKLDNN_ENABLED() is false). It keeps the symbol available and
// unconditionally raises an error; none of the arguments are inspected.
Tensor mkldnn_linear(
    const Tensor& self,
    const Tensor& weight,
    const Tensor& bias) {
  // TORCH_CHECK(false, ...) is used instead of the deprecated AT_ERROR alias,
  // matching the error-reporting style of the MKL-DNN-enabled implementation.
  TORCH_CHECK(false, "mkldnn_linear: ATen not compiled with MKLDNN support");
}
} // namespace native
} // namespace at
#else // AT_MKLDNN_ENABLED
#include <ATen/native/mkldnn/MKLDNNCommon.h>
namespace at {
namespace native {
// Linear layer forward pass for MKL-DNN layout tensors, computed with
// ideep::inner_product_forward.
//
// Parameters:
//   self   - input tensor; must be in MKL-DNN layout with at least 2 dims.
//            Inputs with more than 2 dims are flattened to 2-D
//            ({-1, last_dim}) before the computation.
//   weight - weight tensor; must be in MKL-DNN layout. Its size(0) becomes
//            the last dimension of the result.
//   bias   - optional bias; may be an undefined Tensor, otherwise it must be
//            in MKL-DNN layout.
//
// Returns an MKL-DNN tensor (created with self.options()) whose sizes are
// those of `self` with the last dimension replaced by weight.size(0).
//
// Raises (via TORCH_CHECK) if any of the preconditions above is violated.
Tensor mkldnn_linear(
    const Tensor& self,
    const Tensor& weight,
    const Tensor& bias) {
  TORCH_CHECK(self.dim() >= 2,
      "mkldnn_linear: input needs to has dim at least 2, input dim ", self.dim());
  TORCH_CHECK(self.is_mkldnn(),
      "mkldnn_linear: input needs to be mkldnn layout");
  // Only validate the bias layout when a bias is actually supplied. Requiring
  // bias.is_mkldnn() unconditionally would reject an undefined bias and make
  // the bias-less compute path below unreachable.
  TORCH_CHECK(weight.is_mkldnn() && (!bias.defined() || bias.is_mkldnn()),
      "mkldnn_linear: weight and bias need to be mkldnn layout");

  const bool needs_flatten = self.dim() > 2;

  // Flatten to 2-D first when the input has more than 2 dims; note that the
  // reshape costs a memory copy.
  auto self_reshaped = needs_flatten
      ? self.reshape({-1, self.size(self.dim() - 1)})
      : self;

  const ideep::tensor x = itensor_from_mkldnn(self_reshaped);
  const ideep::tensor w = itensor_from_mkldnn(weight);

  ideep::tensor y;
  if (bias.defined()) {
    const ideep::tensor b = itensor_from_mkldnn(bias);
    ideep::inner_product_forward::compute(x, w, b, y);
  } else {
    ideep::inner_product_forward::compute(x, w, y);
  }

  if (needs_flatten) {
    // Restore the original leading dimensions; only the last dimension
    // changes, to weight.size(0).
    auto input_size = self.sizes();
    std::vector<int64_t> output_size(input_size.begin(), input_size.end() - 1);
    output_size.push_back(weight.size(0));
    return new_with_itensor_mkldnn(std::move(y), self.options()).reshape(output_size);
  }
  return new_with_itensor_mkldnn(std::move(y), self.options());
}
} // namespace native
} // namespace at
#endif // AT_MKLDNN_ENABLED