forked from apache/mxnet
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
[MKLDNN]Add quantized relu (apache#14604)
* add quantized relu * fix testcase * add author and skip quantized-relu for gpu * fix comments * retrigger ci * retrigger ci * comment fix * retrigger ci * retrigger ci
- Loading branch information
zhiyuan-huang
authored and
haohuw
committed
Jun 23, 2019
1 parent
209c7c2
commit 5af3df3
Showing
6 changed files
with
372 additions
and
70 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,74 @@ | ||
/* | ||
* Licensed to the Apache Software Foundation (ASF) under one | ||
* or more contributor license agreements. See the NOTICE file | ||
* distributed with this work for additional information | ||
* regarding copyright ownership. The ASF licenses this file | ||
* to you under the Apache License, Version 2.0 (the | ||
* "License"); you may not use this file except in compliance | ||
* with the License. You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, | ||
* software distributed under the License is distributed on an | ||
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
* KIND, either express or implied. See the License for the | ||
* specific language governing permissions and limitations | ||
* under the License. | ||
*/ | ||
|
||
/*! | ||
* Copyright (c) 2019 by Contributors | ||
* \file mkldnn_act-inl.h | ||
* \brief MKLDNN(Quantized) Activation operator based on subgraph | ||
* \author Zhiyuan Huang | ||
*/ | ||
|
||
#ifndef MXNET_OPERATOR_NN_MKLDNN_MKLDNN_ACT_INL_H_ | ||
#define MXNET_OPERATOR_NN_MKLDNN_MKLDNN_ACT_INL_H_ | ||
|
||
|
||
#if MXNET_USE_MKLDNN == 1 | ||
#include <vector> | ||
#include <utility> | ||
#include "../activation-inl.h" | ||
#include "./mkldnn_ops-inl.h" | ||
#include "./mkldnn_base-inl.h" | ||
|
||
namespace mxnet { | ||
namespace op { | ||
|
||
// Returns the mkldnn::algorithm to use for the given activation parameters. | ||
// Declaration only: the mapping is implemented outside this header. | ||
mkldnn::algorithm GetMKLDNNActAlgo(const ActivationParam& param); | ||
// Returns the eltwise-forward primitive descriptor for an activation. | ||
// param: activation parameters. | ||
// is_train: training flag (NOTE(review): presumably selects the MKLDNN prop kind - confirm). | ||
// input_mem: MKLDNN memory of the input. | ||
// dtype: data type id of the input; MKLDNNActForward passes NDArray::dtype() here. | ||
mkldnn::eltwise_forward::primitive_desc GetActFwdDescImpl( | ||
const ActivationParam& param, bool is_train, | ||
const mkldnn::memory &input_mem, int dtype); | ||
|
||
// Holder for an MKLDNN eltwise-forward primitive used by the Activation operator. | ||
// Only the constructor is defined in this header; SetNewMem() and GetFwd() are | ||
// declared here and implemented elsewhere. | ||
class MKLDNNActForward { | ||
public: | ||
// Primitive descriptor; const, so it is fixed once the object is constructed. | ||
const mkldnn::eltwise_forward::primitive_desc fwd_pd; | ||
|
||
// Initializes fwd_pd through GetActFwdDescImpl() using the activation parameters, | ||
// the training flag, the input memory `mem` and the dtype of `data`. | ||
// No primitive or memory handle is created here; fwd_, data_ and out_ start empty. | ||
MKLDNNActForward(const ActivationParam& param, bool is_train, | ||
const NDArray &data, const mkldnn::memory &mem): fwd_pd( | ||
GetActFwdDescImpl(param, is_train, mem, data.dtype())) {} | ||
// Takes the input and output memory for the next execution. | ||
// NOTE(review): presumably (re)binds data_/out_ and creates fwd_ on first use - | ||
// the definition is not visible from this header; confirm. | ||
void SetNewMem(const mkldnn::memory &data, const mkldnn::memory &output); | ||
// Returns a const reference to the eltwise-forward primitive. | ||
// NOTE(review): presumably requires SetNewMem() to have been called first - confirm. | ||
const mkldnn::eltwise_forward &GetFwd() const; | ||
|
||
private: | ||
// Shared-ownership handles to the primitive and its input/output memory. | ||
// They are not set by the constructor above. | ||
std::shared_ptr<mkldnn::eltwise_forward> fwd_; | ||
std::shared_ptr<mkldnn::memory> data_; | ||
std::shared_ptr<mkldnn::memory> out_; | ||
}; | ||
|
||
// Operator signature type specialized on ActivationParam. | ||
// NOTE(review): presumably the key used to cache MKLDNNActForward objects - confirm. | ||
typedef ParamOpSign<ActivationParam> MKLDNNActSignature; | ||
// Returns a reference to the MKLDNNActForward matching the given parameters, | ||
// operator context, input array and input memory. | ||
// NOTE(review): returning a non-const reference suggests the object is owned by a | ||
// cache outside the caller; lifetime and thread-safety are not visible here - confirm. | ||
MKLDNNActForward &GetActForward(const ActivationParam& param, | ||
const OpContext &ctx, const NDArray &in_data, | ||
const mkldnn::memory &in_mem); | ||
|
||
// MKLDNN activation forward entry point operating on one input and one output NDArray. | ||
// attrs: node attributes (NOTE(review): presumably carry the ActivationParam - confirm). | ||
// ctx: operator execution context. | ||
// in_data: input array. | ||
// req: write request type for out_data. | ||
// out_data: output array. | ||
// Also called by the quantized activation kernel in mkldnn_quantized_act.cc. | ||
void MKLDNNActivationForward(const nnvm::NodeAttrs& attrs, const OpContext &ctx, | ||
const NDArray &in_data, const OpReqType &req, | ||
const NDArray &out_data); | ||
} // namespace op | ||
} // namespace mxnet | ||
|
||
#endif // MXNET_USE_MKLDNN == 1 | ||
#endif // MXNET_OPERATOR_NN_MKLDNN_MKLDNN_ACT_INL_H_ |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,55 @@ | ||
/* | ||
* Licensed to the Apache Software Foundation (ASF) under one | ||
* or more contributor license agreements. See the NOTICE file | ||
* distributed with this work for additional information | ||
* regarding copyright ownership. The ASF licenses this file | ||
* to you under the Apache License, Version 2.0 (the | ||
* "License"); you may not use this file except in compliance | ||
* with the License. You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, | ||
* software distributed under the License is distributed on an | ||
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
* KIND, either express or implied. See the License for the | ||
* specific language governing permissions and limitations | ||
* under the License. | ||
*/ | ||
/*! | ||
* Copyright (c) 2019 by Contributors | ||
* \file mkldnn_quantized_act.cc | ||
* \brief MKLDNN(Quantized) Activation operator based on subgraph | ||
* \author Zhiyuan Huang | ||
*/ | ||
#if MXNET_USE_MKLDNN == 1 | ||
|
||
#include "../../nn/mkldnn/mkldnn_act-inl.h" | ||
#include "../quantization_utils.h" | ||
|
||
namespace mxnet { | ||
namespace op { | ||
|
||
// MKLDNN forward kernel for the _contrib_quantized_act operator. | ||
// Runs the MKLDNN activation on the quantized data tensor and copies the two float | ||
// range scalars from the inputs to the outputs unchanged. | ||
// attrs: node attributes, forwarded to MKLDNNActivationForward. | ||
// ctx: operator context, forwarded to MKLDNNActivationForward. | ||
// in_data: [0] uint8/int8 data; [1], [2] float scalars | ||
// (NOTE(review): presumably the min/max quantization range - confirm). | ||
// req: [0] write request for out_data[0]. | ||
// out_data: [0] activation result; [1], [2] receive in_data[1], in_data[2]. | ||
static void MKLDNNQuantizedActForward(const nnvm::NodeAttrs& attrs, | ||
                                      const OpContext& ctx, | ||
                                      const std::vector<NDArray>& in_data, | ||
                                      const std::vector<OpReqType>& req, | ||
                                      const std::vector<NDArray>& out_data) { | ||
  // Validate arity before indexing: the body reads in_data[0..2] and req[0] and | ||
  // writes out_data[0..2]; without these checks a malformed call is undefined behavior. | ||
  CHECK(in_data.size() >= 3U) | ||
      << "_contrib_quantized_act op expects 3 inputs, got " << in_data.size(); | ||
  CHECK(out_data.size() >= 3U) | ||
      << "_contrib_quantized_act op expects 3 outputs, got " << out_data.size(); | ||
  CHECK(!req.empty()) | ||
      << "_contrib_quantized_act op expects a write request for its output"; | ||
  CHECK(in_data[0].dtype() == mshadow::kUint8 || | ||
        in_data[0].dtype() == mshadow::kInt8) | ||
      << "_contrib_quantized_act op only supports uint8 and int8 as input " | ||
         "type"; | ||
|
||
  MKLDNNActivationForward(attrs, ctx, in_data[0], req[0], out_data[0]); | ||
  // The range scalars are passed through as-is (first float element of each array). | ||
  out_data[1].data().dptr<float>()[0] = in_data[1].data().dptr<float>()[0]; | ||
  out_data[2].data().dptr<float>()[0] = in_data[2].data().dptr<float>()[0]; | ||
} | ||
|
||
// Attaches the MKLDNN implementation to the _contrib_quantized_act operator: | ||
// sets the "TIsMKLDNN" attribute to true and installs MKLDNNQuantizedActForward | ||
// as the "FComputeEx<cpu>" kernel. | ||
// NOTE(review): inputs/outputs and shape/type inference are presumably registered | ||
// in another translation unit - confirm. | ||
NNVM_REGISTER_OP(_contrib_quantized_act) | ||
.set_attr<bool>("TIsMKLDNN", true) | ||
.set_attr<FComputeEx>("FComputeEx<cpu>", MKLDNNQuantizedActForward); | ||
|
||
} // namespace op | ||
} // namespace mxnet | ||
|
||
#endif // MXNET_USE_MKLDNN == 1 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.