summary | refs | log | tree | commit | diff
path: root/thirdparty/oidn/mkl-dnn/src/cpu/ref_eltwise.hpp
diff options
context:
space:
mode:
Diffstat (limited to 'thirdparty/oidn/mkl-dnn/src/cpu/ref_eltwise.hpp')
-rw-r--r-- thirdparty/oidn/mkl-dnn/src/cpu/ref_eltwise.hpp | 168
1 files changed, 168 insertions, 0 deletions
diff --git a/thirdparty/oidn/mkl-dnn/src/cpu/ref_eltwise.hpp b/thirdparty/oidn/mkl-dnn/src/cpu/ref_eltwise.hpp
new file mode 100644
index 0000000000..8f4ab35413
--- /dev/null
+++ b/thirdparty/oidn/mkl-dnn/src/cpu/ref_eltwise.hpp
@@ -0,0 +1,168 @@
+/*******************************************************************************
+* Copyright 2016-2018 Intel Corporation
+*
+* Licensed under the Apache License, Version 2.0 (the "License");
+* you may not use this file except in compliance with the License.
+* You may obtain a copy of the License at
+*
+* http://www.apache.org/licenses/LICENSE-2.0
+*
+* Unless required by applicable law or agreed to in writing, software
+* distributed under the License is distributed on an "AS IS" BASIS,
+* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+* See the License for the specific language governing permissions and
+* limitations under the License.
+*******************************************************************************/
+
+#ifndef CPU_REF_ELTWISE_HPP
+#define CPU_REF_ELTWISE_HPP
+
+#include <assert.h>
+
+#include "c_types_map.hpp"
+#include "type_helpers.hpp"
+#include "utils.hpp"
+
+#include "cpu_eltwise_pd.hpp"
+#include "cpu_primitive.hpp"
+
+namespace mkldnn {
+namespace impl {
+namespace cpu {
+
+struct ref_eltwise_scalar_fwd_t { // Scalar eltwise helper: stores an algorithm kind with its alpha/beta parameters and declares compute_scalar().
+public: // redundant in a struct (members are public by default); kept as-is
+ ref_eltwise_scalar_fwd_t(alg_kind_t alg, float alpha, float beta); // declared only; presumably initialises alg_/alpha_/beta_ -- definition is not in this header
+
+ // note that eltwise.scale is ignored
+ ref_eltwise_scalar_fwd_t(const post_ops_t::entry_t::eltwise_t &eltwise); // builds the helper from a post-op eltwise entry; not marked explicit, so implicit conversion is possible
+
+ float compute_scalar(float s); // takes one float and returns one float; declared non-const even though all data members are const
+
+ const alg_kind_t alg_; // const data members: can only be set in a constructor initialiser list
+ const float alpha_;
+ const float beta_;
+};
+
+template <impl::data_type_t data_type> // data_type: element type handled by this instantiation
+struct ref_eltwise_fwd_t: public cpu_primitive_t { // Forward eltwise primitive; execute() dispatches to one of three paths selected by pd_t::init().
+ struct pd_t: public cpu_eltwise_fwd_pd_t { // Primitive descriptor: validates the request and records which execution path applies.
+ using cpu_eltwise_fwd_pd_t::cpu_eltwise_fwd_pd_t; // inherit the base-class constructors
+
+ DECLARE_COMMON_PD_T("ref:any", ref_eltwise_fwd_t); // project macro defined elsewhere; presumably ties the name "ref:any" to this primitive -- confirm
+
+ status_t init() { // returns status::success when this implementation accepts the request, status::unimplemented otherwise
+ using namespace utils; // presumably supplies one_of / everyone_is used below -- confirm in utils.hpp
+
+ auto src_d = memory_desc_wrapper(src_md());
+
+ use_dense_ = false // the leading `false ||` only keeps the operands visually aligned
+ || src_d.is_dense()
+ || (src_d.is_dense(true) && is_zero_preserved()); // is_dense(true) presumably also accepts padded layouts -- confirm against memory_desc_wrapper
+
+ use_nCspBc_padded_ = !use_dense_ // only considered once the dense path has been rejected
+ && src_d.blocking_desc().inner_nblks == 1 // exactly one inner block ...
+ && one_of(src_d.blocking_desc().inner_blks[0], 8, 16) // ... whose size is 8 or 16 ...
+ && src_d.blocking_desc().inner_idxs[0] == 1 // ... presumably blocking dimension index 1 -- confirm
+ && src_d.only_padded_dim(1)
+ && src_d.is_dense(true);
+
+ if (has_zero_dim_memory()) // zero-dim memory: clear both flags so execute() takes the generic path
+ use_dense_ = use_nCspBc_padded_ = false;
+
+ const bool use_generic = !use_dense_ && !use_nCspBc_padded_;
+
+ bool ok = true
+ && is_fwd()
+ && everyone_is(data_type, desc()->data_desc.data_type) // descriptor data type must equal the template argument
+ && IMPLICATION(use_generic, one_of(src_d.ndims(), 4, 5)) // generic path accepted only for 4 or 5 dims (assuming IMPLICATION(a, b) means !a || b)
+ && attr()->has_default_values();
+ if (!ok) return status::unimplemented;
+
+ return status::success;
+ }
+
+ bool use_dense_, use_nCspBc_padded_; // path flags written by init() and read by execute()
+ };
+
+ ref_eltwise_fwd_t(const pd_t *apd): cpu_primitive_t(apd) {} // forwards the descriptor pointer to the base class
+ typedef typename prec_traits<data_type>::type data_t; // type obtained from prec_traits for data_type
+
+ virtual status_t execute(const exec_ctx_t &ctx) const override { // runs the path chosen in pd_t::init(); always returns status::success
+ if (pd()->use_dense_)
+ execute_forward_dense(ctx);
+ else if (pd()->use_nCspBc_padded_)
+ execute_forward_nCspBc_padded(ctx);
+ else
+ execute_forward_generic(ctx);
+ return status::success;
+ }
+
+private: // the three kernels below are declared only; their definitions are not in this header
+ void execute_forward_nCspBc_padded(const exec_ctx_t &ctx) const;
+ void execute_forward_dense(const exec_ctx_t &ctx) const;
+ void execute_forward_generic(const exec_ctx_t &ctx) const;
+ const pd_t *pd() const { return (const pd_t *)primitive_t::pd(); } // C-style downcast of the base-class descriptor to this primitive's pd_t
+};
+
+template <impl::data_type_t data_type> // data_type: element type handled by this instantiation
+struct ref_eltwise_bwd_t: public cpu_primitive_t { // Backward eltwise primitive; execute() dispatches to a dense or a generic path selected by pd_t::init().
+ struct pd_t: public cpu_eltwise_bwd_pd_t { // Primitive descriptor: validates the request and records whether the dense path applies.
+ using cpu_eltwise_bwd_pd_t::cpu_eltwise_bwd_pd_t; // inherit the base-class constructors
+
+ DECLARE_COMMON_PD_T("ref:any", ref_eltwise_bwd_t); // project macro defined elsewhere; presumably ties the name "ref:any" to this primitive -- confirm
+
+ status_t init() { // returns status::success when this implementation accepts the request, status::unimplemented otherwise
+ using namespace utils; // presumably supplies one_of / everyone_is used below -- confirm in utils.hpp
+
+ bool ok = true
+ && !is_fwd() // backward only
+ && everyone_is(data_type,
+ desc()->data_desc.data_type,
+ desc()->diff_data_desc.data_type) // both data and diff-data descriptors must use the template data type
+ && attr()->has_default_values();
+ if (!ok) return status::unimplemented;
+
+ auto diff_dst_d = memory_desc_wrapper(diff_dst_md());
+ const bool same_fmt_ = diff_dst_d == memory_desc_wrapper(src_md()); // a local despite the member-style trailing underscore
+
+ use_dense_ = true // the leading `true &&` only keeps the operands visually aligned
+ && same_fmt_ // diff_dst and src descriptors compare equal
+ && diff_dst_d.is_dense(true) // is_dense(true) presumably also accepts padded layouts -- confirm against memory_desc_wrapper
+ && is_zero_preserved()
+ && !has_zero_dim_memory();
+ const bool use_generic = !use_dense_;
+
+ if (use_generic && !one_of(diff_dst_d.ndims(), 4, 5)) // generic path is accepted only for 4 or 5 dimensions
+ return status::unimplemented;
+
+ return status::success;
+ }
+
+ bool use_dense_; // path flag written by init() and read by execute()
+ };
+
+ ref_eltwise_bwd_t(const pd_t *apd): cpu_primitive_t(apd) {} // forwards the descriptor pointer to the base class
+ typedef typename prec_traits<data_type>::type data_t; // type obtained from prec_traits for data_type
+
+ virtual status_t execute(const exec_ctx_t &ctx) const override { // runs the path chosen in pd_t::init(); always returns status::success
+ if (pd()->use_dense_)
+ execute_backward_dense(ctx);
+ else
+ execute_backward_generic(ctx);
+ return status::success;
+ }
+
+private: // the two kernels below are declared only; their definitions are not in this header
+ void execute_backward_dense(const exec_ctx_t &ctx) const;
+ void execute_backward_generic(const exec_ctx_t &ctx) const;
+ const pd_t *pd() const { return (const pd_t *)primitive_t::pd(); } // C-style downcast of the base-class descriptor to this primitive's pd_t
+};
+
+}
+}
+}
+
+#endif
+
+// vim: et ts=4 sw=4 cindent cino^=l0,\:0,N-s