/******************************************************************************* * Copyright 2018 Intel Corporation * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. *******************************************************************************/ #ifndef CPU_REF_SHUFFLE_HPP #define CPU_REF_SHUFFLE_HPP #include #include "c_types_map.hpp" #include "type_helpers.hpp" #include "utils.hpp" #include "cpu_shuffle_pd.hpp" #include "cpu_primitive.hpp" namespace mkldnn { namespace impl { namespace cpu { template struct ref_shuffle_t : public cpu_primitive_t { using shuffle_class = ref_shuffle_t; struct pd_t: public cpu_shuffle_pd_t { using cpu_shuffle_pd_t::cpu_shuffle_pd_t; DECLARE_COMMON_PD_T("ref:any", shuffle_class); status_t init() { using namespace format_tag; bool ok = true && data_type_size == types::data_type_size(data_md()->data_type); if (!ok) return status::unimplemented; if (ndims() == 5) { dat_tag_ = memory_desc_matches_one_of_tag( *data_md(), nCdhw16c, nCdhw8c, ncdhw, ndhwc); } else if (ndims() == 4) { dat_tag_ = memory_desc_matches_one_of_tag( *data_md(), nChw16c, nChw8c, nchw, nhwc); } else dat_tag_ = any; return status::success; } format_tag_t dat_tag_; }; ref_shuffle_t(const pd_t *apd): cpu_primitive_t(apd) { const int axis_size = pd()->axis_size(); const int group_size = pd()->group_size(); const int transpose_row = pd()->is_fwd() ? group_size : axis_size / group_size; const int transpose_col = pd()->is_fwd() ? axis_size / group_size : group_size; rev_transposed_ = (int *)malloc(axis_size * sizeof(int), 64); parallel_nd(transpose_col, transpose_row, [&](int i, int j) { rev_transposed_[j * transpose_col + i] = i * transpose_row + j; }); } ~ref_shuffle_t() { free(rev_transposed_); } typedef typename typesize_traits::type data_t; virtual status_t execute(const exec_ctx_t &ctx) const override { using namespace format_tag; switch (pd()->dat_tag_) { case nCdhw16c: execute_(ctx); break; case nChw16c: execute_(ctx); break; case nCdhw8c: execute_(ctx); break; case nChw8c: execute_(ctx); break; case ncdhw: execute_(ctx); break; case nchw: execute_(ctx); break; case ndhwc: execute_(ctx); break; case nhwc: execute_(ctx); break; default: execute_(ctx); break; } return status::success; } private: template void execute_(const exec_ctx_t &ctx) const; const pd_t *pd() const { return (const pd_t *)primitive_t::pd(); } int *rev_transposed_; }; } } } #endif // vim: et ts=4 sw=4 cindent cino^=l0,\:0,N-s