1bea8e1eac
-Added LocalVector (needed it) -Added stb_rect_pack (It's pretty cool, we could probably use it for other stuff too) -Fixes and changes all around the place -Added library for 128 bits fixed point (required for Delaunay3D)
97 lines
2.8 KiB
C++
97 lines
2.8 KiB
C++
/*******************************************************************************
* Copyright 2017-2018 Intel Corporation
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*******************************************************************************/
|
|
|
|
#ifndef CPU_JIT_AVX512_COMMON_LRN_HPP
|
|
#define CPU_JIT_AVX512_COMMON_LRN_HPP
|
|
|
|
#include "c_types_map.hpp"
|
|
|
|
#include "cpu_isa_traits.hpp"
|
|
#include "cpu_lrn_pd.hpp"
|
|
#include "cpu_primitive.hpp"
|
|
|
|
namespace mkldnn {
|
|
namespace impl {
|
|
namespace cpu {
|
|
|
|
struct jit_avx512_common_lrn_fwd_t: public cpu_primitive_t {
|
|
struct pd_t: public cpu_lrn_fwd_pd_t {
|
|
using cpu_lrn_fwd_pd_t::cpu_lrn_fwd_pd_t;
|
|
|
|
DECLARE_COMMON_PD_T(
|
|
JIT_IMPL_NAME_HELPER("jit:", avx512_common, ""),
|
|
jit_avx512_common_lrn_fwd_t);
|
|
|
|
status_t init();
|
|
};
|
|
|
|
jit_avx512_common_lrn_fwd_t(const pd_t *apd);
|
|
~jit_avx512_common_lrn_fwd_t();
|
|
|
|
typedef typename prec_traits<data_type::f32>::type data_t;
|
|
|
|
virtual status_t execute(const exec_ctx_t &ctx) const override {
|
|
execute_forward(ctx);
|
|
return status::success;
|
|
}
|
|
|
|
private:
|
|
void execute_forward(const exec_ctx_t &ctx) const;
|
|
const pd_t *pd() const { return (const pd_t *)primitive_t::pd(); }
|
|
|
|
int use_h_parallelism;
|
|
struct jit_avx512_common_lrn_kernel_f32;
|
|
jit_avx512_common_lrn_kernel_f32 *ker_, *ker_first_, *ker_last_;
|
|
};
|
|
|
|
struct jit_avx512_common_lrn_bwd_t: public cpu_primitive_t {
|
|
struct pd_t: public cpu_lrn_bwd_pd_t {
|
|
using cpu_lrn_bwd_pd_t::cpu_lrn_bwd_pd_t;
|
|
|
|
DECLARE_COMMON_PD_T(
|
|
JIT_IMPL_NAME_HELPER("jit:", avx512_common, ""),
|
|
jit_avx512_common_lrn_bwd_t);
|
|
|
|
status_t init();
|
|
};
|
|
|
|
jit_avx512_common_lrn_bwd_t(const pd_t *apd);
|
|
~jit_avx512_common_lrn_bwd_t();
|
|
|
|
typedef typename prec_traits<data_type::f32>::type data_t;
|
|
|
|
virtual status_t execute(const exec_ctx_t &ctx) const override {
|
|
execute_backward(ctx);
|
|
return status::success;
|
|
}
|
|
|
|
private:
|
|
void execute_backward(const exec_ctx_t &ctx) const;
|
|
const pd_t *pd() const { return (const pd_t *)primitive_t::pd(); }
|
|
|
|
int use_h_parallelism;
|
|
struct jit_avx512_common_lrn_kernel_f32;
|
|
jit_avx512_common_lrn_kernel_f32 *ker_, *ker_first_, *ker_last_;
|
|
};
|
|
|
|
}
|
|
}
|
|
}
|
|
|
|
#endif
|
|
|
|
// vim: et ts=4 sw=4 cindent cino^=l0,\:0,N-s
|