Skip to content

Commit

Permalink
Fix warnings
Browse files Browse the repository at this point in the history
  • Loading branch information
larroy committed May 28, 2019
1 parent b8151c4 commit 18ae9b6
Show file tree
Hide file tree
Showing 7 changed files with 64 additions and 3 deletions.
3 changes: 3 additions & 0 deletions src/operator/contrib/deformable_psroi_pooling.cc
Original file line number Diff line number Diff line change
Expand Up @@ -70,7 +70,10 @@ namespace mshadow {
const index_t num_classes,
const index_t channels_each_class,
DType* top_data, DType* top_count) {
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
#pragma omp parallel for num_threads(omp_threads)
for (index_t index = 0; index < count; index++) {
// The output is in order (n, ctop, ph, pw)
Expand Down
4 changes: 3 additions & 1 deletion src/operator/contrib/multibox_detection.cc
Original file line number Diff line number Diff line change
Expand Up @@ -96,8 +96,10 @@ inline void MultiBoxDetectionForward(const Tensor<cpu, 3, DType> &out,
const int num_anchors = cls_prob.size(2);
const int num_batches = cls_prob.size(0);
const DType *p_anchor = anchors.dptr_;

#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
std::vector<DType> outputs;
outputs.reserve(num_anchors * 6);
for (int nbatch = 0; nbatch < num_batches; ++nbatch) {
Expand Down
3 changes: 3 additions & 0 deletions src/operator/contrib/psroi_pooling.cc
Original file line number Diff line number Diff line change
Expand Up @@ -51,7 +51,10 @@ template <typename DType>
const int output_dim,
const int group_size,
DType* top_data) {
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
#pragma omp parallel for num_threads(omp_threads)
for (int index = 0; index < count; index++) {
// The output is in order (n, ctop, ph, pw)
Expand Down
3 changes: 3 additions & 0 deletions src/operator/l2_normalization.cc
Original file line number Diff line number Diff line change
Expand Up @@ -49,7 +49,10 @@ class L2NormalizationOpCPU : public L2NormalizationOp<cpu, DType> {
CHECK_EQ(out_data.size(), 2U);
Stream<cpu> *s = ctx.get_stream<cpu>();
mxnet::TShape orig_shape = in_data[l2_normalization::kData].shape_;
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
auto omp_threads = engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
if (this->param_.mode == l2_normalization::kInstance) {
Shape<2> dshape = Shape2(orig_shape[0],
orig_shape.ProdShape(1, orig_shape.ndim()));
Expand Down
50 changes: 48 additions & 2 deletions src/operator/rnn_impl.h
Original file line number Diff line number Diff line change
Expand Up @@ -97,8 +97,10 @@ void LstmForwardTrainingSingleLayer(DType* ws,
const DType beta = 0.0;
const int cell_size = N * H;
linalg_gemm(x, wx, yx_flat, alpha, beta, false, true);

#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
for (int i = 0; i < T; ++i) {
int t = bid ? T - 1 - i : i;
linalg_gemm(i ? h : hx, wh, yh_flat, alpha, beta, false, true);
Expand Down Expand Up @@ -158,7 +160,10 @@ void LstmForwardTraining(DType* ws,
const int cell_size = N * H;
unsigned int seed_ = 17 + rand() % 4096; // NOLINT(runtime/threadsafe_fn)
int idx = 0; // state & cell state's idx;
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
for (int i = 0; i < L; ++i) {
const int input_size = i ? H * D : I;
const int w_size = (input_size + H) * H * 4;
Expand Down Expand Up @@ -240,8 +245,10 @@ void LstmForwardInferenceSingleLayer(DType* ws,
const DType beta = 0.0;
const int cell_size = N * H;
linalg_gemm(x, wx, yx_flat, alpha, beta, false, true);

#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
for (int i = 0; i < T; ++i) {
int t = bid ? T - 1 - i : i;
linalg_gemm(i ? h : hx, wh, yh_flat, alpha, beta, false, true);
Expand Down Expand Up @@ -367,7 +374,10 @@ void LstmBackwardSingleLayer(DType* ws,
DType *c_ptr = bid ? rs + T * N * H * 7 : rs;
const Tensor<cpu, 3, DType> c(c_ptr, Shape3(T, N, H));
const Tensor<cpu, 4, DType> ifgo(c_ptr + T * N * H, Shape4(T, N, H, 4));
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
if (req_params != kNullOp && req_params != kAddTo) {
#pragma omp parallel for num_threads(omp_threads)
for (int i = 0; i < H * 4 * H; ++i) {
Expand Down Expand Up @@ -577,7 +587,10 @@ void LstmBackward(DType* ws,
}
if (dropout > 0.0f && i > 0 && req_data != kNullOp) {
dropout_random = dropout_random - T * N * D * H;
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
#pragma omp parallel for num_threads(omp_threads)
for (int j = 0; j < T * N * D * H; j++) {
if (dropout_random[j] == 0) {
Expand Down Expand Up @@ -632,7 +645,10 @@ void GruForwardInferenceSingleLayer(DType* ws,
const Tensor<cpu, 2, DType> back_wh(back_wh_ptr, Shape2(H * 3, H));
const Tensor<cpu, 2, DType> back_bx(back_bx_ptr, Shape2(3, H));
const Tensor<cpu, 2, DType> back_bh(back_bh_ptr, Shape2(3, H));
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
if (D == 1) {
#pragma omp parallel for num_threads(omp_threads)
for (int i = 0; i < N; i++)
Expand Down Expand Up @@ -844,7 +860,10 @@ void GruForwardTrainingSingleLayer(DType* ws,
const Tensor<cpu, 2, DType> back_wh(back_wh_ptr, Shape2(H * 3, H));
const Tensor<cpu, 2, DType> back_bx(back_bx_ptr, Shape2(3, H));
const Tensor<cpu, 2, DType> back_bh(back_bh_ptr, Shape2(3, H));
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
if (D == 1) {
#pragma omp parallel for num_threads(omp_threads)
for (int i = 0; i < N; i++)
Expand Down Expand Up @@ -1008,7 +1027,10 @@ void GruForwardTraining(DType* ws,
y_l = y_l + T * N * H * D;
}
if (dropout > 0.0f && l > 0) {
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
#pragma omp parallel for num_threads(omp_threads)
for (int i = 0; i < T * N * I; i++) {
int rand_data = rand_r(&seed_);
Expand Down Expand Up @@ -1040,7 +1062,10 @@ void GruForwardTraining(DType* ws,
}
wh_l = wx_l + I * 3 * H;
}
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
#pragma omp parallel for num_threads(omp_threads)
for (int i = 0; i < T * N * H * D; ++i) {
y_ptr[i] = y_l[i];
Expand Down Expand Up @@ -1106,7 +1131,10 @@ void GruBackwardSingleLayer(DType* ws,
const Tensor<cpu, 2, DType> wh(wh_ptr, Shape2(H * 3, H));
const Tensor<cpu, 2, DType> back_wx(back_wx_ptr, Shape2(H * 3, I));
const Tensor<cpu, 2, DType> back_wh(back_wh_ptr, Shape2(H * 3, H));
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
if (req_params != kNullOp && req_params != kAddTo) {
#pragma omp parallel for num_threads(omp_threads)
for (int i = 0; i < D * H * 3 * H; ++i) {
Expand Down Expand Up @@ -1451,7 +1479,10 @@ void GruBackward(DType* ws,
Tensor<cpu, 3, DType> hx(hx_ptr, Shape3(L, D * N, H));
int inputsize = I;
DType* y_tmp = y_l - T * N * H * D;
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
for (int l = L - 1; l >= 0; --l) {
if (l == 0) {
I = inputsize;
Expand Down Expand Up @@ -1546,7 +1577,10 @@ void VanillaRNNForwardInferenceSingleLayer(DType* ws,
const Tensor<cpu, 2, DType> back_wh(back_wh_ptr, Shape2(H, H));
const Tensor<cpu, 2, DType> back_bx(back_bx_ptr, Shape2(1, H));
const Tensor<cpu, 2, DType> back_bh(back_bh_ptr, Shape2(1, H));
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
if (D == 1) {
#pragma omp parallel for num_threads(omp_threads)
for (int i = 0; i < N; i++)
Expand Down Expand Up @@ -1747,7 +1781,10 @@ void VanillaRNNForwardTrainingSingleLayer(DType* ws,
const Tensor<cpu, 2, DType> back_wh(back_wh_ptr, Shape2(H * 1, H));
const Tensor<cpu, 2, DType> back_bx(back_bx_ptr, Shape2(1, H));
const Tensor<cpu, 2, DType> back_bh(back_bh_ptr, Shape2(1, H));
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
if (D == 1) {
#pragma omp parallel for num_threads(omp_threads)
for (int i = 0; i < N; i++)
Expand Down Expand Up @@ -1887,7 +1924,10 @@ void VanillaRNNForwardTraining(DType* ws,
DType* bx_l = bx;
DType* bh_l = bh;
DType* y_tmp = x_ptr;
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
unsigned int seed_ = 17 + rand() % 4096; // NOLINT(runtime/threadsafe_fn)
for (int l = 0; l < L; l++) {
if (l != 0) {
Expand Down Expand Up @@ -1979,7 +2019,10 @@ void VanillaRNNBackwardSingleLayer(DType* ws,
const Tensor<cpu, 2, DType> wh(wh_ptr, Shape2(H, H));
const Tensor<cpu, 2, DType> back_wx(back_wx_ptr, Shape2(H, I));
const Tensor<cpu, 2, DType> back_wh(back_wh_ptr, Shape2(H, H));
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
if (req_params != kNullOp && req_params != kAddTo) {
#pragma omp parallel for num_threads(omp_threads)
for (int i = 0; i < D * H * H; ++i) {
Expand Down Expand Up @@ -2306,7 +2349,10 @@ void VanillaRNNBackward(DType* ws,
Tensor<cpu, 3, DType> hx(hx_ptr, Shape3(L, D * N, H));
int inputsize = I;
DType* y_tmp = y_l - T * N * H * D;
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads = mxnet::engine::OpenMP::Get()->GetRecommendedOMPThreadCount();
#pragma GCC diagnostic pop
for (int l = L - 1; l >= 0; --l) {
if (l == 0) {
I = inputsize;
Expand Down
3 changes: 3 additions & 0 deletions src/operator/tensor/ordering_op-inl.h
Original file line number Diff line number Diff line change
Expand Up @@ -202,7 +202,10 @@ MSHADOW_FORCE_INLINE void TopKSort(const Tensor<cpu, 1, DType>& dat,
const bool full_sort(K*8 > N);
// Batch size.
const int M(work.size(0)/(sizeof(DType)*N));
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
const int omp_threads(engine::OpenMP::Get()->GetRecommendedOMPThreadCount());
#pragma GCC diagnostic pop
#pragma omp parallel for num_threads(omp_threads)
for (int i = 0; i < M; ++i) {
// Tensor `work` stores the flattened source data, while `dat` stores the sorted result.
Expand Down
1 change: 1 addition & 0 deletions tests/cpp/misc/libinfo_test.cc
Original file line number Diff line number Diff line change
Expand Up @@ -30,4 +30,5 @@ using namespace mxnet::features;
// Smoke test for the runtime feature registry: checks the size of the feature
// name table and that the feature list can be retrieved from LibInfo.
TEST(RuntimeTest, RuntimeTestAll) {
  // The table of feature names must have exactly MAX_FEATURES entries.
  EXPECT_EQ(EnumNames::names.size(), MAX_FEATURES);
  const auto& features = LibInfo::getInstance()->getFeatures();
  // This check exists mainly so that `features` is referenced and not reported
  // as an unused variable. The literal is unsigned so the comparison performed
  // inside EXPECT_GE does not mix signed and unsigned operands (assumes
  // features.size() returns an unsigned type, as standard containers do).
  EXPECT_GE(features.size(), 0U);
}

0 comments on commit 18ae9b6

Please sign in to comment.