151 lines
4.3 KiB
C++
151 lines
4.3 KiB
C++
/*******************************************************************************
 * Copyright (c) 2015-2018 Skymind, Inc.
 *
 * This program and the accompanying materials are made available under the
 * terms of the Apache License, Version 2.0 which is available at
 * https://www.apache.org/licenses/LICENSE-2.0.
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
 * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
 * License for the specific language governing permissions and limitations
 * under the License.
 *
 * SPDX-License-Identifier: Apache-2.0
 ******************************************************************************/
|
|
|
|
//
// Created by raver119 on 30.06.18.
//
|
|
|
|
#include "testlayers.h"
|
|
#include <NDArray.h>
|
|
#include <OmpLaunchHelper.h>
|
|
|
|
|
|
using namespace nd4j;
|
|
using namespace nd4j::graph;
|
|
|
|
class OmpLaunchHelperTests : public testing::Test {
|
|
private:
|
|
int ewt = 0;
|
|
public:
|
|
OmpLaunchHelperTests() {
|
|
this->ewt = Environment::getInstance()->elementwiseThreshold();
|
|
Environment::getInstance()->setElementwiseThreshold(1000);
|
|
};
|
|
|
|
~OmpLaunchHelperTests() {
|
|
Environment::getInstance()->setElementwiseThreshold(this->ewt);
|
|
}
|
|
};
|
|
|
|
// betterSpan(1000, 4) is expected to yield 250.
TEST_F(OmpLaunchHelperTests, Test_BetterSpan_1) {
    ASSERT_EQ(250, OmpLaunchHelper::betterSpan(1000, 4));
}
|
|
|
|
// betterSpan(1001, 4) is expected to yield 251.
TEST_F(OmpLaunchHelperTests, Test_BetterSpan_2) {
    ASSERT_EQ(251, OmpLaunchHelper::betterSpan(1001, 4));
}
|
|
|
|
// betterSpan(1002, 4) is expected to yield 251.
TEST_F(OmpLaunchHelperTests, Test_BetterSpan_3) {
    ASSERT_EQ(251, OmpLaunchHelper::betterSpan(1002, 4));
}
|
|
|
|
// betterSpan(1003, 4) is expected to yield 251.
TEST_F(OmpLaunchHelperTests, Test_BetterSpan_5) {
    ASSERT_EQ(251, OmpLaunchHelper::betterSpan(1003, 4));
}
|
|
|
|
// betterSpan(1004, 4) is expected to yield 251.
TEST_F(OmpLaunchHelperTests, Test_BetterSpan_6) {
    ASSERT_EQ(251, OmpLaunchHelper::betterSpan(1004, 4));
}
|
|
|
|
|
|
// betterThreads(4000, 6) is expected to yield 4 while the fixture keeps the
// elementwise threshold at 1000.
TEST_F(OmpLaunchHelperTests, Test_BetterThreads_1) {
    ASSERT_EQ(4, OmpLaunchHelper::betterThreads(4000, 6));
}
|
|
|
|
// betterThreads(12000, 6) is expected to yield 6 while the fixture keeps the
// elementwise threshold at 1000.
TEST_F(OmpLaunchHelperTests, Test_BetterThreads_2) {
    ASSERT_EQ(6, OmpLaunchHelper::betterThreads(12000, 6));
}
|
|
|
|
// betterThreads(899, 6) is expected to yield 1 while the fixture keeps the
// elementwise threshold at 1000.
TEST_F(OmpLaunchHelperTests, Test_BetterThreads_3) {
    ASSERT_EQ(1, OmpLaunchHelper::betterThreads(899, 6));
}
|
|
|
|
//////////////////////////////////////////////////////////////////////
|
|
// Splits an N-element buffer between the threads selected by OmpLaunchHelper,
// lets every thread increment its own slice, and then checks both the chosen
// thread count and that each element was incremented exactly once.
TEST_F(OmpLaunchHelperTests, loop_test1) {

    const Nd4jLong N = 20010;
    Nd4jLong desiredNumThreads = 2;
    int x[N] = {0};

    OmpLaunchHelper info(N, desiredNumThreads);

    PRAGMA_OMP_PARALLEL_THREADS(info._numThreads)
    {
        auto threadNum = omp_get_thread_num();
        // start of the slice assigned to this thread
        auto xi = x + info.getThreadOffset(threadNum);

        auto ulen = static_cast<unsigned int>(info.getItersPerThread(threadNum));

        PRAGMA_OMP_SIMD
        for (unsigned int i = 0; i < ulen; i++)
            xi[i] = xi[i] + 1;
    }

#ifdef _OPENMP
    ASSERT_EQ(desiredNumThreads, info._numThreads);
#else
    ASSERT_EQ(1, info._numThreads);
#endif

    // The per-thread slices must tile the whole buffer: an element left at 0
    // was skipped, an element above 1 was covered by more than one slice.
    Nd4jLong wrongElements = 0;
    for (Nd4jLong i = 0; i < N; i++) {
        if (x[i] != 1)
            ++wrongElements;
    }
    ASSERT_EQ(0, wrongElements);
}
|
|
|
|
// 16 TADs of length 16 are expected to be handled by a single thread.
TEST_F(OmpLaunchHelperTests, test_tad_threads_1) {
    const Nd4jLong tadLength = 16;
    const Nd4jLong numTads = 16;

    // Debug aid, kept disabled:
    // nd4j_printf("TT: [%i]; ET: [%i];\n", Environment::getInstance()->tadThreshold(), Environment::getInstance()->elementwiseThreshold());
    const auto threads = OmpLaunchHelper::tadThreads(tadLength, numTads);
    ASSERT_EQ(1, threads);
}
|
|
|
|
// Two TADs whose length equals the elementwise threshold are expected to get
// two threads. The check only runs when more than one thread is available.
TEST_F(OmpLaunchHelperTests, test_tad_threads_2) {
    if (omp_get_max_threads() > 1) {
        const Nd4jLong tadLength = Environment::getInstance()->elementwiseThreshold();
        const Nd4jLong numTads = 2;

        const auto threads = OmpLaunchHelper::tadThreads(tadLength, numTads);
        ASSERT_EQ(2, threads);
    }
}
|
|
|
|
// 2 TADs of length 128 are expected to be handled by a single thread.
TEST_F(OmpLaunchHelperTests, test_tad_threads_3) {
    const Nd4jLong tadLength = 128;
    const Nd4jLong numTads = 2;

    const auto threads = OmpLaunchHelper::tadThreads(tadLength, numTads);
    ASSERT_EQ(1, threads);
}
|
|
|
|
// 4 TADs of length 64 are expected to be handled by a single thread.
TEST_F(OmpLaunchHelperTests, test_tad_threads_4) {
    const Nd4jLong tadLength = 64;
    const Nd4jLong numTads = 4;

    const auto threads = OmpLaunchHelper::tadThreads(tadLength, numTads);
    ASSERT_EQ(1, threads);
}
|
|
|
|
// With as many TADs as omp_get_max_threads() reports, each as long as the
// elementwise threshold, tadThreads is expected to return that same count.
TEST_F(OmpLaunchHelperTests, test_tad_threads_5) {
    const auto maxThreads = omp_get_max_threads();

    const Nd4jLong tadLength = Environment::getInstance()->elementwiseThreshold();
    const Nd4jLong numTads = maxThreads;

    const auto threads = OmpLaunchHelper::tadThreads(tadLength, numTads);
    ASSERT_EQ(maxThreads, threads);
}