// cavis/libnd4j/include/ops/declarable/helpers/cpu/adjust_hue.cpp

/*******************************************************************************
* Copyright (c) 2015-2018 Skymind, Inc.
*
* This program and the accompanying materials are made available under the
* terms of the Apache License, Version 2.0 which is available at
* https://www.apache.org/licenses/LICENSE-2.0.
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
* License for the specific language governing permissions and limitations
* under the License.
*
* SPDX-License-Identifier: Apache-2.0
******************************************************************************/
//
// @author raver119@gmail.com
// @author Yurii Shyrma (iuriish@yahoo.com)
//
#include <ops/declarable/helpers/adjust_hue.h>
#include <helpers/ConstantTadHelper.h>
namespace nd4j {
namespace ops {
namespace helpers {
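
//////////////////////////////////////////////////////////////////////////
// Hue adjustment on CPU: each pixel is converted RGB -> HSV, its hue is shifted by
// delta * 360 degrees (with a single wrap back into the [0, 360) range), and the result
// is converted back to RGB. Saturation and value are left unchanged.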
template <typename T>
static void adjustHue_(const NDArray *input, const NDArray* deltaScalarArr, NDArray *output, const int dimC) {

    const T delta  = deltaScalarArr->e<T>(0);
    const int rank = input->rankOf();

    const T* x = input->bufferAsT<T>();
          T* z = output->bufferAsT<T>();
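
    // Fast path: channels sit on the last axis (dimC == rank - 1) and both buffers are
    // contiguous in 'c' order, so every consecutive triplet x[i], x[i+1], x[i+2] is one RGB pixel.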
    if(dimC == rank - 1 && input->ews() == 1 && output->ews() == 1 && input->ordering() == 'c' && output->ordering() == 'c') {

        PRAGMA_OMP_PARALLEL_FOR_SIMD
        for (Nd4jLong i = 0; i < input->lengthOf(); i += 3) {

            T h, s, v;

            rgbToHsv<T>(x[i], x[i+1], x[i+2], h, s, v);

            h += delta * 360;
            if(h > 360)
                h -= 360;
            else if(h < 0)
                h += 360;

            hsvToRgb<T>(h, s, v, z[i], z[i+1], z[i+2]);
        }
    }
    else {

        auto packX = nd4j::ConstantTadHelper::getInstance()->tadForDimensions(input->getShapeInfo(), {dimC});
        auto packZ = nd4j::ConstantTadHelper::getInstance()->tadForDimensions(output->getShapeInfo(), {dimC});

        const Nd4jLong numOfTads   = packX.numberOfTads();
        const Nd4jLong xDimCstride = input->stridesOf()[dimC];
        const Nd4jLong zDimCstride = output->stridesOf()[dimC];
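
        // Generic path: iterate over TADs (tensors along dimension dimC); each TAD is one
        // 3-element RGB vector whose components lie xDimCstride / zDimCstride elements apart in memory.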
        PRAGMA_OMP_PARALLEL_FOR_SIMD
        for(Nd4jLong i = 0; i < numOfTads; ++i) {

            const T* xTad = x + packX.platformOffsets()[i];
                  T* zTad = z + packZ.platformOffsets()[i];

            T h, s, v;

            rgbToHsv<T>(xTad[0], xTad[xDimCstride], xTad[2 * xDimCstride], h, s, v);

            h += delta * 360;
            if(h > 360)
                h -= 360;
            else if(h < 0)
                h += 360;

            hsvToRgb<T>(h, s, v, zTad[0], zTad[zDimCstride], zTad[2 * zDimCstride]);
        }
    }
}
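
// Type-dispatching entry point: BUILD_SINGLE_SELECTOR instantiates and calls adjustHue_<T>
// for the input's data type, covering all LIBND4J_TYPES.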
void adjustHue(nd4j::LaunchContext* context, const NDArray *input, const NDArray* deltaScalarArr, NDArray *output, const int dimC) {
    BUILD_SINGLE_SELECTOR(input->dataType(), adjustHue_, (input, deltaScalarArr, output, dimC), LIBND4J_TYPES);
}
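
// A minimal usage sketch (illustrative only; the NDArrayFactory calls below are assumptions
// about the surrounding libnd4j API, not part of this helper):
//
//     auto rgb   = NDArrayFactory::create<float>('c', {2, 2, 3});   // HWC image, channels last
//     auto delta = NDArrayFactory::create<float>(0.5f);             // hue shift as a fraction of 360 degrees
//     auto out   = NDArrayFactory::create<float>('c', {2, 2, 3});
//     adjustHue(nullptr, &rgb, &delta, &out, 2);                    // dimC = 2 -> channels on the last axis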
/*
template <typename T>
static void adjust_hue_single_(nd4j::LaunchContext * context, NDArray *array, NDArray *output, float delta, bool isNHWC) {
    // we're 100% sure it's 3
    const int numChannels = 3;
    int tuples = array->lengthOf() / numChannels;
    auto bIn = reinterpret_cast<T *>(array->buffer());
    auto bOut = reinterpret_cast<T *>(output->buffer());
    static const int kChannelRange = 6;

    int stridesDim = isNHWC ? 2 : 0;
    if (isNHWC) {
        // for NHWC our rgb values are stored one by one
        PRAGMA_OMP_PARALLEL_FOR_SIMD
        for (int e = 0; e < tuples; e++) {
            auto i = bIn + e * numChannels;
            auto o = bOut + e * numChannels;

            T h, v_min, v_max;
            helpers::rgb_to_hv(i[0], i[1], i[2], &h, &v_min, &v_max);

            h += delta * kChannelRange;
            while (h < (T) 0.)
                h += (T) kChannelRange;

            while (h >= (T) kChannelRange)
                h -= (T) kChannelRange;

            helpers::hv_to_rgb(h, v_min, v_max, o, o + 1, o + 2);
        }
    } else {
        auto tadsChannelsIn  = array->allTensorsAlongDimension({0});
        auto tadsChannelsOut = output->allTensorsAlongDimension( {0});

        auto bufferR = reinterpret_cast<T *>(tadsChannelsIn->at(0)->buffer());
        auto bufferG = reinterpret_cast<T *>(tadsChannelsIn->at(1)->buffer());
        auto bufferB = reinterpret_cast<T *>(tadsChannelsIn->at(2)->buffer());

        auto outputR = reinterpret_cast<T *>(tadsChannelsOut->at(0)->buffer());
        auto outputG = reinterpret_cast<T *>(tadsChannelsOut->at(1)->buffer());
        auto outputB = reinterpret_cast<T *>(tadsChannelsOut->at(2)->buffer());

        PRAGMA_OMP_PARALLEL_FOR_SIMD
        for (int e = 0; e < tuples; e++) {
            auto _ri = bufferR + e;
            auto _gi = bufferG + e;
            auto _bi = bufferB + e;

            auto _ro = outputR + e;
            auto _go = outputG + e;
            auto _bo = outputB + e;

            T h, v_min, v_max;
            helpers::rgb_to_hv(_ri[0], _gi[0], _bi[0], &h, &v_min, &v_max);

            h += delta * kChannelRange;
            while (h < (T) 0)
                h += (T) kChannelRange;

            while (h >= (T) kChannelRange)
                h -= (T) kChannelRange;

            helpers::hv_to_rgb(h, v_min, v_max, _ro, _go, _bo);
        }

        delete tadsChannelsIn;
        delete tadsChannelsOut;
    }
}

void adjust_hue_(nd4j::LaunchContext * context, NDArray *array, NDArray *output, NDArray* delta, bool isNHWC) {
    auto xType = array->dataType();

    float d = delta->e<float>(0);
    if (array->rankOf() == 4) {
        auto tadsIn  = array->allTensorsAlongDimension({0});
        auto tadsOut = output->allTensorsAlongDimension({0});
        int tSize = tadsIn->size();
        // FIXME: template selector should be moved out of loop
        PRAGMA_OMP_PARALLEL_FOR
        for (int e = 0; e < tSize; e++) {
            BUILD_SINGLE_SELECTOR(xType, adjust_hue_single_, (context, tadsIn->at(e), tadsOut->at(e), d, isNHWC);, FLOAT_TYPES);
        }

        delete tadsIn;
        delete tadsOut;
    } else {
        BUILD_SINGLE_SELECTOR(xType, adjust_hue_single_, (context, array, output, d, isNHWC);, FLOAT_TYPES);
    }
}

BUILD_SINGLE_TEMPLATE(template void adjust_hue_single_, (nd4j::LaunchContext * context, NDArray *array, NDArray *output, float delta, bool isNHWC);, FLOAT_TYPES);
*/
}
}
}