/* ****************************************************************************** * * * This program and the accompanying materials are made available under the * terms of the Apache License, Version 2.0 which is available at * https://www.apache.org/licenses/LICENSE-2.0. * * See the NOTICE file distributed with this work for additional * information regarding copyright ownership. * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the * License for the specific language governing permissions and limitations * under the License. * * SPDX-License-Identifier: Apache-2.0 ******************************************************************************/ // // @author GS // #include #include #include namespace sd { namespace ops { namespace helpers { template static void reluDerivative__(NDArray* theFirst, NDArray* theSecond) { auto functor = LAMBDA_TT(x, y){ return x > (T) 0.f ? y : T(0.f); }; theFirst->applyPairwiseLambda(*theSecond, functor, *theFirst); } void reluDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), reluDerivative__, (theFirst, theSecond), FLOAT_TYPES); } template static void reluDerivative_(NDArray* input, NDArray* epsilon, NDArray* output) { T zero = (T) 0.f; auto functor = LAMBDA_TT(x, y, zero){ return x > zero ? y : zero; }; input->applyPairwiseLambda(*epsilon, functor, *output); /* auto x = input->bufferAsT(); auto y = epsilon->bufferAsT(); auto z = output->bufferAsT(); int length = input->lengthOf(); T zero = (T) 0.f; PRAGMA_OMP_PARALLEL_FOR for (int e = 0; e < length; e++) { z[e] = x[e] > zero ? y[e] : zero; } */ } void reluDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), reluDerivative_, (theFirst, theSecond, theOutput), FLOAT_TYPES); } template static void relu6Derivative_(NDArray* input, NDArray* epsilon, NDArray* output) { auto functor = LAMBDA_TT(x, y){ return x > (T)0.f && x < (T)6.f? y : T(0.f); }; input->applyPairwiseLambda(*epsilon, functor, *output); } void relu6Derivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), relu6Derivative_, (theFirst, theSecond, theOutput), FLOAT_TYPES); } template static void leakyReluDerivative_(NDArray* input, NDArray* epsilon, NDArray* output, const float alpha) { const T alphaT = static_cast(alpha); auto functor = LAMBDA_TT(x, y, alphaT) { return x < 0 ? alphaT * y : y; }; input->applyPairwiseLambda(*epsilon, functor, *output); } void leakyReluDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput, const float alpha) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), leakyReluDerivative_, (theFirst, theSecond, theOutput, alpha), FLOAT_TYPES); } template static void eluDerivative_(NDArray* input, NDArray* epsilon, NDArray* output, const float alpha) { const T alphaT = static_cast(alpha); auto functor = LAMBDA_TT(x, y, alphaT){ return y * sd::math::nd4j_eluderivative(x, alphaT); }; input->applyPairwiseLambda(*epsilon, functor, *output); } void eluDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput, const float alpha) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), eluDerivative_, (theFirst, theSecond, theOutput, alpha), FLOAT_TYPES); } template static void seluDerivative_(NDArray* input, NDArray* epsilon, NDArray* output) { auto functor = LAMBDA_TT(x, y){ return y * simdOps::SELUDerivative::op(x, nullptr); }; input->applyPairwiseLambda(*epsilon, functor, *output); } void seluDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), seluDerivative_, (theFirst, theSecond, theOutput), FLOAT_TYPES); } template static void cubeDerivative_(NDArray* input, NDArray* epsilon, NDArray* output) { auto functor = LAMBDA_TT(x, y){ return y * (3 * x * x); }; input->applyPairwiseLambda(*epsilon, functor, *output); } void cubeDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), cubeDerivative_, (theFirst, theSecond, theOutput), FLOAT_TYPES); } //return (x >= X(0.f) ? y: -y); template static void reduceNorm1_(NDArray* input, NDArray* epsilon, NDArray* output) { auto functor = LAMBDA_TT(x, y){ return x > T(0.f)? y : -y; }; input->applyPairwiseLambda(*epsilon, functor, *output); } void reduceNorm1(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), reduceNorm1_, (theFirst, theSecond, theOutput), FLOAT_TYPES); } //////////////////////////////////////////////////////////////////////// template static void sigmCrossEntropy_(NDArray* logits, NDArray* labels, NDArray* output) { auto functor = LAMBDA_TT(x, y){ return sd::math::nd4j_max(x, (T)0.f) - x * y + sd::math::nd4j_log((T)1.f + sd::math::nd4j_exp(-sd::math::nd4j_abs(x))); }; logits->applyPairwiseLambda(*labels, functor, *output); } void sigmCrossEntropy(sd::LaunchContext * context, NDArray* logits, NDArray* labels, NDArray* output) { BUILD_SINGLE_SELECTOR(logits->dataType(), sigmCrossEntropy_, (logits, labels, output), FLOAT_TYPES); } //////////////////////////////////////////////////////////////////////// template static void sigmCrossEntropyGrad_(NDArray* logits, NDArray* labels, NDArray* output) { // 1 - labels - 1 / (1 + exp(logits)) auto functor = LAMBDA_TT(x, y) { if(x <= 0) return static_cast(1.) - y - static_cast(1.) / (static_cast(1.) + sd::math::nd4j_exp(x)); auto e = sd::math::nd4j_exp(-x); return static_cast(1.) - y - e / (static_cast(1.) + e); }; logits->applyPairwiseLambda(*labels, functor, *output); } void sigmCrossEntropyGrad(sd::LaunchContext * context, NDArray* logits, NDArray* labels, NDArray* output) { BUILD_SINGLE_SELECTOR(logits->dataType(), sigmCrossEntropyGrad_, (logits, labels, output), FLOAT_TYPES); } //////////////////////////////////////////////////////////////////////// template static void tanhDerivative_(NDArray* input, NDArray* epsilon, NDArray* output) { auto functor = LAMBDA_TT(x, y){ T th = sd::math::nd4j_tanh(x); return y * ((T)1.0f - (th * th)); }; input->applyPairwiseLambda(*epsilon, functor, *output); } void tanhDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), tanhDerivative_, (theFirst, theSecond, theOutput), FLOAT_TYPES); } // return static_cast(d2) * simdOps::HardTanhDerivative::op(d1, nullptr); template static void hardTanhDerivative_(NDArray* input, NDArray* epsilon, NDArray* output) { auto functor = LAMBDA_TT(x, y){ T th = sd::math::nd4j_tanh(x); return y * simdOps::HardTanhDerivative::op(x, nullptr); }; input->applyPairwiseLambda(*epsilon, functor, *output); } void hardTanhDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), hardTanhDerivative_, (theFirst, theSecond, theOutput), FLOAT_TYPES); } template static void rationalTanhDerivative_(NDArray* input, NDArray* epsilon, NDArray* output) { auto functor = LAMBDA_TT(x, y){ return y * simdOps::RationalTanhDerivative::op(x, nullptr); }; input->applyPairwiseLambda(*epsilon, functor, *output); } void rationalTanhDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), rationalTanhDerivative_, (theFirst, theSecond, theOutput), FLOAT_TYPES); } template static void rectifiedTanhDerivative_(NDArray* input, NDArray* epsilon, NDArray* output) { auto functor = LAMBDA_TT(x, y){ return x > (T) 0.0f ? y * (sd::math::nd4j_tanhderivative(x)) : (T) 0.0f; }; input->applyPairwiseLambda(*epsilon, functor, *output); } void rectifiedTanhDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), rectifiedTanhDerivative_, (theFirst, theSecond, theOutput), FLOAT_TYPES); } // X f = (X) 1.0f + sd::math::nd4j_abs(d1); // return (X) d2 * ((X) 1.0f / (f * f)); template static void softSignDerivative_(NDArray* input, NDArray* epsilon, NDArray* output) { auto functor = LAMBDA_TT(x, y){ T ss = (T)1.f + sd::math::nd4j_abs(x); return y * ((T) 1.0f / (ss * ss)); }; input->applyPairwiseLambda(*epsilon, functor, *output); } void softSignDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), softSignDerivative_, (theFirst, theSecond, theOutput), FLOAT_TYPES); } template static void softPlusDerivative_(NDArray* input, NDArray* epsilon, NDArray* output) { auto functor = LAMBDA_TT(x, y){ T p = sd::math::nd4j_pow(static_cast(M_E), x); return y * (p / (p + 1.)); }; input->applyPairwiseLambda(*epsilon, functor, *output); } void softPlusDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), softPlusDerivative_, (theFirst, theSecond, theOutput), FLOAT_TYPES); } /// /// \param theFirst /// \param theSecond /// \param theOutput template static void sigmoidDerivative_(NDArray* input, NDArray* epsilon, NDArray* output) { auto functor = LAMBDA_TT(x, y){ T s = sd::math::nd4j_sigmoid(x); return y * (s * ((T) 1.0f - s)); }; input->applyPairwiseLambda(*epsilon, functor, *output); } void sigmoidDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), sigmoidDerivative_, (theFirst, theSecond, theOutput), FLOAT_TYPES); } template static void hardSigmoidDerivative_(NDArray* input, NDArray* epsilon, NDArray* output) { auto functor = LAMBDA_TT(x, y){ return y * simdOps::HardSigmoidDerivative::op(x, nullptr); }; input->applyPairwiseLambda(*epsilon, functor, *output); } void hardSigmoidDerivative(sd::LaunchContext * context, NDArray* theFirst, NDArray* theSecond, NDArray* theOutput) { BUILD_SINGLE_SELECTOR(theFirst->dataType(), hardSigmoidDerivative_, (theFirst, theSecond, theOutput), FLOAT_TYPES); } template static void logSumExp_(NDArray* input, NDArray* axis, NDArray* output) { // reduce along axis with NDArray tempInput = input->dup(); input->applyTransform(transform::Exp, tempInput); std::vector axisVector; if (axis != nullptr) { axisVector.resize(axis->lengthOf()); for (size_t i = 0; i < axisVector.size(); ++i) axisVector[i] = axis->e(i); } tempInput.reduceAlongDimension(reduce::Sum, *output, axisVector); output->applyTransform(transform::Log, *output); } template static void logSumExp_(NDArray* input, NDArray* subtrah, NDArray* axis, NDArray* output) { // reduce along axis with NDArray tempInput = input->dup(); input->applyPairwiseTransform(pairwise::Subtract, *subtrah, tempInput); tempInput.applyTransform(transform::Exp, tempInput); std::vector axisVector; if (axis != nullptr) { axisVector.resize(axis->lengthOf()); for (size_t i = 0; i < axisVector.size(); ++i) axisVector[i] = axis->e(i); } tempInput.reduceAlongDimension(reduce::Sum, *output, axisVector); output->applyTransform(transform::Log, *output); } void logSumExp(sd::LaunchContext * context, NDArray* input, NDArray* axis, NDArray* output) { BUILD_SINGLE_SELECTOR(input->dataType(), logSumExp_, (input, axis, output), FLOAT_TYPES); } void logSumExp(sd::LaunchContext * context, NDArray* input, NDArray* subtrah, NDArray* axis, NDArray* output) { BUILD_SINGLE_SELECTOR(input->dataType(), logSumExp_, (input, subtrah, axis, output), FLOAT_TYPES); } ////////////////////////////////////////////////////////////////////////// template static void weightedCrossEntropyWithLogitsFunctor_(NDArray const* targets, NDArray const* input, NDArray const* weights, NDArray* output) { T posWeight = weights->e(0); auto mainRoutineT1 = LAMBDA_TT(_x, _z, posWeight) { T targetWeight = (1. + (posWeight - (T)1.f) * _z); return (1. - _z) * _x + targetWeight * (sd::math::nd4j_log((T)1.f + sd::math::nd4j_exp(-sd::math::nd4j_abs(_x))) + sd::math::nd4j_max(-_x, T(0.f)) ); }; auto mainRoutineT2 = LAMBDA_TTT(_x, _z, _w) { return (((T)1.0 - _z) * _x) + _w * (sd::math::nd4j_log(T(1.) + sd::math::nd4j_exp(-sd::math::nd4j_abs(_x))) + sd::math::nd4j_max(-_x, T(0.f))); }; if (weights->isScalar()) { const_cast(input)->applyPairwiseLambda(const_cast(*targets), mainRoutineT1, *output); } else { std::unique_ptr targetVector(new NDArray(*weights)); targetVector->applyScalar(scalar::Add, -1.f, *targetVector); std::unique_ptr targetTensor(new NDArray(*targets)); *targetTensor = (*targetVector * *targetTensor) + T(1.f); const_cast(input)->applyTriplewiseLambda(const_cast(*targets), *targetTensor.get(), mainRoutineT2, *output); } } void weightedCrossEntropyWithLogitsFunctor(sd::LaunchContext * context, NDArray const* targets, NDArray const* input, NDArray const* weights, NDArray* output) { BUILD_SINGLE_SELECTOR(targets->dataType(), weightedCrossEntropyWithLogitsFunctor_, (targets, input, weights, output), FLOAT_TYPES); } } } }