2019-06-06 14:21:15 +02:00
/*******************************************************************************
* Copyright ( c ) 2015 - 2018 Skymind , Inc .
*
* This program and the accompanying materials are made available under the
* terms of the Apache License , Version 2.0 which is available at
* https : //www.apache.org/licenses/LICENSE-2.0.
*
* Unless required by applicable law or agreed to in writing , software
* distributed under the License is distributed on an " AS IS " BASIS , WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND , either express or implied . See the
* License for the specific language governing permissions and limitations
* under the License .
*
* SPDX - License - Identifier : Apache - 2.0
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
//
// @author Yurii Shyrma (iuriish@yahoo.com), created on 18.06.2018
//
2020-03-02 10:49:41 +01:00
# include <system/op_boilerplate.h>
2019-06-06 14:21:15 +02:00
# if NOT_EXCLUDED(OP_softmax_cross_entropy_loss_with_logits)
# include <ops/declarable/CustomOperations.h>
2020-03-02 10:49:41 +01:00
namespace sd {
2019-06-06 14:21:15 +02:00
namespace ops {
//////////////////////////////////////////////////////////////////////////
CUSTOM_OP_IMPL ( softmax_cross_entropy_loss_with_logits , 2 , 1 , false , 0 , 0 ) {
auto logits = INPUT_VARIABLE ( 0 ) ;
auto labels = INPUT_VARIABLE ( 1 ) ;
auto output = OUTPUT_VARIABLE ( 0 ) ;
const int classesDim = block . getIArguments ( ) - > size ( ) > 0 ? INT_ARG ( 0 ) : logits - > rankOf ( ) - 1 ;
2019-12-20 20:35:39 +01:00
// input validation
2019-06-06 14:21:15 +02:00
REQUIRE_TRUE ( labels - > isSameShape ( logits ) , 0 , " SOFTMAX_CROSS_ENTROPY_LOSS_WITH_LOGITS OP: labels and logits arrays must have the same shapes, but got %s and %s correspondingly ! " , ShapeUtils : : shapeAsString ( labels ) . c_str ( ) , ShapeUtils : : shapeAsString ( logits ) . c_str ( ) ) ;
REQUIRE_TRUE ( classesDim < logits - > rankOf ( ) , 0 , " SOFTMAX_CROSS_ENTROPY_LOSS_WITH_LOGITS OP: class dimension must be smaller than rank of logits, but got %i and %i correspondingly ! " , classesDim , logits - > rankOf ( ) ) ;
2019-12-20 20:35:39 +01:00
std : : vector < int > dimension = { classesDim } ;
auto maxAlongDim = logits - > reduceAlongDimension ( reduce : : Max , { classesDim } , true ) ;
2019-06-06 14:21:15 +02:00
auto logExp = ( * logits - maxAlongDim ) . transform ( transform : : Exp ) ;
2019-12-20 20:35:39 +01:00
auto logSoftMax = ( logExp / logExp . reduceAlongDimension ( reduce : : Sum , { classesDim } , true ) ) . transform ( transform : : Log ) ;
( - ( * labels ) * logSoftMax ) . reduceAlongDimension ( reduce : : Sum , * output , dimension ) ;
2019-06-06 14:21:15 +02:00
return Status : : OK ( ) ;
}
//////////////////////////////////////////////////////////////////////////
DECLARE_TYPES ( softmax_cross_entropy_loss_with_logits ) {
2019-12-20 20:35:39 +01:00
2020-03-02 10:49:41 +01:00
getOpDescriptor ( ) - > setAllowedInputTypes ( sd : : DataType : : ANY ) - > setAllowedOutputTypes ( { ALL_FLOATS } ) ;
2019-06-06 14:21:15 +02:00
}
//////////////////////////////////////////////////////////////////////////
DECLARE_SHAPE_FN ( softmax_cross_entropy_loss_with_logits ) {
2019-12-20 20:35:39 +01:00
2019-06-06 14:21:15 +02:00
auto logitsShapeInfo = inputShape - > at ( 0 ) ;
auto labelsShapeInfo = inputShape - > at ( 1 ) ;
const int classesDim = block . getIArguments ( ) - > size ( ) > 0 ? INT_ARG ( 0 ) : - 1 ;
std : : vector < int > dimensions = { classesDim } ;
2019-12-20 20:35:39 +01:00
// labels and logits must have the same shapes
2019-06-06 14:21:15 +02:00
REQUIRE_TRUE ( shape : : shapeEquals ( logitsShapeInfo , labelsShapeInfo ) , 0 , " SOFTMAX_CROSS_ENTROPY_LOSS_WITH_LOGITS OP: labels and logits arrays must have the same shapes, but got %s and %s correspondingly! " , ShapeUtils : : shapeAsString ( labelsShapeInfo ) . c_str ( ) , ShapeUtils : : shapeAsString ( logitsShapeInfo ) . c_str ( ) ) ;
auto outType = DataTypeUtils : : pickFloatingType ( ArrayOptions : : dataType ( logitsShapeInfo ) ) ;
auto reducedShapeInfo = ShapeUtils : : evalReduceShapeInfo ( shape : : order ( labelsShapeInfo ) , dimensions , labelsShapeInfo , outType , false , false , block . getWorkspace ( ) ) ;
return SHAPELIST ( reducedShapeInfo ) ;
}
//////////////////////////////////////////////////////////////////////////
CUSTOM_OP_IMPL ( softmax_cross_entropy_loss_with_logits_grad , 2 , 2 , false , 0 , 0 ) {
auto logits = INPUT_VARIABLE ( 0 ) ;
auto labels = INPUT_VARIABLE ( 1 ) ;
auto output = OUTPUT_VARIABLE ( 0 ) ;
auto dLdp = OUTPUT_VARIABLE ( 0 ) ; // dL/dlogits
auto dLdl = OUTPUT_VARIABLE ( 1 ) ; // dL/dlabels
const int classesDim = block . getIArguments ( ) - > size ( ) > 0 ? INT_ARG ( 0 ) : logits - > rankOf ( ) - 1 ;
2019-12-20 20:35:39 +01:00
// input validation
2019-06-06 14:21:15 +02:00
REQUIRE_TRUE ( labels - > isSameShape ( logits ) , 0 , " SOFTMAX_CROSS_ENTROPY_LOSS_WITH_LOGITS_GRAD OP: labels and logits arrays must have the same shapes, but got %s and %s correspondingly ! " , ShapeUtils : : shapeAsString ( labels ) . c_str ( ) , ShapeUtils : : shapeAsString ( logits ) . c_str ( ) ) ;
REQUIRE_TRUE ( classesDim < logits - > rankOf ( ) , 0 , " SOFTMAX_CROSS_ENTROPY_LOSS_WITH_LOGITS_GRAD OP: class dimension must be smaller than rank of logits, but got %i and %i correspondingly ! " , classesDim , logits - > rankOf ( ) ) ;
2019-12-20 20:35:39 +01:00
std : : vector < int > dimension = { classesDim } ;
NDArray softmax = ( * logits - logits - > reduceAlongDimension ( reduce : : Max , dimension , true ) ) . transform ( transform : : Exp ) ;
softmax / = softmax . reduceAlongDimension ( reduce : : Sum , dimension , true ) ;
2019-06-06 14:21:15 +02:00
// dEdp = softmax * sum_i(labels_i) - labels
2019-12-20 20:35:39 +01:00
dLdp - > assign ( softmax * labels - > reduceAlongDimension ( reduce : : Sum , dimension , true ) - * labels ) ;
// dEdl = -log(softmax)
( - softmax ) . applyTransform ( transform : : Log , * dLdl ) ;
2019-06-06 14:21:15 +02:00
return Status : : OK ( ) ;
}
//////////////////////////////////////////////////////////////////////////
DECLARE_TYPES ( softmax_cross_entropy_loss_with_logits_grad ) {
2019-12-20 20:35:39 +01:00
2020-03-02 10:49:41 +01:00
getOpDescriptor ( ) - > setAllowedInputTypes ( sd : : DataType : : ANY ) - > setAllowedOutputTypes ( { ALL_FLOATS } ) ;
2019-06-06 14:21:15 +02:00
}
//////////////////////////////////////////////////////////////////////////
DECLARE_SHAPE_FN ( softmax_cross_entropy_loss_with_logits_grad ) {
2019-12-20 20:35:39 +01:00
auto logitsShapeInfo = inputShape - > at ( 0 ) ;
2019-06-06 14:21:15 +02:00
auto labelsShapeInfo = inputShape - > at ( 1 ) ;
2019-12-20 20:35:39 +01:00
// labels and logits must have the same shapes
2019-06-06 14:21:15 +02:00
REQUIRE_TRUE ( shape : : shapeEquals ( logitsShapeInfo , labelsShapeInfo ) , 0 , " SOFTMAX_CROSS_ENTROPY_LOSS_WITH_LOGITS_GRAD OP: labels and logits arrays must have the same shapes, but got %s and %s correspondingly! " , ShapeUtils : : shapeAsString ( labelsShapeInfo ) . c_str ( ) , ShapeUtils : : shapeAsString ( logitsShapeInfo ) . c_str ( ) ) ;
2019-12-20 20:35:39 +01:00
DataType outType = DataTypeUtils : : pickFloatingType ( ArrayOptions : : dataType ( logitsShapeInfo ) ) ;
2019-06-06 14:21:15 +02:00
auto dLdpShapeInfo = ConstantShapeHelper : : getInstance ( ) - > createShapeInfo ( ShapeDescriptor ( outType , shape : : order ( logitsShapeInfo ) , shape : : shapeOf ( logitsShapeInfo ) , shape : : rank ( logitsShapeInfo ) ) ) ;
auto dLdlShapeInfo = ConstantShapeHelper : : getInstance ( ) - > createShapeInfo ( ShapeDescriptor ( outType , shape : : order ( labelsShapeInfo ) , shape : : shapeOf ( labelsShapeInfo ) , shape : : rank ( labelsShapeInfo ) ) ) ;
2019-12-20 20:35:39 +01:00
2019-06-06 14:21:15 +02:00
return SHAPELIST ( dLdpShapeInfo , dLdlShapeInfo ) ;
}
}
}
# endif