Skip to content

Commit 40927bb

Browse files
author
Valeriy Fedyunin
authoredDec 21, 2021
Add CL1LossLayer (#511)
* Add CL1LossLayer Signed-off-by: Valeriy Fedyunin <[email protected]> * Register L1Loss in Python wrapper Signed-off-by: Valeriy Fedyunin <[email protected]>
1 parent a6f5dc7 commit 40927bb

File tree

17 files changed

+273
-2
lines changed

17 files changed

+273
-2
lines changed
 

‎NeoML/Python/neoml/Dnn/Loss.py

+44
Original file line numberDiff line numberDiff line change
@@ -266,6 +266,50 @@ def __init__(self, input_layers, loss_weight=1.0, name=None):
266266
# ----------------------------------------------------------------------------------------------------------------------
267267

268268

269+
class L1Loss(Loss):
    """The layer that computes a loss equal to the L1 distance between
    the network response and the correct objects.

    :param input_layers: The input layers to be connected.
        The integer in each tuple specifies the number of the output.
        If not set, the first output will be used.
    :type input_layers: list of object, tuple(object, int)
    :param loss_weight: The multiplier for the loss function value during training.
    :type loss_weight: float, default=1.0
    :param name: The layer name.
    :type name: str, default=None

    .. rubric:: Layer inputs:

    (1) the network response for which you are calculating the loss.

    (2) the correct objects.

    (3) (optional): the objects' weights.

    The dimensions of all inputs are the same:

    - **BatchLength** * **BatchWidth** * **ListSize** - the number of objects
    - **Height** * **Width** * **Depth** * **Channels** - the object size

    .. rubric:: Layer outputs:

    The layer has no output.
    """
    def __init__(self, input_layers, loss_weight=1.0, name=None):
        if type(input_layers) is PythonWrapper.L1Loss:
            # Re-wrap an already-created internal layer (e.g. when a net is loaded).
            internal = input_layers
        else:
            layers, outputs = check_input_layers(input_layers, (2, 3))
            internal = PythonWrapper.L1Loss(str(name), layers, outputs, float(loss_weight))
        super().__init__(internal)
309+
310+
# ----------------------------------------------------------------------------------------------------------------------
311+
312+
269313
class HingeLoss(Loss):
270314
"""The layer that calculates hinge loss function for binary classification:
271315
:math:`f(x) = \max(0, 1 - x * y)`, where

‎NeoML/Python/neoml/Dnn/__init__.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,7 @@
2626
from .ImageConversion import ImageResize, PixelToImage, ImageToPixel
2727
from .IndRnn import IndRnn
2828
from .Irnn import Irnn
29-
from .Loss import CrossEntropyLoss, BinaryCrossEntropyLoss, EuclideanLoss, HingeLoss, SquaredHingeLoss, FocalLoss, BinaryFocalLoss, CenterLoss, MultiHingeLoss, MultiSquaredHingeLoss, CustomLoss, CustomLossCalculatorBase, call_loss_calculator
29+
from .Loss import CrossEntropyLoss, BinaryCrossEntropyLoss, EuclideanLoss, L1Loss, HingeLoss, SquaredHingeLoss, FocalLoss, BinaryFocalLoss, CenterLoss, MultiHingeLoss, MultiSquaredHingeLoss, CustomLoss, CustomLossCalculatorBase, call_loss_calculator
3030
from .Lrn import Lrn
3131
from .Lstm import Lstm
3232
from .MatrixMultiplication import MatrixMultiplication

‎NeoML/Python/src/PyDnn.cpp

+1
Original file line numberDiff line numberDiff line change
@@ -100,6 +100,7 @@ REGISTER_NEOML_PYLAYER( "FullyConnectedSource", "FmlCnnFullyConnectedSourceLayer
100100
REGISTER_NEOML_PYLAYER_EX( "Loss", "CrossEntropyLoss", "FmlCnnCrossEntropyLossLayer" )
101101
REGISTER_NEOML_PYLAYER_EX( "Loss", "BinaryCrossEntropyLoss", "FmlCnnBinaryCrossEntropyLossLayer" )
102102
REGISTER_NEOML_PYLAYER_EX( "Loss", "EuclideanLoss", "FmlCnnEuclideanLossLayer" )
103+
REGISTER_NEOML_PYLAYER_EX( "Loss", "L1Loss", "NeoMLDnnL1LossLayer" )
103104
REGISTER_NEOML_PYLAYER_EX( "Loss", "HingeLoss", "FmlCnnHingeLossLayer" )
104105
REGISTER_NEOML_PYLAYER_EX( "Loss", "SquaredHingeLoss", "FmlCnnSquaredHingeLossLayer" )
105106
REGISTER_NEOML_PYLAYER_EX( "Loss", "CustomLoss", "NeoMLCustomLossLayer" )

‎NeoML/Python/src/PyLossLayer.cpp

+43-1
Original file line numberDiff line numberDiff line change
@@ -70,6 +70,21 @@ class CPyEuclideanLossLayer : public CPyLossLayer {
7070

7171
//------------------------------------------------------------------------------------------------------------
7272

73+
class CPyL1LossLayer : public CPyLossLayer {
74+
public:
75+
explicit CPyL1LossLayer( CL1LossLayer& layer, CPyMathEngineOwner& mathEngineOwner ) :
76+
CPyLossLayer( layer, mathEngineOwner ) {}
77+
78+
py::object CreatePythonObject() const
79+
{
80+
py::object pyModule = py::module::import( "neoml.Dnn" );
81+
py::object pyConstructor = pyModule.attr( "L1Loss" );
82+
return pyConstructor( py::cast(this) );
83+
}
84+
};
85+
86+
//------------------------------------------------------------------------------------------------------------
87+
7388
class CPyHingeLossLayer : public CPyLossLayer {
7489
public:
7590
explicit CPyHingeLossLayer( CHingeLossLayer& layer, CPyMathEngineOwner& mathEngineOwner ) :
@@ -288,6 +303,33 @@ void InitializeLossLayer( py::module& m )
288303
}) )
289304
;
290305

306+
//------------------------------------------------------------------------------------------------------------
307+
308+
py::class_<CPyL1LossLayer, CPyLossLayer>(m, "L1Loss")
309+
.def( py::init([]( const CPyLayer& layer )
310+
{
311+
return CPyL1LossLayer( *layer.Layer<CL1LossLayer>(), layer.MathEngineOwner() );
312+
}) )
313+
.def( py::init([]( const std::string& name, const py::list& layers, const py::list& outputs, float lossWeight )
314+
{
315+
py::gil_scoped_release release;
316+
CDnn& dnn = layers[0].cast<CPyLayer>().Dnn();
317+
IMathEngine& mathEngine = dnn.GetMathEngine();
318+
319+
CPtr<CL1LossLayer> loss = new CL1LossLayer( mathEngine );
320+
loss->SetLossWeight( lossWeight );
321+
loss->SetName( FindFreeLayerName( dnn, "L1Loss", name ).c_str() );
322+
dnn.AddLayer( *loss );
323+
loss->Connect( 0, layers[0].cast<CPyLayer>().BaseLayer(), outputs[0].cast<int>() );
324+
loss->Connect( 1, layers[1].cast<CPyLayer>().BaseLayer(), outputs[1].cast<int>() );
325+
if( layers.size() == 3 ) {
326+
loss->Connect( 2, layers[2].cast<CPyLayer>().BaseLayer(), outputs[2].cast<int>() );
327+
}
328+
329+
return CPyL1LossLayer( *loss, layers[0].cast<CPyLayer>().MathEngineOwner() );
330+
}) )
331+
;
332+
291333
//------------------------------------------------------------------------------------------------------------
292334

293335
py::class_<CPyHingeLossLayer, CPyLossLayer>(m, "HingeLoss")
@@ -303,7 +345,7 @@ void InitializeLossLayer( py::module& m )
303345

304346
CPtr<CHingeLossLayer> loss = new CHingeLossLayer( mathEngine );
305347
loss->SetLossWeight( lossWeight );
306-
loss->SetName( FindFreeLayerName( dnn, "EuclideanLoss", name ).c_str() );
348+
loss->SetName( FindFreeLayerName( dnn, "HingeLoss", name ).c_str() );
307349
dnn.AddLayer( *loss );
308350
loss->Connect( 0, layers[0].cast<CPyLayer>().BaseLayer(), outputs[0].cast<int>() );
309351
loss->Connect( 1, layers[1].cast<CPyLayer>().BaseLayer(), outputs[1].cast<int>() );

‎NeoML/Python/tests.py

+3
Original file line numberDiff line numberDiff line change
@@ -2293,6 +2293,9 @@ def test_binary_cross_entropy_loss(self):
22932293
def test_euclidean_loss(self):
22942294
self._test_loss('EuclideanLoss', dict(loss_weight=7.7), last_loss=0.)
22952295

2296+
def test_l1_loss(self):
    # L1Loss fed identical response/label inputs must end with zero loss.
    self._test_loss('L1Loss', dict(loss_weight=7.7), last_loss=0.)
2298+
22962299
def test_hinge_loss(self):
22972300
self._test_loss('HingeLoss', dict(loss_weight=7.7), last_loss=0.)
22982301

Original file line numberDiff line numberDiff line change
@@ -0,0 +1,42 @@
1+
# CL1LossLayer Class
2+
3+
<!-- TOC -->
4+
5+
- [CL1LossLayer Class](#cl1losslayer-class)
6+
- [Settings](#settings)
7+
- [Trainable parameters](#trainable-parameters)
8+
- [Inputs](#inputs)
9+
- [Outputs](#outputs)
10+
- [Getting the value of the loss function](#getting-the-value-of-the-loss-function)
11+
12+
<!-- /TOC -->
13+
14+
This class implements a layer that calculates a loss function equal to the L1 distance between the objects from the network response and the objects of the correct answer.
15+
16+
## Settings
17+
18+
The layer has no settings.
19+
20+
## Trainable parameters
21+
22+
The layer has no trainable parameters.
23+
24+
## Inputs
25+
26+
The layer may have 2 to 3 inputs:
27+
28+
1. The network output for which you are calculating the loss function. It contains `BatchLength * BatchWidth * ListSize` objects, each of `Height * Width * Depth * Channels` size.
29+
2. A blob of the same size as the first input, containing the correct class objects. The loss function will calculate the L1 distance between the first and the second input.
30+
3. *[Optional]* The objects' weights. This blob should have the same `BatchLength`, `BatchWidth`, and `ListSize` as the first input; `Height`, `Width`, `Depth`, and `Channels` should be equal to `1` (this matches the Russian version of this page — confirm against the layer's implementation).
31+
32+
## Outputs
33+
34+
This layer has no output.
35+
36+
### Getting the value of the loss function
37+
38+
```c++
39+
float GetLastLoss() const;
40+
```
41+
42+
Use this method to get the value of the loss function calculated on the network's last run.

‎NeoML/docs/en/API/NN/LossLayers/README.md

+1
Original file line numberDiff line numberDiff line change
@@ -12,5 +12,6 @@
1212
- [CFocalLossLayer](FocalLossLayer.md) - focal loss (modified cross-entropy)
1313
- For regression:
1414
- [CEuclideanLossLayer](EuclideanLossLayer.md) - Euclidean distance
15+
- [CL1LossLayer](L1LossLayer.md) - L1 distance
1516
- Additionally:
1617
- [CCenterLossLayer](CenterLossLayer.md) - the auxiliary *center loss* function that penalizes large variance inside a class

‎NeoML/docs/en/API/NN/README.md

+1
Original file line numberDiff line numberDiff line change
@@ -297,6 +297,7 @@ delete gpuMathEngine;
297297
- [CFocalLossLayer](LossLayers/FocalLossLayer.md) - focal loss function (modified cross-entropy)
298298
- For regression:
299299
- [CEuclideanLossLayer](LossLayers/EuclideanLossLayer.md) - Euclidean distance
300+
- [CL1LossLayer](LossLayers/L1LossLayer.md) - L1 distance
300301
- Additionally:
301302
- [CCenterLossLayer](LossLayers/CenterLossLayer.md) - the auxiliary *center loss* function that penalizes large variance inside a class
302303
- Working with discrete features:
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,42 @@
1+
# Класс CL1LossLayer
2+
3+
<!-- TOC -->
4+
5+
- [Класс CL1LossLayer](#класс-cl1losslayer)
6+
- [Настройки](#настройки)
7+
- [Обучаемые параметры](#обучаемые-параметры)
8+
- [Входы](#входы)
9+
- [Выходы](#выходы)
10+
- [Значение функции потерь](#значение-функции-потерь)
11+
12+
<!-- /TOC -->
13+
14+
Класс реализует слой, вычисляющий функцию потерь, равную L1 расстоянию между объектами из ответа сети и объектами из правильных ответов.
15+
16+
## Настройки
17+
18+
Слой не имеет настроек.
19+
20+
## Обучаемые параметры
21+
22+
Слой не имеет обучаемых параметров.
23+
24+
## Входы
25+
26+
Слой имеет 2 или 3 входа:
27+
28+
1. Ответы сети, на которых необходимо вычислить функцию потерь. Содержит `BatchLength * BatchWidth * ListSize` объектов размера `Height * Width * Depth * Channels`.
29+
2. Правильные ответы в виде блоба того же размера, что и блоб у первого входа. Функция потерь равняется расстояниям между объектами из первого входа и второго.
30+
3. *[Опционально]* Веса объектов. Блоб этого входа должен иметь те же `BatchLength`, `BatchWidth` и `ListSize`, что и у первого входа. `Height`, `Width`, `Depth` и `Channels` должны быть равны `1`.
31+
32+
## Выходы
33+
34+
Слой не имеет выходов.
35+
36+
### Значение функции потерь
37+
38+
```c++
39+
float GetLastLoss() const;
40+
```
41+
42+
Получение значения функции потерь на последнем запуске сети.

‎NeoML/docs/ru/API/NN/LossLayers/README.md

+1
Original file line numberDiff line numberDiff line change
@@ -12,5 +12,6 @@
1212
- [CFocalLossLayer](FocalLossLayer.md) - функция `Focal` (модифицированная кросс-энтропия);
1313
- Регрессия:
1414
- [CEuclideanLossLayer](EuclideanLossLayer.md) - евклидово расстояние;
15+
- [CL1LossLayer](L1LossLayer.md) - L1 расстояние;
1516
- Дополнительно:
1617
- [CCenterLossLayer](CenterLossLayer.md) - вспомогательная функция `Center`, штрафующая дисперсию внутри классов.

‎NeoML/docs/ru/API/NN/README.md

+1
Original file line numberDiff line numberDiff line change
@@ -296,6 +296,7 @@ delete gpuMathEngine;
296296
- [CFocalLossLayer](LossLayers/FocalLossLayer.md) - функция `Focal` (модифицированная кросс-энтропия)
297297
- Регрессия:
298298
- [CEuclideanLossLayer](LossLayers/EuclideanLossLayer.md) - евклидово расстояние
299+
- [CL1LossLayer](LossLayers/L1LossLayer.md) - L1 расстояние
299300
- Дополнительно:
300301
- [CCenterLossLayer](LossLayers/CenterLossLayer.md) - вспомогательная функция `Center`, штрафующая дисперсию внутри классов
301302
- Работа с дискретными признаками:

‎NeoML/include/NeoML/Dnn/Layers/LossLayer.h

+19
Original file line numberDiff line numberDiff line change
@@ -219,6 +219,25 @@ NEOML_API CLayerWrapper<CEuclideanLossLayer> EuclideanLoss( float lossWeight = 1
219219

220220
///////////////////////////////////////////////////////////////////////////////////
221221

222+
// CL1LossLayer implements a layer that estimates the loss value as abs(result - standard)
// The layer has two inputs: #0 - result, #1 - standard
class NEOML_API CL1LossLayer : public CLossLayer {
	NEOML_DNN_LAYER( CL1LossLayer )
public:
	explicit CL1LossLayer( IMathEngine& mathEngine ) : CLossLayer( mathEngine, "CL1LossLayer" ) {}

	// Serializes the layer (version + base CLossLayer state).
	void Serialize( CArchive& archive ) override;

protected:
	// Validates that the labels input is float and matches the result's object size.
	void Reshape() override;
	// Computes per-object L1 loss and, when requested, its gradient w.r.t. the data.
	void BatchCalculateLossAndGradient( int batchSize, CConstFloatHandle data, int vectorSize, CConstFloatHandle label,
		int labelSize, CFloatHandle lossValue, CFloatHandle lossGradient ) override;
};

// Convenience wrapper for building a CL1LossLayer with the given loss weight.
NEOML_API CLayerWrapper<CL1LossLayer> L1Loss( float lossWeight = 1.0f );
238+
239+
///////////////////////////////////////////////////////////////////////////////////
240+
222241
// CHingeLossLayer implements a layer that estimates the loss value as max(0, 1 - result * standard)
223242
// The layer has two inputs: #0 - result, #1 - standard
224243
// The standard contains the data in the format: 1 for objects that belong to the class, -1 for the rest

‎NeoML/src/CMakeLists.txt

+1
Original file line numberDiff line numberDiff line change
@@ -63,6 +63,7 @@ set(NeoML_SOURCES
6363
Dnn/Layers/ImageResizeLayer.cpp
6464
Dnn/Layers/IndRnnLayer.cpp
6565
Dnn/Layers/IrnnLayer.cpp
66+
Dnn/Layers/L1LossLayer.cpp
6667
Dnn/Layers/LrnLayer.cpp
6768
Dnn/Layers/LstmLayer.cpp
6869
Dnn/Layers/MatrixMultiplicationLayer.cpp

‎NeoML/src/Dnn/Dnn.cpp

+1
Original file line numberDiff line numberDiff line change
@@ -340,6 +340,7 @@ REGISTER_NEOML_LAYER( CCastLayer, "NeoMLDnnCastLayer" )
340340
REGISTER_NEOML_LAYER( CDataLayer, "NeoMLDnnDataLayer" )
341341
REGISTER_NEOML_LAYER( CTransformerEncoderLayer, "NeoMLDnnTransformerEncoderLayer" )
342342
REGISTER_NEOML_LAYER( CBertConvLayer, "NeoMLDnnBertConvLayer" )
343+
REGISTER_NEOML_LAYER( CL1LossLayer, "NeoMLDnnL1LossLayer" )
343344

344345
}
345346

‎NeoML/src/Dnn/Layers/L1LossLayer.cpp

+70
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,70 @@
1+
/* Copyright © 2017-2021 ABBYY Production LLC
2+
3+
Licensed under the Apache License, Version 2.0 (the "License");
4+
you may not use this file except in compliance with the License.
5+
You may obtain a copy of the License at
6+
7+
http://www.apache.org/licenses/LICENSE-2.0
8+
9+
Unless required by applicable law or agreed to in writing, software
10+
distributed under the License is distributed on an "AS IS" BASIS,
11+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
See the License for the specific language governing permissions and
13+
limitations under the License.
14+
--------------------------------------------------------------------------------------------------------------*/
15+
16+
#include <common.h>
17+
#pragma hdrstop
18+
19+
#include <NeoML/Dnn/Layers/LossLayer.h>
20+
#include <NeoMathEngine/NeoMathEngine.h>
21+
22+
namespace NeoML {
23+
24+
///////////////////////////////////////////////////////////////////////////////////
25+
// CL1LossLayer
26+
27+
// Validates the input blobs' compatibility on (re)shape.
void CL1LossLayer::Reshape()
{
	CLossLayer::Reshape();
	// L1 distance is only defined on float labels of the same object size as the data.
	CheckArchitecture( inputDescs[1].GetDataType() == CT_Float, GetName(), "labels must be CT_Float" );
	CheckArchitecture( inputDescs[0].ObjectSize() == inputDescs[1].ObjectSize(), GetName(),
		"the labels dimensions should be equal to the first input dimensions" );
}
34+
35+
void CL1LossLayer::BatchCalculateLossAndGradient( int batchSize, CConstFloatHandle data, int vectorSize,
36+
CConstFloatHandle label, int /* labelSize */, CFloatHandle lossValue, CFloatHandle lossGradient )
37+
{
38+
int totalSize = batchSize * vectorSize;
39+
40+
CFloatHandleStackVar temp( MathEngine(), totalSize );
41+
42+
MathEngine().VectorSub( data, label, temp, totalSize );
43+
44+
if( !lossGradient.IsNull() ) {
45+
CFloatHandleStackVar ones( MathEngine(), totalSize );
46+
MathEngine().VectorFill( ones.GetHandle(), 1.f, totalSize );
47+
48+
MathEngine().VectorAbsDiff( temp, ones, lossGradient, totalSize );
49+
}
50+
51+
MathEngine().VectorAbs( temp, temp, totalSize );
52+
MathEngine().SumMatrixColumns( lossValue, temp, batchSize, vectorSize );
53+
}
54+
55+
// Current serialization format version of CL1LossLayer.
static const int L1LossLayerVersion = 0;

// Serializes the layer: its own version followed by the base-class state.
void CL1LossLayer::Serialize( CArchive& archive )
{
	archive.SerializeVersion( L1LossLayerVersion );
	CLossLayer::Serialize( archive );
}
62+
63+
// Builds a CLayerWrapper that creates a CL1LossLayer with the given loss weight.
CLayerWrapper<CL1LossLayer> L1Loss( float lossWeight )
{
	return CLayerWrapper<CL1LossLayer>( "L1Loss", [lossWeight]( CL1LossLayer* result ) {
		result->SetLossWeight( lossWeight );
	} );
}
69+
70+
} // namespace NeoML
Binary file not shown.

‎NeoML/test/src/DnnLayersSerializationTest.cpp

+2
Original file line numberDiff line numberDiff line change
@@ -683,6 +683,7 @@ GTEST_TEST( SerializeToFile, LossLayerSerialization )
683683
serializeToFile<CCrfInternalLossLayer>( "FmlCnnCrfInternalLossLayer" );
684684
serializeToFile<CMultiHingeLossLayer>( "FmlCnnMultyHingeLossLayer" );
685685
serializeToFile<CMultiSquaredHingeLossLayer>( "FmlCnnMultySquaredHingeLossLayer" );
686+
serializeToFile<CL1LossLayer>( "NeoMLDnnL1LossLayer" );
686687
}
687688

688689
#endif
@@ -701,6 +702,7 @@ GTEST_TEST( SerializeFromFile, LossLayerSerialization )
701702
checkSerializeLayer<CLossLayer>( "FmlCnnCrfInternalLossLayer" );
702703
checkSerializeLayer<CLossLayer>( "FmlCnnMultyHingeLossLayer" );
703704
checkSerializeLayer<CLossLayer>( "FmlCnnMultySquaredHingeLossLayer" );
705+
checkSerializeLayer<CLossLayer>( "NeoMLDnnL1LossLayer" );
704706
}
705707

706708
// ====================================================================================================================

0 commit comments

Comments
 (0)
Please sign in to comment.