AdvancedClimateSystems · Swopper050 · Nov 29, 2023 · Nov 29, 2023 · Nov 30, 2023 · Dec 1, 2023
diff --git a/ops/opset13/batch_normalization.go b/ops/opset13/batch_normalization.go
@@ -0,0 +1,230 @@
+package opset13
+
+import (
+	"github.com/advancedclimatesystems/gonnx/onnx"
+	"github.com/advancedclimatesystems/gonnx/ops"
+	"gorgonia.org/tensor"
+)
+
+const (
+	MinBatchNormalizationInputs       = 5
+	MaxBatchNormalizationInputs       = 5
+	BatchNormalizationDefaultEpsilon  = 1e-5
+	BatchNormalizationDefaultMomentum = 0.9
+)
+
+// BatchNormalization represents the ONNX batchNormalization operator.
+type BatchNormalization struct {
+	epsilon  float32
+	momentum float32
+	testMode bool
+}
+
+// newBatchNormalization creates a new batchNormalization operator.
+func newBatchNormalization() ops.Operator {
+	return &BatchNormalization{
+		epsilon:  BatchNormalizationDefaultEpsilon,
+		momentum: BatchNormalizationDefaultMomentum,
+	}
+}
+
+// Init initializes the batchNormalization operator.
+func (b *BatchNormalization) Init(n *onnx.NodeProto) error {
+	hasMomentum := false
+
+	for _, attr := range n.GetAttribute() {
+		switch attr.GetName() {
+		case "epsilon":
+			b.epsilon = attr.GetF()
+		case "momentum":
+			hasMomentum = true
+			b.momentum = attr.GetF()
+		default:
+			return ops.ErrInvalidAttribute(attr.GetName(), b)
+		}
+	}
+
+	if !hasMomentum {
+		b.testMode = true
+	}
+
+	return nil
+}
+
+// Apply applies the batchNormalization operator.
+func (b *BatchNormalization) Apply(inputs []tensor.Tensor) ([]tensor.Tensor, error) {
+	X := inputs[0]
+	scale := inputs[1]
+	B := inputs[2]
+	mean := inputs[3]
+	variance := inputs[4]
+
+	// We only support test mode, as this is by far the most common for inference models.
+	if !b.testMode {
+		return nil, ops.ErrUnsupportedAttribute("momentum", b)
+	}
+
+	out, err := b.testModeCalculation(X, scale, B, mean, variance)
+	if err != nil {
+		return nil, err
+	}
+
+	return []tensor.Tensor{out}, nil
+}
+
+// ValidateInputs validates the inputs that will be given to Apply for this operator.
+func (b *BatchNormalization) ValidateInputs(inputs []tensor.Tensor) ([]tensor.Tensor, error) {
+	return ops.ValidateInputs(b, inputs)
+}
+
+// GetMinInputs returns the minimum number of input tensors this operator expects.
+func (b *BatchNormalization) GetMinInputs() int {
+	return MinBatchNormalizationInputs
+}
+
+// GetMaxInputs returns the maximum number of input tensors this operator expects.
+func (b *BatchNormalization) GetMaxInputs() int {
+	return MaxBatchNormalizationInputs
+}
+
+// GetInputTypeConstraints returns a list. Every element represents a set of allowed tensor dtypes
+// for the corresponding input tensor.
+func (b *BatchNormalization) GetInputTypeConstraints() [][]tensor.Dtype {
+	return [][]tensor.Dtype{
+		{tensor.Float32, tensor.Float64},
+		{tensor.Float32, tensor.Float64},
+		{tensor.Float32, tensor.Float64},
+		{tensor.Float32, tensor.Float64},
+		{tensor.Float32, tensor.Float64},
+	}
+}
+
+// String implements the stringer interface, and can be used to format errors or messages.
+func (b *BatchNormalization) String() string {
+	return "batchNormalization operator"
+}
+
+func (b *BatchNormalization) reshapeTensors(X, scale, bias, mean, variance tensor.Tensor) (newScale, newBias, newMean, newVariance tensor.Tensor, err error) {
+	nNonSpatialDims := 2
+
+	nSpatialDims := len(X.Shape()) - nNonSpatialDims
+	if nSpatialDims <= 0 {
+		return scale, bias, mean, variance, nil
+	}
+
+	// The new shape for the `scale`, `bias`, `mean` and `variance` tensors should
+	// be (C, 1, 1, ...), such that they can be broadcasted to match the shape of `X`.
+	newShape := make([]int, 1+nSpatialDims)
+
+	// Here we set the channel dimension. The channel dimension is the same
+	// for all `X`, `scale`, `bias`, `mean` and `variance` tensors.
+	newShape[0] = scale.Shape()[0]
+
+	// Set all the remaining dimensions to 1 to allow for broadcasting.
+	for i := 1; i < len(newShape); i++ {
+		newShape[i] = 1
+	}
+
+	// Now we create new tensors for all the input tensors (except `X`) and reshape
+	// them.
+	newScale, ok := scale.Clone().(tensor.Tensor)
+	if !ok {
+		return nil, nil, nil, nil, ops.ErrTypeAssert("tensor.Tensor", scale.Clone())
+	}
+
+	newBias, ok = bias.Clone().(tensor.Tensor)
+	if !ok {
+		return nil, nil, nil, nil, ops.ErrTypeAssert("tensor.Tensor", bias.Clone())
+	}
+
+	newMean, ok = mean.Clone().(tensor.Tensor)
+	if !ok {
+		return nil, nil, nil, nil, ops.ErrTypeAssert("tensor.Tensor", mean.Clone())
+	}
+
+	newVariance, ok = variance.Clone().(tensor.Tensor)
+	if !ok {
+		return nil, nil, nil, nil, ops.ErrTypeAssert("tensor.Tensor", variance.Clone())
+	}
+
+	err = newScale.Reshape(newShape...)
+	if err != nil {
+		return nil, nil, nil, nil, err
+	}
+
+	err = newBias.Reshape(newShape...)
+	if err != nil {
+		return nil, nil, nil, nil, err
+	}
+
+	err = newMean.Reshape(newShape...)
+	if err != nil {
+		return nil, nil, nil, nil, err
+	}
+
+	err = newVariance.Reshape(newShape...)
+	if err != nil {
+		return nil, nil, nil, nil, err
+	}
+
+	return
+}
+
+func (b *BatchNormalization) testModeCalculation(X, scale, bias, mean, variance tensor.Tensor) (tensor.Tensor, error) {
+	newScale, newBias, newMean, newVariance, err := b.reshapeTensors(X, scale, bias, mean, variance)
+	if err != nil {
+		return nil, err
+	}
+
+	numerator, err := ops.ApplyBinaryOperation(
+		X,
+		newMean,
+		ops.Sub,
+		ops.UnidirectionalBroadcasting,
+	)
+	if err != nil {
+		return nil, err
+	}
+
+	numerator, err = ops.ApplyBinaryOperation(
+		numerator[0],
+		newScale,
+		ops.Mul,
+		ops.UnidirectionalBroadcasting,
+	)
+	if err != nil {
+		return nil, err
+	}
+
+	denominator, err := tensor.Add(newVariance, b.epsilon)
+	if err != nil {
+		return nil, err
+	}
+
+	denominator, err = tensor.Sqrt(denominator)
+	if err != nil {
+		return nil, err
+	}
+
+	outputs, err := ops.ApplyBinaryOperation(
+		numerator[0],
+		denominator,
+		ops.Div,
+		ops.UnidirectionalBroadcasting,
+	)
+	if err != nil {
+		return nil, err
+	}
+
+	outputs, err = ops.ApplyBinaryOperation(
+		outputs[0],
+		newBias,
+		ops.Add,
+		ops.UnidirectionalBroadcasting,
+	)
+	if err != nil {
+		return nil, err
+	}
+
+	return outputs[0], nil
+}
diff --git a/ops/opset13/batch_normalization_test.go b/ops/opset13/batch_normalization_test.go
@@ -0,0 +1,146 @@
+package opset13
+
+import (
+	"testing"
+
+	"github.com/advancedclimatesystems/gonnx/onnx"
+	"github.com/advancedclimatesystems/gonnx/ops"
+	"github.com/stretchr/testify/assert"
+	"gorgonia.org/tensor"
+)
+
+func TestBatchNormalizationInit(t *testing.T) {
+	b := &BatchNormalization{}
+
+	err := b.Init(
+		&onnx.NodeProto{
+			Attribute: []*onnx.AttributeProto{
+				{Name: "epsilon", F: 0.001},
+			},
+		},
+	)
+	assert.Nil(t, err)
+
+	assert.Equal(t, float32(0.001), b.epsilon)
+	assert.True(t, b.testMode)
+}
+
+func TestBatchNormalizationInitTrainingMode(t *testing.T) {
+	b := &BatchNormalization{}
+
+	err := b.Init(
+		&onnx.NodeProto{
+			Attribute: []*onnx.AttributeProto{
+				{Name: "epsilon", F: 0.001},
+				{Name: "momentum", F: 0.99},
+			},
+		},
+	)
+	assert.Nil(t, err)
+
+	assert.Equal(t, float32(0.001), b.epsilon)
+	assert.Equal(t, float32(0.99), b.momentum)
+	assert.False(t, b.testMode)
+}
+
+func TestBatchNormalization(t *testing.T) {
+	tests := []struct {
+		batchNormalization *BatchNormalization
+		backings           [][]float32
+		shapes             [][]int
+		expected           []float32
+	}{
+		{
+			&BatchNormalization{
+				epsilon:  1e5,
+				momentum: 0.9,
+				testMode: true,
+			},
+			[][]float32{
+				{0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23},
+				{0.2, 0.3, 0.4},
+				{0.1, -0.1, 0.2},
+				{4, 8, 12},
+				{1, 2, 3},
+			},
+			[][]int{
+				{2, 3, 2, 2},
+				{3},
+				{3},
+				{3},
+				{3},
+			},
+			[]float32{0.097470194, 0.098102644, 0.098735094, 0.09936755, -0.103794694, -0.10284603, -0.10189735, -0.10094868, 0.19494043, 0.19620533, 0.19747022, 0.19873512, 0.10505962, 0.10569207, 0.10632452, 0.10695698, -0.09241061, -0.091461934, -0.09051326, -0.08956459, 0.21011914, 0.21138403, 0.21264893, 0.21391381},
+		},
+	}
+
+	for _, test := range tests {
+		inputs := []tensor.Tensor{
+			ops.TensorWithBackingFixture(test.backings[0], test.shapes[0]...),
+			ops.TensorWithBackingFixture(test.backings[1], test.shapes[1]...),
+			ops.TensorWithBackingFixture(test.backings[2], test.shapes[2]...),
+			ops.TensorWithBackingFixture(test.backings[3], test.shapes[3]...),
+			ops.TensorWithBackingFixture(test.backings[4], test.shapes[4]...),
+		}
+
+		res, err := test.batchNormalization.Apply(inputs)
+		assert.Nil(t, err)
+
+		assert.Equal(t, test.expected, res[0].Data())
+	}
+}
+
+func TestInputValidationBatchNormalization(t *testing.T) {
+	tests := []struct {
+		inputs []tensor.Tensor
+		err    error
+	}{
+		{
+			[]tensor.Tensor{
+				ops.TensorWithBackingFixture([]float32{1, 2}, 2),
+				ops.TensorWithBackingFixture([]float32{3, 4}, 2),
+				ops.TensorWithBackingFixture([]float32{3, 4}, 2),
+				ops.TensorWithBackingFixture([]float32{3, 4}, 2),
+				ops.TensorWithBackingFixture([]float32{3, 4}, 2),
+			},
+			nil,
+		},
+		{
+			[]tensor.Tensor{
+				ops.TensorWithBackingFixture([]float64{1, 2}, 2),
+				ops.TensorWithBackingFixture([]float64{3, 4}, 2),
+				ops.TensorWithBackingFixture([]float64{3, 4}, 2),
+				ops.TensorWithBackingFixture([]float64{3, 4}, 2),
+				ops.TensorWithBackingFixture([]float64{3, 4}, 2),
+			},
+			nil,
+		},
+		{
+			[]tensor.Tensor{
+				ops.TensorWithBackingFixture([]int{1, 2}, 2),
+			},
+			ops.ErrInvalidInputCount(1, &BatchNormalization{}),
+		},
+		{
+			[]tensor.Tensor{
+				ops.TensorWithBackingFixture([]float32{1, 2}, 2),
+				ops.TensorWithBackingFixture([]int{3, 4}, 2),
+				ops.TensorWithBackingFixture([]float32{1, 2}, 2),
+				ops.TensorWithBackingFixture([]float32{1, 2}, 2),
+				ops.TensorWithBackingFixture([]float32{1, 2}, 2),
+			},
+			ops.ErrInvalidInputType(1, "int", &BatchNormalization{}),
+		},
+	}
+
+	for _, test := range tests {
+		batchNormalization := &BatchNormalization{}
+		validated, err := batchNormalization.ValidateInputs(test.inputs)
+
+		assert.Equal(t, test.err, err)
+
+		if test.err == nil {
+			assert.Equal(t, test.inputs, validated)
+		}
+	}
+}