Skip to content
This repository was archived by the owner on Apr 24, 2025. It is now read-only.

Commit f04d499

Browse files
Add prelu and normalize ops (#107)
1 parent 0ebb47b commit f04d499

File tree

4 files changed

+73
-2
lines changed

4 files changed

+73
-2
lines changed

include/intel_npu_acceleration_library/nn_factory.h

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -914,6 +914,19 @@ class ModelFactory : public intel_npu_acceleration_library::OVInferenceModel {
914914
return power.get();
915915
}
916916

917+
/**
918+
* @brief Create a new prelu operation
919+
*
920+
* @param x1 operation's input node
921+
* @param slope operation's slope
922+
* @return ov::op::Op*
923+
*/
924+
ov::op::Op* prelu(ov::op::Op* x1, ov::op::Op* slope) {
925+
auto power = std::make_shared<ov::op::v0::PRelu>(x1->output(0), slope->output(0));
926+
operations.push_back(power);
927+
return power.get();
928+
}
929+
917930
/**
918931
* @brief Create a new log softmax operation
919932
*

intel_npu_acceleration_library/backend/ops.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -57,6 +57,7 @@ def get_supported_ops() -> List[SupportedOp]:
5757
SupportedOp(name="log_act", inputs=1),
5858
SupportedOp(name="negative", inputs=1),
5959
SupportedOp(name="relu", inputs=1),
60+
SupportedOp(name="prelu", inputs=2),
6061
SupportedOp(name="sigmoid", inputs=1),
6162
SupportedOp(name="sign", inputs=1),
6263
SupportedOp(name="sin_act", inputs=1),

intel_npu_acceleration_library/nn/functional.py

Lines changed: 54 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -443,15 +443,45 @@ def layer_norm(
443443
"""
444444
axis = input.shape.index(normalized_shape[0])
445445
ln = generate_op([input], "normL2", axis, eps)
446-
if weight:
446+
if weight is not None:
447447
ln = ln * weight
448448

449-
if bias:
449+
if bias is not None:
450450
ln = ln + bias
451451

452452
return ln
453453

454454

455+
@implements(torch.nn.functional.normalize)
def normalize(
    input: Tensor,
    p: float = 2.0,
    dim: int = 1,
    eps: float = 1e-12,
    out: Optional[Tensor] = None,
) -> Tensor:
    """Perform Lp normalization of the input tensor over dimension ``dim``.

    Args:
        input (Tensor): The input tensor.
        p (float): The power value. Defaults to 2.0.
        dim (int): The dim to normalize. Defaults to 1.
        eps (float): The epsilon value. Defaults to 1e-12.
        out (Optional[Tensor], optional): Output tensor. Defaults to None.

    Raises:
        NotImplementedError: p != 2 is not supported yet

    Returns:
        Tensor: Output tensor.
    """
    if p == 2:
        # L2 normalization maps directly onto the backend "normL2" op.
        return generate_op([input], "normL2", dim, eps)
    raise NotImplementedError("p != 2 is not supported yet")
483+
484+
455485
@implements(torch.ceil)
456486
def ceil(x: Tensor, out: Optional[Tensor] = None) -> Tensor:
457487
"""Return the ceil of a tensor element-wise.
@@ -814,6 +844,20 @@ def relu(x: Tensor, inplace=False) -> Tensor:
814844
return out
815845

816846

847+
@implements(torch.nn.functional.prelu)
def prelu(x: Tensor, weight: Tensor) -> Tensor:
    """Apply the parametric relu activation to a tensor element-wise.

    Args:
        x (Tensor): The input tensor.
        weight (Tensor): The weights tensor.

    Returns:
        Tensor: Output tensor.
    """
    out = generate_op([x, weight], "prelu")
    return out
859+
860+
817861
@implements(torch.nn.functional.sigmoid)
818862
def sigmoid(x: Tensor) -> Tensor:
819863
"""Return the sigmoid of a tensor element-wise.
@@ -955,6 +999,10 @@ def adaptive_avg_pool2d(input: Tensor, output_size: Sequence[int]):
955999
Returns:
9561000
Tensor: Output tensor.
9571001
"""
1002+
if output_size == 1:
1003+
return generate_op(
1004+
[input], "reduce_mean", reduction_axes=[-2, -1], keep_dims=True
1005+
)
9581006
return generate_op([input, output_size], "adaptive_avg_pool")
9591007

9601008

@@ -977,6 +1025,10 @@ def adaptive_max_pool2d(
9771025
"""
9781026
if return_indices:
9791027
raise NotImplementedError("return_indices is not supported yet")
1028+
if output_size == 1:
1029+
return generate_op(
1030+
[input], "reduce_max", reduction_axes=[-2, -1], keep_dims=True
1031+
)
9801032
return generate_op([input, output_size], "adaptive_max_pool")
9811033

9821034

src/bindings.cpp

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -262,6 +262,11 @@ intel_npu_acceleration_library_DLL_API ov::op::Op* relu(intel_npu_acceleration_l
262262
return factory->relu(in0);
263263
}
264264

265+
// C binding: forwards the input node and the slope node to
// ModelFactory::prelu and returns the created PRelu graph node.
intel_npu_acceleration_library_DLL_API ov::op::Op* prelu(intel_npu_acceleration_library::ModelFactory* factory,
                                                         ov::op::Op* in0, ov::op::Op* in1) {
    return factory->prelu(in0, in1);
}
269+
265270
intel_npu_acceleration_library_DLL_API ov::op::Op* sigmoid(intel_npu_acceleration_library::ModelFactory* factory,
266271
ov::op::Op* in0) {
267272
return factory->sigmoid(in0);

0 commit comments

Comments
 (0)