Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Fix the aten::mv for pytorch models #22073 #22677

Merged
merged 24 commits into from
Mar 25, 2024
Merged
Show file tree
Hide file tree
Changes from 8 commits
Commits
Show all changes
24 commits
Select commit Hold shift + click to select a range
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
41 changes: 41 additions & 0 deletions src/frontends/pytorch/src/op/matmul.cpp
mvafin marked this conversation as resolved.
Show resolved Hide resolved
Original file line number Diff line number Diff line change
@@ -0,0 +1,41 @@
#include "openvino/frontend/pytorch/node_context.hpp"
#include "openvino/op/matmul.hpp"
#include "pt_framework_node.hpp"
#include "openvino/op/convert.hpp"
#include "openvino/op/convert_like.hpp"
#include "utils.hpp"

namespace ov {
namespace frontend {
namespace pytorch {
namespace op {
using namespace ov::op;

/// @brief Converts a PyTorch `aten::mv` node into an OpenVINO MatMul.
///
/// Input 0 is the matrix operand and input 1 is the vector operand. Both are
/// converted to f32 and multiplied with a MatMul node. When a third input is
/// present (not None), the result is also passed to `mutate_input(2, ...)`.
///
/// @param context Node context giving access to the inputs of the node.
/// @return A single-element OutputVector holding the MatMul result.
OutputVector translate_mv(const NodeContext& context) {
    // "aten::mv(Tensor input, Tensor vec) -> Tensor"
    // Two or three inputs are accepted; the optional third one is presumably
    // the `out` tensor of the out-variant schema - TODO confirm.
    num_inputs_check(context, 2, 3);

    // Both operands are explicitly converted to f32 before the multiplication.
    // NOTE(review): this makes the result f32 regardless of the input dtype
    // (e.g. f64 or f16 inputs); confirm this is intended, or align the operand
    // types instead of forcing f32.
    auto matrix = context.mark_node(std::make_shared<v0::Convert>(context.get_input(0), element::f32));
    auto vector = context.mark_node(std::make_shared<v0::Convert>(context.get_input(1), element::f32));

    // MatMul is declared in the v0 namespace; there is no v1::MatMul.
    auto result = context.mark_node(std::make_shared<v0::MatMul>(matrix, vector));

    if (!context.input_is_none(2)) {
        context.mutate_input(2, result);
    }

    return {result};
}

}  // namespace op
}  // namespace pytorch
}  // namespace frontend
}  // namespace ov
2 changes: 2 additions & 0 deletions src/frontends/pytorch/src/op_table.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -125,6 +125,7 @@ OP_CONVERTER(translate_lstm);
OP_CONVERTER(translate_masked_fill);
OP_CONVERTER(translate_masked_scatter);
OP_CONVERTER(translate_max);
OP_CONVERTER(translate_mv);
mvafin marked this conversation as resolved.
Show resolved Hide resolved
OP_CONVERTER(translate_max_dim);
OP_CONVERTER(translate_maximum);
OP_CONVERTER(translate_max_poolnd);
Expand Down Expand Up @@ -482,6 +483,7 @@ const std::map<std::string, CreatorFunction> get_supported_ops_ts() {
{"aten::masked_scatter_", op::inplace_op<op::translate_masked_scatter>},
{"aten::matmul", op::translate_1to1_match_2_inputs<opset10::MatMul>},
{"aten::max", op::translate_max},
{"aten::mv", op::translate_mv},
mvafin marked this conversation as resolved.
Show resolved Hide resolved
{"aten::maximum", op::translate_maximum},
{"aten::max_pool1d", op::quantizable_op<op::translate_max_poolnd>},
{"aten::max_pool1d_with_indices", op::quantizable_op<op::translate_max_poolnd>},
Expand Down
37 changes: 37 additions & 0 deletions tests/layer_tests/pytorch_tests/test_matmul.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,37 @@
import numpy as np
import pytest
import torch
from pytorch_layer_test_class import PytorchLayerTest

class TestMVOperation(PytorchLayerTest):
    """Layer test for ``torch.mv`` (matrix-vector product, ``aten::mv``)."""

    def _prepare_input(self, matrix, vector):
        """Return the matrix and vector as float32 numpy arrays, in that order."""
        matrix_input = np.array(matrix).astype(np.float32)
        vector_input = np.array(vector).astype(np.float32)
        return [matrix_input, vector_input]

    def create_model(self, matrix, vector):
        """Build the module under test.

        ``matrix`` and ``vector`` are not used to build the model; they are
        kept so the signature matches the call in ``test_mv_operation``.

        Returns a tuple of (model, reference net, expected op kind).
        """
        class CustomMVOperation(torch.nn.Module):
            def forward(self, matrix, vector):
                # torch.mv performs the matrix-vector multiplication.
                return torch.mv(matrix, vector)

        model_class = CustomMVOperation()
        ref_net = None
        return model_class, ref_net, "aten::mv"

    @pytest.mark.nightly
    @pytest.mark.precommit
    @pytest.mark.parametrize("matrix, vector", [
        # 2x2 square matrix
        (np.array([[1, 2], [3, 4]]), np.array([5, 6])),
        # all-zero matrix
        (np.array([[0, 0], [0, 0]]), np.array([1, 2])),
        # wide non-square matrix (2x3)
        (np.array([[1, 2, 3], [4, 5, 6]]), np.array([0, 1, 0])),
        # tall non-square matrix (3x2)
        (np.array([[1, 2], [3, 4], [5, 6]]), np.array([1, -1])),
        # 3x3 identity matrix
        (np.array([[1, 0, 0], [0, 1, 0], [0, 0, 1]]), np.array([2, 3, 4])),
    ])
    def test_mv_operation(self, matrix, vector, ie_device, precision, ir_version):
        self._test(
            *self.create_model(matrix, vector),
            ie_device,
            precision,
            ir_version,
            kwargs_to_prepare_input={"matrix": matrix, "vector": vector}
        )
Loading