[Snippets] Support Fully Connected tokenization #26498
**`snippets/pass/fc_tokenization.hpp`** (new file):

```cpp
// Copyright (C) 2018-2024 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//

#pragma once

#include "openvino/pass/matcher_pass.hpp"
#include "snippets/pass/tokenization.hpp"

namespace ov {
namespace snippets {
namespace pass {

/**
 * @interface TokenizeFCSnippets
 * @brief The pass tokenizes FullyConnected-like MatMuls (MatMuls with a constant path on the B input)
 * @ingroup snippets
 */
class TokenizeFCSnippets : public ov::pass::MatcherPass {
public:
    OPENVINO_RTTI("TokenizeFCSnippets", "0");
    TokenizeFCSnippets(const SnippetsTokenization::Config& config);
};

}  // namespace pass
}  // namespace snippets
}  // namespace ov
```
**`snippets/utils/tokenization_utils.hpp`** (new file):

```cpp
// Copyright (C) 2024 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//

/**
 * @brief A file that contains tokenization-related utilities.
 * @file tokenization_utils.hpp
 */
#pragma once

#include "snippets/op/subgraph.hpp"
#include "snippets/pass/tokenization.hpp"

namespace ov {
namespace snippets {
namespace utils {
/**
 * @brief Tokenizes a node into a Subgraph. Two options are possible (depending on the config's values and internal logic):
 *        1. The node is wrapped in a trivial Subgraph which contains only this node
 *        2. The node is fused into a parent's Subgraph
 * @param node the node which should be tokenized
 * @param config the tokenization config which regulates the tokenization process
 * @return whether the node was tokenized or not
 */
bool tokenize_node(const std::shared_ptr<ov::Node>& node, const ov::snippets::pass::SnippetsTokenization::Config& config);
}  // namespace utils
}  // namespace snippets
}  // namespace ov
```
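The two-option contract described in the `tokenize_node` doc comment can be sketched with a tiny standalone model. `Node` and the logic below are illustrative stand-ins for `ov::Node` and `ov::snippets::op::Subgraph`, not the real OpenVINO implementation:

```cpp
#include <memory>
#include <string>
#include <vector>

// Hypothetical, simplified stand-ins for ov::Node and Subgraph:
// a Subgraph is modeled as a node that owns a list of "body" op names.
struct Node {
    std::string name;
    std::vector<std::shared_ptr<Node>> inputs;  // producer nodes
    bool is_subgraph = false;
    std::vector<std::string> body;              // ops captured inside a Subgraph
};

// Sketch of the tokenize_node contract: either fuse the node into an
// existing parent Subgraph (option 2) or, if no tokenized parent exists,
// wrap it into a fresh trivial Subgraph (option 1).
bool tokenize_node(const std::shared_ptr<Node>& node) {
    for (auto& parent : node->inputs) {
        if (parent->is_subgraph) {
            // Option 2: attach the op to the parent's body.
            parent->body.push_back(node->name);
            return true;
        }
    }
    // Option 1: create a trivial Subgraph containing only this node.
    node->is_subgraph = true;
    node->body = {node->name};
    return true;
}
```

The real helper additionally consults the tokenization config and performs many validity checks; this sketch only captures the wrap-vs-fuse decision.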
**`fc_tokenization.cpp`** (new file):

```cpp
// Copyright (C) 2024 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//

#include "snippets/pass/fc_tokenization.hpp"

#include "openvino/pass/graph_rewrite.hpp"
#include "openvino/pass/pattern/op/wrap_type.hpp"
#include "snippets/itt.hpp"
#include "snippets/op/subgraph.hpp"
#include "snippets/utils/tokenization_utils.hpp"

ov::snippets::pass::TokenizeFCSnippets::TokenizeFCSnippets(const SnippetsTokenization::Config& config) {
    MATCHER_SCOPE(TokenizeFCSnippets);
    // TODO: extend constant path coverage:
    // 1. Transpose support
    // 2. Convert support
    // 3. Decompression subgraphs support (and all the possible compressed-weights-related precisions)
    auto constant = ov::pass::pattern::wrap_type<ov::op::v0::Constant>();
    auto m_matmul = ov::pass::pattern::wrap_type<ov::opset1::MatMul>({ov::pass::pattern::any_input(), constant});

    auto callback = [OV_CAPTURE_CPY_AND_THIS](ov::pass::pattern::Matcher& m) {
        OV_ITT_SCOPED_TASK(ov::pass::itt::domains::SnippetsTransform, "Snippets::op::TokenizeFCSnippets")
        const auto matmul = m.get_match_root();
        if (transformation_callback(matmul)) {
            return false;
        }
        return ov::snippets::utils::tokenize_node(matmul, config);
    };

    auto matcher = std::make_shared<ov::pass::pattern::Matcher>(m_matmul, matcher_name);
    register_matcher(matcher, callback);
}
```

Review discussion on this file:

**Comment:** Do we really need to extract the common tokenization logic to utilities just to tokenize one op? Probably I missed something 🤔 Could you please elaborate on your decision? The only thought I have is that it lets the op be connected to the existing Subgraphs on the first input 🤔

**Comment:** But why not?

**Reply:** You are right, that is one of the reasons why I reused the helper for FC tokenization. Thanks to that, we cover e.g. "Transposes on inputs + FC" cases by tests. Also, moving the tokenization logic into a separate helper is a good prerequisite for a tokenization refactoring: currently, the whole tokenization lives in one large pass. Ideally, I would want to separate this large pass into a sequence of small matcher passes which match only the specific ops and contain only the checks needed for the matched ops. I believe this will improve the readability of the tokenization code and could allow us to configure the pipeline more precisely. And each of these new matchers can reuse the helper.

**Reply:** Cool! Thank you for the explanation! I just wanted to check that I fully got the goal of this PR 😊 This is a really good idea! 🤔
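The matching rule encoded by the pattern in `TokenizeFCSnippets` (a MatMul is "FullyConnected-like" when its B input is produced by a Constant) can be illustrated with a tiny standalone model. `Op` and `is_fc_like` below are illustrative stand-ins, not OpenVINO API:

```cpp
#include <memory>
#include <string>
#include <vector>

// Hypothetical mini op model: just a type name and input producers.
struct Op {
    std::string type;
    std::vector<std::shared_ptr<Op>> inputs;
};

// Sketch of the FC-like predicate: a two-input MatMul whose second (B)
// input comes from a Constant. The real pass expresses this with
// ov::pass::pattern::wrap_type instead of an explicit check.
bool is_fc_like(const std::shared_ptr<Op>& op) {
    return op->type == "MatMul" && op->inputs.size() == 2 &&
           op->inputs[1]->type == "Constant";
}
```

Per the TODO in the source, the real constant path may later also admit Transpose, Convert, and decompression subgraphs between the Constant and the MatMul, which this one-hop check does not model.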
**Comment:** Probably we need to create a static public method in the `TokenizeSnippets` pass instead of creating a new file with one function. What do you think?
**Reply:** I decided to move this into a separate file because there is also a `bool tokenize_nodes(const ov::NodeVector& nodes)` helper which tokenizes a node sequence. Currently it is part of the `TokenizeMHASnippets` pass, but this code can be easily extracted and reused (e.g. for MLP tokenization).

**Comment:** We can also move `AppropriateForSubgraph` here 😁 In general, whether we want it or not, we are moving from one universal tokenization pass towards several transformations responsible for particular pattern families (eltwise/MHA/MLP). From this perspective, this attempt to derive and reuse some common logic seems like a step in the right direction.
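The decomposition described in this thread, several small per-pattern passes sharing one tokenization helper, could be sketched as a toy pipeline. All names here are illustrative assumptions, not the real OpenVINO transformation infrastructure:

```cpp
#include <functional>
#include <memory>
#include <string>
#include <vector>

// Toy op model: a type name and a flag set once the op is tokenized.
struct Op {
    std::string type;
    bool tokenized = false;
};

// Shared helper (stand-in for ov::snippets::utils::tokenize_node).
bool tokenize(const std::shared_ptr<Op>& op) {
    op->tokenized = true;
    return true;
}

// A "pass" is reduced to a name plus a predicate deciding which ops
// it is responsible for (eltwise / MHA / MLP / FC families).
struct TokenizationPass {
    std::string name;
    std::function<bool(const std::shared_ptr<Op>&)> matches;
};

// Run the per-pattern passes in sequence; each one reuses the common helper.
void run_pipeline(const std::vector<TokenizationPass>& passes,
                  const std::vector<std::shared_ptr<Op>>& ops) {
    for (const auto& pass : passes)
        for (const auto& op : ops)
            if (!op->tokenized && pass.matches(op))
                tokenize(op);
}
```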
**Comment:** I think we should go even further and create a dedicated class for tokenization (`SnippetsNodeTokenizer` or something similar). This class should have three methods: a private `bool check_necessary(node)`, a public virtual `bool check_sufficient(node)`, and a public `bool fuse(node)`.

- `check_necessary` will perform all the fundamental plugin-independent checks (like cyclic dependencies, num_results_children etc.) and can potentially also gather some aggregated info (internal/external inputs, body parameters etc.). If possible, we should separate the check from the aggregated info gathering (another method, `analyze`).
- `check_sufficient` will be overridden by the plugin and will contain backend-specific checks, possibly partially based on the gathered aggregated info (hidden_data_count, unique_buffer_count etc.).
- `fuse` will call `check_necessary() && check_sufficient()` and create a subgraph based on the aggregated info.

So the idea is that the plugin creates its own instance of this `SnippetsNodeTokenizer` and passes it to all the tokenization transformations. The transformations can use this class to do all the dirty work, plus they can impose their own limitations of course. For example, the eltwise tokenization pass will additionally check op types and precisions.

@a-sidorova, @v-Golubev what do you think? I'm not saying we should refactor it now, but let's try to outline a more convenient and scalable design.
**Reply:** @IvanNovoselov your idea looks interesting, but I need some time to think about whether the proposed architecture is sufficient. Can we allocate a time slot in the next team meeting to discuss it?
**Comment:** It seems like we really need to discuss how the current tokenization logic can be refactored and improved.
**Reply:** Yes, sure, let's discuss it on the sync.