Skip to content
Merged
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9 changes: 9 additions & 0 deletions onnxruntime/core/optimizer/matmul_integer_to_float.cc
Original file line number Diff line number Diff line change
Expand Up @@ -114,6 +114,15 @@ Status MatMulIntegerToFloatFusion::ApplyImpl(Graph& graph, bool& modified, int g
continue;
}

const Node* p_dynamicquantize_node = graph_utils::FirstParentByType(*p_matmulinteger_node, "DynamicQuantizeLinear");

// On the DML EP, skip this node when the MatMulInteger's input comes from DynamicQuantizeLinear.
// For larger tensors, keeping DynamicQuantizeLinear -> MatMulInteger is more resource efficient,
// and DML has better Metacommand coverage for MatMulInteger.
if (is_dml_ep && p_dynamicquantize_node) {
continue;
}

// Find bias node
Node* p_add_node = nullptr;
if (optimizer_utils::CheckOutputEdges(graph, mul_node, 1)) {
Expand Down
Loading