
Commit f12a89e

[WebNN EP] Support GroupQueryAttention(GQA) (microsoft#23416)
### Description

Adds support for GroupQueryAttention via WebNN matmul, transpose, reshape, and other operations that follow the logic in the GQA subgraph below.

```
Abbreviations: B is batch_size, S is sequence_length, W is hidden_size, P is past_sequence_length,
               N is number of attention heads, H is head size, W=N*H, h=Sqrt(H), G is group size.
GQA inputs: query, key, value, past_key, past_value, seqlens_k, total_sequence_length
Notes: If the data type of the inputs (qkv and past kv) is float16, we cast them to float32
       to ensure data precision.

         query             key               value
           |                |                  |
        Reshape          Reshape            Reshape     (B,S,H,N)
           |                |                  |
     q_Transpose            |     past_key    |      past_value      seqlens_k
      (0,2,1,3)             |        |        |          |               |
           |                |        |        |          |       (scatter_indices*)
           |                |        |        |          |          /         \
           |       present_key <- ScatterND   +--> ScatterND --> present_value
           |                |                          |
           |            Expand(G)                  Expand(G)
           |                |                          |
           |           k_Transpose                     |
           |            (0,1,3,2)                      |
           |                |                          |
           +----------------+--------------------------+   (attention_bias, one/finfo_min mask*)
                            |
          +---------------------------------------+
          |       ScaledDotProductAttention       |
          +---------------------------------------+
                            |
                          output
```

The ScaledDotProductAttention logic is:

```
ScaledDotProductAttention Subgraph: the basis for MultiHeadAttention and GroupQueryAttention
inputs: query, key, value, scale, attention mask, and reshape_output_shape (for reshape)
Abbreviations: B is batch_size, S is query sequence_length, kv_S is key/value sequence length,
               N is number of attention heads, H is head size, W is hidden_size

      query    key
        |       |
        +matmul-+   scale
            |         |
            +---div---+   attn_mask
                 |           |
                 +----add----+   value
                       |           |
                       +--matmul---+
                            |
                  (0,2,1,3) transpose   B,H,S,N -> B,S,H,N
                            |
                         Reshape        B,S,H,N -> B,S,W
                            |
                          output
```

scatter_indices's calculation:

```
                            if_prefill (0/1 constant)
                                      |
                  0 ---> Where <--- Cast <--- seqlens_k
                                      |
                                scatter_pos*
                                      |
  scatter_indices_left_constant      Add <--- scatter_indices_right_constant
                |                     |
                +----------+----------+
                           |
                    scatter_indices
```

attention_bias's calculation:

```
 ones_array (shape=B,N,S,P)    range_of_qkv_sequence_length_constant (0,1,2,...) (shape=S)
          |                                     |
  CumSum (axis=3, exclusive=true,              Add <--- scatter_pos
          reversed=false)                       |
          |                                Expand (shape=P,S)
          |                                     |
          +--------------> Lesser <-------- Transpose (1,0)
                             |
             1 ---> Where <--- finfo_min (minimum value of FP32)
                             |
                      attention_bias
```

*Note: currently we only support `past_sequence_length == total_sequence_length` for GQA.*

### Motivation and Context
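The scatter_pos selection and attention_bias construction above can be sketched in plain Python. This is an illustrative reading of the subgraphs, not the EP code: the helper names are hypothetical, the exact off-by-one of the causal cutoff and the additive 0/finfo_min form (the subgraph itself draws a one/finfo_min mask) are assumptions.

```python
FINFO_MIN = -3.4028234663852886e+38  # lowest finite float32, stands in for finfo_min


def scatter_pos(if_prefill: bool, seqlens_k: int) -> int:
    # Where(if_prefill, 0, Cast(seqlens_k)): during prefill the new kv is
    # written starting at position 0; during decode it is appended after
    # the past sequence. (Hypothetical helper name.)
    return 0 if if_prefill else seqlens_k


def attention_bias(S: int, P: int, pos: int) -> list[list[float]]:
    """Sketch of the attention_bias subgraph for one (B, N) slice.

    The exclusive CumSum over an all-ones array yields the key index j in
    each column; Lesser keeps the causally visible keys, and Where maps
    visible -> 0.0, hidden -> FINFO_MIN so the bias can be added to the
    attention scores before softmax. The "+ 1" cutoff is an assumption
    about how seqlens_k is counted.
    """
    bias = []
    for i in range(S):            # query index (the range constant, Add pos)
        allowed = i + pos + 1
        bias.append([0.0 if j < allowed else FINFO_MIN for j in range(P)])
    return bias
```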
1 parent c5d1416
20 files changed: +718 −37 lines

js/web/docs/webnn-operators.md

Lines changed: 1 addition & 0 deletions
```diff
@@ -49,6 +49,7 @@ platforms. Check the [WebNN status](https://webmachinelearning.github.io/webnn-s
 | GlobalLpPool| ai.onnx(7+) | l2Pool2d | Only supports 4-D input, 'p' value is 2 |
 | Greater | ai.onnx(7-8, 9-12, 13+) | greater | |
 | GreaterOrEqual | ai.onnx(12-15, 16+) | greaterOrEqual | |
+| GroupQueryAttention | com.microsoft(1+) | add, cast, concat, constant, cumulativeSum, div, expand, lesser, matmul, reshape, scatterND, softmax, transpose, where | Only supports a constant total_sequence_length input; past_sequence_length of past kv must equal present_sequence_length of present kv. Does not support cos_cache and sin_cache inputs |
 | GRU | ai.onnx(7-13, 14-21, 22+) | gru | Only supports 'layout' == 0. 'clip' is not supported. The activation functions in 'activations' must be one of 'Relu', 'Tanh', 'Sigmoid'. Forward and backward activations must be the same if bidirectional. 'sequence_lens' if present should be constant with values equal to the first dimension length of input 'X' |
 | HardSigmoid | ai.onnx(7+) | hardSigmoid | |
 | HardSwish | ai.onnx(14+) | hardSwish | |
```

onnxruntime/core/providers/webnn/builders/helper.cc

Lines changed: 8 additions & 8 deletions
```diff
@@ -121,15 +121,15 @@ std::unordered_set<const Node*> GetSupportedNodes(const GraphViewer& graph_viewe
   return supported_nodes;
 }

-bool AreInputDataTypesSame(const std::string_view op_type,
-                           gsl::span<const int32_t> input_types,
-                           const logging::Logger& logger) {
-  for (size_t i = 1; i < input_types.size(); i++) {
-    if (input_types[0] != input_types[i]) {
+bool AreDataTypesSame(const std::string_view op_type,
+                      gsl::span<const int32_t> data_types,
+                      const logging::Logger& logger) {
+  for (size_t i = 1; i < data_types.size(); i++) {
+    if (data_types[0] != data_types[i]) {
       LOGS(logger, VERBOSE) << "[" << op_type
-                            << "] Input data types should be the same, but ["
-                            << input_types[0] << "] does not match "
-                            << input_types[i] << "].";
+                            << "] data types should be the same, but ["
+                            << data_types[0] << "] does not match "
+                            << data_types[i] << "].";
       return false;
     }
   }
```
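The renamed helper's contract is easy to pin down with a small Python analog. This is a sketch for illustration only; the real helper logs through `LOGS(logger, VERBOSE)` rather than printing.

```python
def are_data_types_same(op_type: str, data_types: list[int]) -> bool:
    """Return True iff every entry matches the first; on a mismatch,
    report it (the C++ helper logs at VERBOSE level) and reject the op."""
    for i in range(1, len(data_types)):
        if data_types[0] != data_types[i]:
            print(f"[{op_type}] data types should be the same, but "
                  f"[{data_types[0]}] does not match [{data_types[i]}].")
            return False
    return True
```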

onnxruntime/core/providers/webnn/builders/helper.h

Lines changed: 6 additions & 3 deletions
```diff
@@ -199,6 +199,9 @@ std::unordered_set<const Node*> GetSupportedNodes(const GraphViewer& graph_viewe

 // Some ONNX ops are supported by decomposed WebNN ops.
 const std::map<std::string_view, std::vector<std::string_view>> decomposed_op_map = {
+    {"GroupQueryAttention",
+     {"add", "cast", "concat", "constant", "cumulativeSum", "div", "expand", "lesser", "matmul", "reshape", "scatterND",
+      "softmax", "transpose", "where"}},
     {"LRN", {"add", "averagePool2d", "div", "mul", "pad", "pow", "transpose"}},
     {"MatMulNBits", {"add", "dequantizeLinear", "matmul", "reshape", "transpose"}},
     {"RotaryEmbedding", {"add", "concat", "gather", "mul", "reshape", "split"}},
@@ -361,9 +364,9 @@ const std::map<ONNX_NAMESPACE::TensorProto_DataType, std::string_view> onnx_to_w
     {ONNX_NAMESPACE::TensorProto_DataType_UINT64, "uint64"},
 };

-bool AreInputDataTypesSame(const std::string_view op_type,
-                           gsl::span<const int32_t> input_types,
-                           const logging::Logger& logger);
+bool AreDataTypesSame(const std::string_view op_type,
+                      gsl::span<const int32_t> input_types,
+                      const logging::Logger& logger);
 bool IsSupportedDataType(const int32_t onnx_data_type, const emscripten::val& webnn_supported_data_types);
 bool IsDataTypeSupportedByOp(const std::string_view onnx_op_type,
                              const int32_t onnx_data_type,
```
Lines changed: 72 additions & 0 deletions
Original file line numberDiff line numberDiff line change
```diff
@@ -0,0 +1,72 @@
+// Copyright (c) Microsoft Corporation. All rights reserved.
+// Copyright (c) Intel Corporation. All rights reserved.
+// Licensed under the MIT License.
+
+namespace onnxruntime {
+namespace webnn {
+/*
+ScaledDotProductAttention Subgraph: The basis for MultiHeadAttention and GroupQueryAttention
+inputs: query, key, value, scale, attention mask, and reshape_output_shape (for reshape)
+Abbreviations: B is batch_size, S is query sequence_length, kv_S is key/value sequence length,
+               N is number of attention heads, H is head size, W is hidden_size
+
+      query    key
+        |       |
+        +matmul-+   scale
+            |         |
+            +---div---+   attn_mask
+                 |           |
+                 +----add----+   value
+                       |           |
+                       +--matmul---+
+                            |
+                  (0,2,1,3) transpose   B,H,S,N -> B,S,H,N
+                            |
+                         Reshape        B,S,H,N -> B,S,W
+                            |
+                          output
+*/
+emscripten::val ScaledDotProductAttention(ModelBuilder& model_builder, const Node& node, const logging::Logger& logger,
+                                          emscripten::val query, emscripten::val key, emscripten::val value,
+                                          emscripten::val scale, emscripten::val attn_mask,
+                                          std::vector<uint32_t> reshape_output_shape) {
+  emscripten::val common_options = emscripten::val::object();
+  // B,H,S,N * B,H,kv_S,N = B,H,S,kv_S
+  common_options.set("label", node.Name() + "_/Attention/qkv/matmul_1");
+  emscripten::val matmul_output =
+      model_builder.GetBuilder().call<emscripten::val>("matmul", query, key, common_options);
+
+  common_options.set("label", node.Name() + "_/Attention/qkv/div");
+  emscripten::val div_output =
+      model_builder.GetBuilder().call<emscripten::val>("mul", matmul_output, scale, common_options);
+
+  emscripten::val softmax_input = div_output;
+  if (attn_mask != emscripten::val::undefined()) {
+    common_options.set("label", node.Name() + "_/Attention/attn_mask/softmax_input");
+    softmax_input = model_builder.GetBuilder().call<emscripten::val>("add", div_output, attn_mask, common_options);
+  }
+
+  common_options.set("label", node.Name() + "_/Attention/attn_mask/softmax_input");
+  int32_t softmax_axis = 3;
+  emscripten::val softmax_output =
+      model_builder.GetBuilder().call<emscripten::val>("softmax", softmax_input, softmax_axis, common_options);
+
+  // B,H,S,kv_S * B,H,kv_S,N = B,H,S,N
+  common_options.set("label", node.Name() + "_/Attention/qkv/matmul_2");
+  emscripten::val attn_output =
+      model_builder.GetBuilder().call<emscripten::val>("matmul", softmax_output, value, common_options);
+
+  emscripten::val options = emscripten::val::object();
+  options.set("permutation", emscripten::val::array(std::vector<uint32_t>({0, 2, 1, 3})));
+  options.set("label", node.Name() + "_/Attention/qkv/transpose");
+  attn_output = model_builder.GetBuilder().call<emscripten::val>("transpose", attn_output, options);
+
+  common_options.set("label", node.Name() + "_/Attention/qkv/reshape");
+  attn_output = model_builder.GetBuilder().call<emscripten::val>(
+      "reshape", attn_output, emscripten::val::array(reshape_output_shape), common_options);
+
+  return attn_output;
+}
+
+}  // namespace webnn
+}  // namespace onnxruntime
```
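The decomposition in this helper can be mirrored numerically. The sketch below is a plain-Python single-head version under assumed small shapes: `query` is (S, H), `key_t` is passed pre-transposed as (H, kv_S), `value` is (kv_S, H), and `attn_mask` is an optional additive (S, kv_S) bias. Note the committed helper applies the scale via a `"mul"` call (the diagram's `div` presumably assumes `scale` already holds the reciprocal), so this sketch multiplies too.

```python
import math


def sdpa_single_head(query, key_t, value, scale, attn_mask=None):
    """Plain-Python sketch of the matmul -> scale -> (+mask) -> softmax
    -> matmul chain in the helper above, for one attention head."""
    S, H = len(query), len(query[0])
    kv_S = len(key_t[0])
    out = []
    for i in range(S):
        # scores = (q @ k^T) * scale, mirroring the "mul" call in the helper
        scores = [sum(query[i][h] * key_t[h][j] for h in range(H)) * scale
                  for j in range(kv_S)]
        if attn_mask is not None:
            scores = [s + m for s, m in zip(scores, attn_mask[i])]
        # numerically stable softmax over the key axis
        mx = max(scores)
        exps = [math.exp(s - mx) for s in scores]
        total = sum(exps)
        probs = [e / total for e in exps]
        # weighted sum of value rows
        out.append([sum(probs[j] * value[j][h] for j in range(kv_S))
                    for h in range(H)])
    return out
```

With zero keys the attention weights are uniform, so the output is the mean of the value rows; adding a large-negative mask entry excludes that key, which is exactly how the attention_bias feeds the `add` before softmax.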

onnxruntime/core/providers/webnn/builders/impl/binary_op_builder.cc

Lines changed: 1 addition & 1 deletion
```diff
@@ -69,7 +69,7 @@ bool BinaryOpBuilder::HasSupportedInputsImpl(const GraphViewer&, const Node& nod
     return false;

   std::array<int32_t, 2> input_types{input0_type, input1_type};
-  if (!AreInputDataTypesSame(op_type, input_types, logger)) {
+  if (!AreDataTypesSame(op_type, input_types, logger)) {
     return false;
   }
```

onnxruntime/core/providers/webnn/builders/impl/concat_op_builder.cc

Lines changed: 1 addition & 1 deletion
```diff
@@ -70,7 +70,7 @@ bool ConcatOpBuilder::HasSupportedInputsImpl(const GraphViewer&, const Node& nod
     }

     std::array<int32_t, 2> input_types{input0_type, input_type};
-    if (!AreInputDataTypesSame(op_type, input_types, logger)) {
+    if (!AreDataTypesSame(op_type, input_types, logger)) {
       return false;
     }
   }
```

onnxruntime/core/providers/webnn/builders/impl/conv_op_builder.cc

Lines changed: 1 addition & 1 deletion
```diff
@@ -406,7 +406,7 @@ bool ConvOpBuilder::HasSupportedInputsImpl(const GraphViewer&, const Node& node,
   if (has_input3) {
     input_types.push_back(input3_type);
   }
-  if (!AreInputDataTypesSame(op_type, input_types, logger)) {
+  if (!AreDataTypesSame(op_type, input_types, logger)) {
     return false;
   }
```

onnxruntime/core/providers/webnn/builders/impl/gemm_op_builder.cc

Lines changed: 1 addition & 1 deletion
```diff
@@ -237,7 +237,7 @@ bool GemmOpBuilder::HasSupportedInputsImpl(const GraphViewer&, const Node& node,
   if (has_input3) {
     input_types.push_back(input3_type);
   }
-  if (!AreInputDataTypesSame(op_type, input_types, logger)) {
+  if (!AreDataTypesSame(op_type, input_types, logger)) {
     return false;
   }
```
243243
