intel
diff --git a/unified-runtime/include/ur_api.h b/unified-runtime/include/ur_api.h
Lines changed: 6 additions & 0 deletions
diff --git a/unified-runtime/include/ur_print.hpp b/unified-runtime/include/ur_print.hpp
Lines changed: 10 additions & 0 deletions
diff --git a/unified-runtime/scripts/core/exp-launch-properties.yml b/unified-runtime/scripts/core/exp-launch-properties.yml
Lines changed: 6 additions & 0 deletions
diff --git a/unified-runtime/source/adapters/cuda/enqueue.cpp b/unified-runtime/source/adapters/cuda/enqueue.cpp
Lines changed: 7 additions & 0 deletions
diff --git a/unified-runtime/test/conformance/exp_launch_properties/launch_properties.cpp b/unified-runtime/test/conformance/exp_launch_properties/launch_properties.cpp
Lines changed: 9 additions & 0 deletions
@@ -36,6 +36,8 @@ etors:
       desc: "work-group cluster dimensions"
     - name: WORK_GROUP_MEMORY
       desc: "Implicit work group memory allocation"
+    - name: OPPORTUNISTIC_QUEUE_SERIALIZE
+      desc: "Whether to opportunistically execute kernel launches serially on a native queue"
 --- #--------------------------------------------------------------------------
 type: union
 desc: "Specifies a launch property value"
@@ -56,6 +58,10 @@ members:
       name: workgroup_mem_size
       desc: "[in] non-zero value indicates the amount of work group memory to allocate in bytes"
       tag: $X_EXP_LAUNCH_PROPERTY_ID_WORK_GROUP_MEMORY
+    - type: int
+      name: opportunistic_queue_serialize
+      desc: "[in] non-zero value indicates that the kernel launch may be opportunistically serialized on the native queue"
+      tag: $X_EXP_LAUNCH_PROPERTY_ID_OPPORTUNISTIC_QUEUE_SERIALIZE
 --- #--------------------------------------------------------------------------
 type: struct
 desc: "Kernel launch property"
 
@@ -560,6 +560,13 @@ UR_APIEXPORT ur_result_t UR_APICALL urEnqueueKernelLaunchCustomExp(
       attr.value.cooperative = launchPropList[i].value.cooperative;
       break;
     }
+    case UR_EXP_LAUNCH_PROPERTY_ID_OPPORTUNISTIC_QUEUE_SERIALIZE: {
+      auto &attr = launch_attribute.emplace_back();
+      attr.id = CU_LAUNCH_ATTRIBUTE_PROGRAMMATIC_STREAM_SERIALIZATION;
+      attr.value.programmaticStreamSerializationAllowed =
+          launchPropList[i].value.opportunistic_queue_serialize;
+      break;
+    }
     case UR_EXP_LAUNCH_PROPERTY_ID_WORK_GROUP_MEMORY: {
       break;
     }
 
@@ -66,6 +66,15 @@ TEST_P(urEnqueueKernelLaunchCustomTest, Success) {
       props.push_back(coop_prop);
     }
 
+    if (compute_capability >= 9.0) {
+      ur_exp_launch_property_t opportunistic_queue_serialize_prop;
+      opportunistic_queue_serialize_prop.id =
+          UR_EXP_LAUNCH_PROPERTY_ID_OPPORTUNISTIC_QUEUE_SERIALIZE;
+      opportunistic_queue_serialize_prop.value.opportunistic_queue_serialize =
+          1;
+      props.push_back(opportunistic_queue_serialize_prop);
+    }
+
     ur_bool_t cluster_launch_supported = false;
     ASSERT_SUCCESS(
         urDeviceGetInfo(device, UR_DEVICE_INFO_CLUSTER_LAUNCH_SUPPORT_EXP,
Original file line number	Diff line number	Diff line change
`@@ -560,6 +560,13 @@ UR_APIEXPORT ur_result_t UR_APICALL urEnqueueKernelLaunchCustomExp(`
`560`	`560`	`attr.value.cooperative = launchPropList[i].value.cooperative;`
`561`	`561`	`break;`
`562`	`562`	`}`
	`563`	`+ case UR_EXP_LAUNCH_PROPERTY_ID_OPPORTUNISTIC_QUEUE_SERIALIZE: {`
	`564`	`+ auto &attr = launch_attribute.emplace_back();`
	`565`	`+ attr.id = CU_LAUNCH_ATTRIBUTE_PROGRAMMATIC_STREAM_SERIALIZATION;`
	`566`	`+ attr.value.programmaticStreamSerializationAllowed =`
	`567`	`+ launchPropList[i].value.opportunistic_queue_serialize;`
	`568`	`+ break;`
	`569`	`+ }`
`563`	`570`	`case UR_EXP_LAUNCH_PROPERTY_ID_WORK_GROUP_MEMORY: {`
`564`	`571`	`break;`
`565`	`572`	`}`