@@ -433,10 +433,6 @@ typedef enum ur_function_t {
433
433
UR_FUNCTION_BINDLESS_IMAGES_MAP_EXTERNAL_LINEAR_MEMORY_EXP = 245,
434
434
/// Enumerator for ::urEnqueueEventsWaitWithBarrierExt
435
435
UR_FUNCTION_ENQUEUE_EVENTS_WAIT_WITH_BARRIER_EXT = 246,
436
- /// Enumerator for ::urTensorMapEncodeIm2ColExp
437
- UR_FUNCTION_TENSOR_MAP_ENCODE_IM_2_COL_EXP = 247,
438
- /// Enumerator for ::urTensorMapEncodeTiledExp
439
- UR_FUNCTION_TENSOR_MAP_ENCODE_TILED_EXP = 248,
440
436
/// Enumerator for ::urPhysicalMemGetInfo
441
437
UR_FUNCTION_PHYSICAL_MEM_GET_INFO = 249,
442
438
/// @cond
@@ -12133,258 +12129,6 @@ UR_APIEXPORT ur_result_t UR_APICALL urEnqueueNativeCommandExp(
12133
12129
/// array.
12134
12130
ur_event_handle_t *phEvent);
12135
12131
12136
- #if !defined(__GNUC__)
12137
- #pragma endregion
12138
- #endif
12139
- // Intel 'oneAPI' Unified Runtime Experimental API for mapping tensor objects
12140
- #if !defined(__GNUC__)
12141
- #pragma region tensor_map_(experimental)
12142
- #endif
12143
- ///////////////////////////////////////////////////////////////////////////////
12144
- /// @brief Handle of tensor map object
12145
- typedef struct ur_exp_tensor_map_handle_t_ *ur_exp_tensor_map_handle_t;
12146
-
12147
- ///////////////////////////////////////////////////////////////////////////////
12148
- /// @brief Tensor map data type
12149
- typedef uint32_t ur_exp_tensor_map_data_type_flags_t;
12150
- typedef enum ur_exp_tensor_map_data_type_flag_t {
12151
- /// 1 byte
12152
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_UINT8 = UR_BIT(0),
12153
- /// 2 bytes
12154
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_UINT16 = UR_BIT(1),
12155
- /// 4 bytes
12156
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_UINT32 = UR_BIT(2),
12157
- /// 4 bytes
12158
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_INT32 = UR_BIT(3),
12159
- /// 8 bytes
12160
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_UINT64 = UR_BIT(4),
12161
- /// 8 bytes
12162
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_INT64 = UR_BIT(5),
12163
- /// 2 bytes
12164
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_FLOAT16 = UR_BIT(6),
12165
- /// 4 bytes
12166
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_FLOAT32 = UR_BIT(7),
12167
- /// 8 bytes
12168
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_FLOAT64 = UR_BIT(8),
12169
- /// 2 bytes
12170
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_BFLOAT16 = UR_BIT(9),
12171
- /// 4 bytes
12172
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_FLOAT32_FTZ = UR_BIT(10),
12173
- /// 4 bytes
12174
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_TFLOAT32 = UR_BIT(11),
12175
- /// 4 bytes
12176
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_TFLOAT32_FTZ = UR_BIT(12),
12177
- /// @cond
12178
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_FORCE_UINT32 = 0x7fffffff
12179
- /// @endcond
12180
-
12181
- } ur_exp_tensor_map_data_type_flag_t;
12182
- /// @brief Bit Mask for validating ur_exp_tensor_map_data_type_flags_t
12183
- #define UR_EXP_TENSOR_MAP_DATA_TYPE_FLAGS_MASK 0xffffe000
12184
-
12185
- ///////////////////////////////////////////////////////////////////////////////
12186
- /// @brief Tensor map interleave
12187
- typedef uint32_t ur_exp_tensor_map_interleave_flags_t;
12188
- typedef enum ur_exp_tensor_map_interleave_flag_t {
12189
- /// No interleave
12190
- UR_EXP_TENSOR_MAP_INTERLEAVE_FLAG_NONE = UR_BIT(0),
12191
- /// 16B interleave
12192
- UR_EXP_TENSOR_MAP_INTERLEAVE_FLAG_16B = UR_BIT(1),
12193
- /// 32B interleave
12194
- UR_EXP_TENSOR_MAP_INTERLEAVE_FLAG_32B = UR_BIT(2),
12195
- /// @cond
12196
- UR_EXP_TENSOR_MAP_INTERLEAVE_FLAG_FORCE_UINT32 = 0x7fffffff
12197
- /// @endcond
12198
-
12199
- } ur_exp_tensor_map_interleave_flag_t;
12200
- /// @brief Bit Mask for validating ur_exp_tensor_map_interleave_flags_t
12201
- #define UR_EXP_TENSOR_MAP_INTERLEAVE_FLAGS_MASK 0xfffffff8
12202
-
12203
- ///////////////////////////////////////////////////////////////////////////////
12204
- /// @brief Tensor map l2 promotion
12205
- typedef uint32_t ur_exp_tensor_map_l2_promotion_flags_t;
12206
- typedef enum ur_exp_tensor_map_l2_promotion_flag_t {
12207
- /// No promotion type
12208
- UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAG_NONE = UR_BIT(0),
12209
- /// 64B promotion type
12210
- UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAG_64B = UR_BIT(1),
12211
- /// 128B promotion type
12212
- UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAG_128B = UR_BIT(2),
12213
- /// 256B promotion type
12214
- UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAG_256B = UR_BIT(3),
12215
- /// @cond
12216
- UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAG_FORCE_UINT32 = 0x7fffffff
12217
- /// @endcond
12218
-
12219
- } ur_exp_tensor_map_l2_promotion_flag_t;
12220
- /// @brief Bit Mask for validating ur_exp_tensor_map_l2_promotion_flags_t
12221
- #define UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAGS_MASK 0xfffffff0
12222
-
12223
- ///////////////////////////////////////////////////////////////////////////////
12224
- /// @brief Tensor map swizzle
12225
- typedef uint32_t ur_exp_tensor_map_swizzle_flags_t;
12226
- typedef enum ur_exp_tensor_map_swizzle_flag_t {
12227
- /// No swizzle
12228
- UR_EXP_TENSOR_MAP_SWIZZLE_FLAG_NONE = UR_BIT(0),
12229
- /// 32B swizzle
12230
- UR_EXP_TENSOR_MAP_SWIZZLE_FLAG_32B = UR_BIT(1),
12231
- /// 64B swizzle
12232
- UR_EXP_TENSOR_MAP_SWIZZLE_FLAG_64B = UR_BIT(2),
12233
- /// 128B swizzle
12234
- UR_EXP_TENSOR_MAP_SWIZZLE_FLAG_128B = UR_BIT(3),
12235
- /// @cond
12236
- UR_EXP_TENSOR_MAP_SWIZZLE_FLAG_FORCE_UINT32 = 0x7fffffff
12237
- /// @endcond
12238
-
12239
- } ur_exp_tensor_map_swizzle_flag_t;
12240
- /// @brief Bit Mask for validating ur_exp_tensor_map_swizzle_flags_t
12241
- #define UR_EXP_TENSOR_MAP_SWIZZLE_FLAGS_MASK 0xfffffff0
12242
-
12243
- ///////////////////////////////////////////////////////////////////////////////
12244
- /// @brief Tensor map OOB fill
12245
- typedef uint32_t ur_exp_tensor_map_oob_fill_flags_t;
12246
- typedef enum ur_exp_tensor_map_oob_fill_flag_t {
12247
- /// No OOB fill
12248
- UR_EXP_TENSOR_MAP_OOB_FILL_FLAG_NONE = UR_BIT(0),
12249
- /// Refer to NVIDIA docs
12250
- UR_EXP_TENSOR_MAP_OOB_FILL_FLAG_REQUEST_ZERO_FMA = UR_BIT(1),
12251
- /// @cond
12252
- UR_EXP_TENSOR_MAP_OOB_FILL_FLAG_FORCE_UINT32 = 0x7fffffff
12253
- /// @endcond
12254
-
12255
- } ur_exp_tensor_map_oob_fill_flag_t;
12256
- /// @brief Bit Mask for validating ur_exp_tensor_map_oob_fill_flags_t
12257
- #define UR_EXP_TENSOR_MAP_OOB_FILL_FLAGS_MASK 0xfffffffc
12258
-
12259
- ///////////////////////////////////////////////////////////////////////////////
12260
- /// @brief Encode tensor map with image data
12261
- ///
12262
- /// @details
12263
- /// - Map encode using im2col.
12264
- ///
12265
- /// @returns
12266
- /// - ::UR_RESULT_SUCCESS
12267
- /// - ::UR_RESULT_ERROR_UNINITIALIZED
12268
- /// - ::UR_RESULT_ERROR_DEVICE_LOST
12269
- /// - ::UR_RESULT_ERROR_ADAPTER_SPECIFIC
12270
- /// - ::UR_RESULT_ERROR_INVALID_NULL_HANDLE
12271
- /// + `NULL == hDevice`
12272
- /// - ::UR_RESULT_ERROR_INVALID_ENUMERATION
12273
- /// + `::UR_EXP_TENSOR_MAP_DATA_TYPE_FLAGS_MASK & TensorMapType`
12274
- /// + `::UR_EXP_TENSOR_MAP_INTERLEAVE_FLAGS_MASK & Interleave`
12275
- /// + `::UR_EXP_TENSOR_MAP_SWIZZLE_FLAGS_MASK & Swizzle`
12276
- /// + `::UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAGS_MASK & L2Promotion`
12277
- /// + `::UR_EXP_TENSOR_MAP_OOB_FILL_FLAGS_MASK & OobFill`
12278
- /// - ::UR_RESULT_ERROR_INVALID_NULL_POINTER
12279
- /// + `NULL == GlobalAddress`
12280
- /// + `NULL == GlobalDim`
12281
- /// + `NULL == GlobalStrides`
12282
- /// + `NULL == PixelBoxLowerCorner`
12283
- /// + `NULL == PixelBoxUpperCorner`
12284
- /// + `NULL == ElementStrides`
12285
- /// + `NULL == hTensorMap`
12286
- /// - ::UR_RESULT_ERROR_INVALID_ARGUMENT
12287
- /// + `TensorRank < 3`
12288
- UR_APIEXPORT ur_result_t UR_APICALL urTensorMapEncodeIm2ColExp(
12289
- /// [in] Handle of the device object.
12290
- ur_device_handle_t hDevice,
12291
- /// [in] Data type of the tensor object.
12292
- ur_exp_tensor_map_data_type_flags_t TensorMapType,
12293
- /// [in] Dimensionality of tensor; must be at least 3.
12294
- uint32_t TensorRank,
12295
- /// [in] Starting address of memory region described by tensor.
12296
- void *GlobalAddress,
12297
- /// [in] Array containing tensor size (number of elements) along each of
12298
- /// the TensorRank dimensions.
12299
- const uint64_t *GlobalDim,
12300
- /// [in] Array containing stride size (in bytes) along each of the
12301
- /// TensorRank - 1 dimensions.
12302
- const uint64_t *GlobalStrides,
12303
- /// [in] Array containing DHW dimensions of lower box corner.
12304
- const int *PixelBoxLowerCorner,
12305
- /// [in] Array containing DHW dimensions of upper box corner.
12306
- const int *PixelBoxUpperCorner,
12307
- /// [in] Number of channels per pixel.
12308
- uint32_t ChannelsPerPixel,
12309
- /// [in] Number of pixels per column.
12310
- uint32_t PixelsPerColumn,
12311
- /// [in] Array containing traversal stride in each of the TensorRank
12312
- /// dimensions.
12313
- const uint32_t *ElementStrides,
12314
- /// [in] Type of interleaved layout the tensor addresses
12315
- ur_exp_tensor_map_interleave_flags_t Interleave,
12316
- /// [in] Bank swizzling pattern inside shared memory
12317
- ur_exp_tensor_map_swizzle_flags_t Swizzle,
12318
- /// [in] L2 promotion size.
12319
- ur_exp_tensor_map_l2_promotion_flags_t L2Promotion,
12320
- /// [in] Indicates whether zero or special NaN constant will be used to
12321
- /// fill out-of-bounds elements.
12322
- ur_exp_tensor_map_oob_fill_flags_t OobFill,
12323
- /// [out] Handle of the tensor map object.
12324
- ur_exp_tensor_map_handle_t *hTensorMap);
12325
-
12326
- ///////////////////////////////////////////////////////////////////////////////
12327
- /// @brief Encode tensor map with tiled data
12328
- ///
12329
- /// @details
12330
- /// - Tiled map encode.
12331
- ///
12332
- /// @returns
12333
- /// - ::UR_RESULT_SUCCESS
12334
- /// - ::UR_RESULT_ERROR_UNINITIALIZED
12335
- /// - ::UR_RESULT_ERROR_DEVICE_LOST
12336
- /// - ::UR_RESULT_ERROR_ADAPTER_SPECIFIC
12337
- /// - ::UR_RESULT_ERROR_INVALID_NULL_HANDLE
12338
- /// + `NULL == hDevice`
12339
- /// - ::UR_RESULT_ERROR_INVALID_ENUMERATION
12340
- /// + `::UR_EXP_TENSOR_MAP_DATA_TYPE_FLAGS_MASK & TensorMapType`
12341
- /// + `::UR_EXP_TENSOR_MAP_INTERLEAVE_FLAGS_MASK & Interleave`
12342
- /// + `::UR_EXP_TENSOR_MAP_SWIZZLE_FLAGS_MASK & Swizzle`
12343
- /// + `::UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAGS_MASK & L2Promotion`
12344
- /// + `::UR_EXP_TENSOR_MAP_OOB_FILL_FLAGS_MASK & OobFill`
12345
- /// - ::UR_RESULT_ERROR_INVALID_NULL_POINTER
12346
- /// + `NULL == GlobalAddress`
12347
- /// + `NULL == GlobalDim`
12348
- /// + `NULL == GlobalStrides`
12349
- /// + `NULL == BoxDim`
12350
- /// + `NULL == ElementStrides`
12351
- /// + `NULL == hTensorMap`
12352
- /// - ::UR_RESULT_ERROR_INVALID_ARGUMENT
12353
- /// + `TensorRank < 3`
12354
- UR_APIEXPORT ur_result_t UR_APICALL urTensorMapEncodeTiledExp(
12355
- /// [in] Handle of the device object.
12356
- ur_device_handle_t hDevice,
12357
- /// [in] Data type of the tensor object.
12358
- ur_exp_tensor_map_data_type_flags_t TensorMapType,
12359
- /// [in] Dimensionality of tensor; must be at least 3.
12360
- uint32_t TensorRank,
12361
- /// [in] Starting address of memory region described by tensor.
12362
- void *GlobalAddress,
12363
- /// [in] Array containing tensor size (number of elements) along each of
12364
- /// the TensorRank dimensions.
12365
- const uint64_t *GlobalDim,
12366
- /// [in] Array containing stride size (in bytes) along each of the
12367
- /// TensorRank - 1 dimensions.
12368
- const uint64_t *GlobalStrides,
12369
- /// [in] Array containing traversal box size (number of elements) along
12370
- /// each of the TensorRank dimensions. Specifies how many elements are
12371
- /// traversed along each tensor dimension.
12372
- const uint32_t *BoxDim,
12373
- /// [in] Array containing traversal stride in each of the TensorRank
12374
- /// dimensions.
12375
- const uint32_t *ElementStrides,
12376
- /// [in] Type of interleaved layout the tensor addresses
12377
- ur_exp_tensor_map_interleave_flags_t Interleave,
12378
- /// [in] Bank swizzling pattern inside shared memory
12379
- ur_exp_tensor_map_swizzle_flags_t Swizzle,
12380
- /// [in] L2 promotion size.
12381
- ur_exp_tensor_map_l2_promotion_flags_t L2Promotion,
12382
- /// [in] Indicates whether zero or special NaN constant will be used to
12383
- /// fill out-of-bounds elements.
12384
- ur_exp_tensor_map_oob_fill_flags_t OobFill,
12385
- /// [out] Handle of the tensor map object.
12386
- ur_exp_tensor_map_handle_t *hTensorMap);
12387
-
12388
12132
#if !defined(__GNUC__)
12389
12133
#pragma endregion
12390
12134
#endif
@@ -14574,49 +14318,6 @@ typedef struct ur_command_buffer_command_get_info_exp_params_t {
14574
14318
size_t **ppPropSizeRet;
14575
14319
} ur_command_buffer_command_get_info_exp_params_t;
14576
14320
14577
- ///////////////////////////////////////////////////////////////////////////////
14578
- /// @brief Function parameters for urTensorMapEncodeIm2ColExp
14579
- /// @details Each entry is a pointer to the parameter passed to the function;
14580
- /// allowing the callback the ability to modify the parameter's value
14581
- typedef struct ur_tensor_map_encode_im_2_col_exp_params_t {
14582
- ur_device_handle_t *phDevice;
14583
- ur_exp_tensor_map_data_type_flags_t *pTensorMapType;
14584
- uint32_t *pTensorRank;
14585
- void **pGlobalAddress;
14586
- const uint64_t **pGlobalDim;
14587
- const uint64_t **pGlobalStrides;
14588
- const int **pPixelBoxLowerCorner;
14589
- const int **pPixelBoxUpperCorner;
14590
- uint32_t *pChannelsPerPixel;
14591
- uint32_t *pPixelsPerColumn;
14592
- const uint32_t **pElementStrides;
14593
- ur_exp_tensor_map_interleave_flags_t *pInterleave;
14594
- ur_exp_tensor_map_swizzle_flags_t *pSwizzle;
14595
- ur_exp_tensor_map_l2_promotion_flags_t *pL2Promotion;
14596
- ur_exp_tensor_map_oob_fill_flags_t *pOobFill;
14597
- ur_exp_tensor_map_handle_t **phTensorMap;
14598
- } ur_tensor_map_encode_im_2_col_exp_params_t;
14599
-
14600
- ///////////////////////////////////////////////////////////////////////////////
14601
- /// @brief Function parameters for urTensorMapEncodeTiledExp
14602
- /// @details Each entry is a pointer to the parameter passed to the function;
14603
- /// allowing the callback the ability to modify the parameter's value
14604
- typedef struct ur_tensor_map_encode_tiled_exp_params_t {
14605
- ur_device_handle_t *phDevice;
14606
- ur_exp_tensor_map_data_type_flags_t *pTensorMapType;
14607
- uint32_t *pTensorRank;
14608
- void **pGlobalAddress;
14609
- const uint64_t **pGlobalDim;
14610
- const uint64_t **pGlobalStrides;
14611
- const uint32_t **pBoxDim;
14612
- const uint32_t **pElementStrides;
14613
- ur_exp_tensor_map_interleave_flags_t *pInterleave;
14614
- ur_exp_tensor_map_swizzle_flags_t *pSwizzle;
14615
- ur_exp_tensor_map_l2_promotion_flags_t *pL2Promotion;
14616
- ur_exp_tensor_map_oob_fill_flags_t *pOobFill;
14617
- ur_exp_tensor_map_handle_t **phTensorMap;
14618
- } ur_tensor_map_encode_tiled_exp_params_t;
14619
-
14620
14321
///////////////////////////////////////////////////////////////////////////////
14621
14322
/// @brief Function parameters for urUsmP2PEnablePeerAccessExp
14622
14323
/// @details Each entry is a pointer to the parameter passed to the function;
0 commit comments