@@ -433,10 +433,6 @@ typedef enum ur_function_t {
433
433
UR_FUNCTION_BINDLESS_IMAGES_MAP_EXTERNAL_LINEAR_MEMORY_EXP = 245,
434
434
/// Enumerator for ::urEnqueueEventsWaitWithBarrierExt
435
435
UR_FUNCTION_ENQUEUE_EVENTS_WAIT_WITH_BARRIER_EXT = 246,
436
- /// Enumerator for ::urTensorMapEncodeIm2ColExp
437
- UR_FUNCTION_TENSOR_MAP_ENCODE_IM_2_COL_EXP = 247,
438
- /// Enumerator for ::urTensorMapEncodeTiledExp
439
- UR_FUNCTION_TENSOR_MAP_ENCODE_TILED_EXP = 248,
440
436
/// Enumerator for ::urPhysicalMemGetInfo
441
437
UR_FUNCTION_PHYSICAL_MEM_GET_INFO = 249,
442
438
/// @cond
@@ -12131,258 +12127,6 @@ UR_APIEXPORT ur_result_t UR_APICALL urEnqueueNativeCommandExp(
12131
12127
/// array.
12132
12128
ur_event_handle_t *phEvent);
12133
12129
12134
- #if !defined(__GNUC__)
12135
- #pragma endregion
12136
- #endif
12137
- // Intel 'oneAPI' Unified Runtime Experimental API for mapping tensor objects
12138
- #if !defined(__GNUC__)
12139
- #pragma region tensor_map_(experimental)
12140
- #endif
12141
- ///////////////////////////////////////////////////////////////////////////////
12142
- /// @brief Handle of tensor map object
12143
- typedef struct ur_exp_tensor_map_handle_t_ *ur_exp_tensor_map_handle_t;
12144
-
12145
- ///////////////////////////////////////////////////////////////////////////////
12146
- /// @brief Tensor map data type
12147
- typedef uint32_t ur_exp_tensor_map_data_type_flags_t;
12148
- typedef enum ur_exp_tensor_map_data_type_flag_t {
12149
- /// 1 byte
12150
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_UINT8 = UR_BIT(0),
12151
- /// 2 bytes
12152
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_UINT16 = UR_BIT(1),
12153
- /// 4 bytes
12154
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_UINT32 = UR_BIT(2),
12155
- /// 4 bytes
12156
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_INT32 = UR_BIT(3),
12157
- /// 8 bytes
12158
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_UINT64 = UR_BIT(4),
12159
- /// 8 bytes
12160
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_INT64 = UR_BIT(5),
12161
- /// 2 bytes
12162
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_FLOAT16 = UR_BIT(6),
12163
- /// 4 bytes
12164
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_FLOAT32 = UR_BIT(7),
12165
- /// 8 bytes
12166
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_FLOAT64 = UR_BIT(8),
12167
- /// 2 bytes
12168
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_BFLOAT16 = UR_BIT(9),
12169
- /// 4 bytes
12170
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_FLOAT32_FTZ = UR_BIT(10),
12171
- /// 4 bytes
12172
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_TFLOAT32 = UR_BIT(11),
12173
- /// 4 bytes
12174
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_TFLOAT32_FTZ = UR_BIT(12),
12175
- /// @cond
12176
- UR_EXP_TENSOR_MAP_DATA_TYPE_FLAG_FORCE_UINT32 = 0x7fffffff
12177
- /// @endcond
12178
-
12179
- } ur_exp_tensor_map_data_type_flag_t;
12180
- /// @brief Bit Mask for validating ur_exp_tensor_map_data_type_flags_t
12181
- #define UR_EXP_TENSOR_MAP_DATA_TYPE_FLAGS_MASK 0xffffe000
12182
-
12183
- ///////////////////////////////////////////////////////////////////////////////
12184
- /// @brief Tensor map interleave
12185
- typedef uint32_t ur_exp_tensor_map_interleave_flags_t;
12186
- typedef enum ur_exp_tensor_map_interleave_flag_t {
12187
- /// No interleave
12188
- UR_EXP_TENSOR_MAP_INTERLEAVE_FLAG_NONE = UR_BIT(0),
12189
- /// 16B interleave
12190
- UR_EXP_TENSOR_MAP_INTERLEAVE_FLAG_16B = UR_BIT(1),
12191
- /// 32B interleave
12192
- UR_EXP_TENSOR_MAP_INTERLEAVE_FLAG_32B = UR_BIT(2),
12193
- /// @cond
12194
- UR_EXP_TENSOR_MAP_INTERLEAVE_FLAG_FORCE_UINT32 = 0x7fffffff
12195
- /// @endcond
12196
-
12197
- } ur_exp_tensor_map_interleave_flag_t;
12198
- /// @brief Bit Mask for validating ur_exp_tensor_map_interleave_flags_t
12199
- #define UR_EXP_TENSOR_MAP_INTERLEAVE_FLAGS_MASK 0xfffffff8
12200
-
12201
- ///////////////////////////////////////////////////////////////////////////////
12202
- /// @brief Tensor map l2 promotion
12203
- typedef uint32_t ur_exp_tensor_map_l2_promotion_flags_t;
12204
- typedef enum ur_exp_tensor_map_l2_promotion_flag_t {
12205
- /// No promotion type
12206
- UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAG_NONE = UR_BIT(0),
12207
- /// 64B promotion type
12208
- UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAG_64B = UR_BIT(1),
12209
- /// 128B promotion type
12210
- UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAG_128B = UR_BIT(2),
12211
- /// 256B promotion type
12212
- UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAG_256B = UR_BIT(3),
12213
- /// @cond
12214
- UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAG_FORCE_UINT32 = 0x7fffffff
12215
- /// @endcond
12216
-
12217
- } ur_exp_tensor_map_l2_promotion_flag_t;
12218
- /// @brief Bit Mask for validating ur_exp_tensor_map_l2_promotion_flags_t
12219
- #define UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAGS_MASK 0xfffffff0
12220
-
12221
- ///////////////////////////////////////////////////////////////////////////////
12222
- /// @brief Tensor map swizzle
12223
- typedef uint32_t ur_exp_tensor_map_swizzle_flags_t;
12224
- typedef enum ur_exp_tensor_map_swizzle_flag_t {
12225
- /// No swizzle
12226
- UR_EXP_TENSOR_MAP_SWIZZLE_FLAG_NONE = UR_BIT(0),
12227
- /// 32B swizzle
12228
- UR_EXP_TENSOR_MAP_SWIZZLE_FLAG_32B = UR_BIT(1),
12229
- /// 64B swizzle
12230
- UR_EXP_TENSOR_MAP_SWIZZLE_FLAG_64B = UR_BIT(2),
12231
- /// 128B swizzle
12232
- UR_EXP_TENSOR_MAP_SWIZZLE_FLAG_128B = UR_BIT(3),
12233
- /// @cond
12234
- UR_EXP_TENSOR_MAP_SWIZZLE_FLAG_FORCE_UINT32 = 0x7fffffff
12235
- /// @endcond
12236
-
12237
- } ur_exp_tensor_map_swizzle_flag_t;
12238
- /// @brief Bit Mask for validating ur_exp_tensor_map_swizzle_flags_t
12239
- #define UR_EXP_TENSOR_MAP_SWIZZLE_FLAGS_MASK 0xfffffff0
12240
-
12241
- ///////////////////////////////////////////////////////////////////////////////
12242
- /// @brief Tensor map OOB fill
12243
- typedef uint32_t ur_exp_tensor_map_oob_fill_flags_t;
12244
- typedef enum ur_exp_tensor_map_oob_fill_flag_t {
12245
- /// No OOB fill
12246
- UR_EXP_TENSOR_MAP_OOB_FILL_FLAG_NONE = UR_BIT(0),
12247
- /// Refer to NVIDIA docs
12248
- UR_EXP_TENSOR_MAP_OOB_FILL_FLAG_REQUEST_ZERO_FMA = UR_BIT(1),
12249
- /// @cond
12250
- UR_EXP_TENSOR_MAP_OOB_FILL_FLAG_FORCE_UINT32 = 0x7fffffff
12251
- /// @endcond
12252
-
12253
- } ur_exp_tensor_map_oob_fill_flag_t;
12254
- /// @brief Bit Mask for validating ur_exp_tensor_map_oob_fill_flags_t
12255
- #define UR_EXP_TENSOR_MAP_OOB_FILL_FLAGS_MASK 0xfffffffc
12256
-
12257
- ///////////////////////////////////////////////////////////////////////////////
12258
- /// @brief Encode tensor map with image data
12259
- ///
12260
- /// @details
12261
- /// - Map encode using im2col.
12262
- ///
12263
- /// @returns
12264
- /// - ::UR_RESULT_SUCCESS
12265
- /// - ::UR_RESULT_ERROR_UNINITIALIZED
12266
- /// - ::UR_RESULT_ERROR_DEVICE_LOST
12267
- /// - ::UR_RESULT_ERROR_ADAPTER_SPECIFIC
12268
- /// - ::UR_RESULT_ERROR_INVALID_NULL_HANDLE
12269
- /// + `NULL == hDevice`
12270
- /// - ::UR_RESULT_ERROR_INVALID_ENUMERATION
12271
- /// + `::UR_EXP_TENSOR_MAP_DATA_TYPE_FLAGS_MASK & TensorMapType`
12272
- /// + `::UR_EXP_TENSOR_MAP_INTERLEAVE_FLAGS_MASK & Interleave`
12273
- /// + `::UR_EXP_TENSOR_MAP_SWIZZLE_FLAGS_MASK & Swizzle`
12274
- /// + `::UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAGS_MASK & L2Promotion`
12275
- /// + `::UR_EXP_TENSOR_MAP_OOB_FILL_FLAGS_MASK & OobFill`
12276
- /// - ::UR_RESULT_ERROR_INVALID_NULL_POINTER
12277
- /// + `NULL == GlobalAddress`
12278
- /// + `NULL == GlobalDim`
12279
- /// + `NULL == GlobalStrides`
12280
- /// + `NULL == PixelBoxLowerCorner`
12281
- /// + `NULL == PixelBoxUpperCorner`
12282
- /// + `NULL == ElementStrides`
12283
- /// + `NULL == hTensorMap`
12284
- /// - ::UR_RESULT_ERROR_INVALID_ARGUMENT
12285
- /// + `TensorRank < 3`
12286
- UR_APIEXPORT ur_result_t UR_APICALL urTensorMapEncodeIm2ColExp(
12287
- /// [in] Handle of the device object.
12288
- ur_device_handle_t hDevice,
12289
- /// [in] Data type of the tensor object.
12290
- ur_exp_tensor_map_data_type_flags_t TensorMapType,
12291
- /// [in] Dimensionality of tensor; must be at least 3.
12292
- uint32_t TensorRank,
12293
- /// [in] Starting address of memory region described by tensor.
12294
- void *GlobalAddress,
12295
- /// [in] Array containing tensor size (number of elements) along each of
12296
- /// the TensorRank dimensions.
12297
- const uint64_t *GlobalDim,
12298
- /// [in] Array containing stride size (in bytes) along each of the
12299
- /// TensorRank - 1 dimensions.
12300
- const uint64_t *GlobalStrides,
12301
- /// [in] Array containing DHW dimensions of lower box corner.
12302
- const int *PixelBoxLowerCorner,
12303
- /// [in] Array containing DHW dimensions of upper box corner.
12304
- const int *PixelBoxUpperCorner,
12305
- /// [in] Number of channels per pixel.
12306
- uint32_t ChannelsPerPixel,
12307
- /// [in] Number of pixels per column.
12308
- uint32_t PixelsPerColumn,
12309
- /// [in] Array containing traversal stride in each of the TensorRank
12310
- /// dimensions.
12311
- const uint32_t *ElementStrides,
12312
- /// [in] Type of interleaved layout the tensor addresses
12313
- ur_exp_tensor_map_interleave_flags_t Interleave,
12314
- /// [in] Bank swizzling pattern inside shared memory
12315
- ur_exp_tensor_map_swizzle_flags_t Swizzle,
12316
- /// [in] L2 promotion size.
12317
- ur_exp_tensor_map_l2_promotion_flags_t L2Promotion,
12318
- /// [in] Indicates whether zero or special NaN constant will be used to
12319
- /// fill out-of-bounds elements.
12320
- ur_exp_tensor_map_oob_fill_flags_t OobFill,
12321
- /// [out] Handle of the tensor map object.
12322
- ur_exp_tensor_map_handle_t *hTensorMap);
12323
-
12324
- ///////////////////////////////////////////////////////////////////////////////
12325
- /// @brief Encode tensor map with tiled data
12326
- ///
12327
- /// @details
12328
- /// - Tiled map encode.
12329
- ///
12330
- /// @returns
12331
- /// - ::UR_RESULT_SUCCESS
12332
- /// - ::UR_RESULT_ERROR_UNINITIALIZED
12333
- /// - ::UR_RESULT_ERROR_DEVICE_LOST
12334
- /// - ::UR_RESULT_ERROR_ADAPTER_SPECIFIC
12335
- /// - ::UR_RESULT_ERROR_INVALID_NULL_HANDLE
12336
- /// + `NULL == hDevice`
12337
- /// - ::UR_RESULT_ERROR_INVALID_ENUMERATION
12338
- /// + `::UR_EXP_TENSOR_MAP_DATA_TYPE_FLAGS_MASK & TensorMapType`
12339
- /// + `::UR_EXP_TENSOR_MAP_INTERLEAVE_FLAGS_MASK & Interleave`
12340
- /// + `::UR_EXP_TENSOR_MAP_SWIZZLE_FLAGS_MASK & Swizzle`
12341
- /// + `::UR_EXP_TENSOR_MAP_L2_PROMOTION_FLAGS_MASK & L2Promotion`
12342
- /// + `::UR_EXP_TENSOR_MAP_OOB_FILL_FLAGS_MASK & OobFill`
12343
- /// - ::UR_RESULT_ERROR_INVALID_NULL_POINTER
12344
- /// + `NULL == GlobalAddress`
12345
- /// + `NULL == GlobalDim`
12346
- /// + `NULL == GlobalStrides`
12347
- /// + `NULL == BoxDim`
12348
- /// + `NULL == ElementStrides`
12349
- /// + `NULL == hTensorMap`
12350
- /// - ::UR_RESULT_ERROR_INVALID_ARGUMENT
12351
- /// + `TensorRank < 3`
12352
- UR_APIEXPORT ur_result_t UR_APICALL urTensorMapEncodeTiledExp(
12353
- /// [in] Handle of the device object.
12354
- ur_device_handle_t hDevice,
12355
- /// [in] Data type of the tensor object.
12356
- ur_exp_tensor_map_data_type_flags_t TensorMapType,
12357
- /// [in] Dimensionality of tensor; must be at least 3.
12358
- uint32_t TensorRank,
12359
- /// [in] Starting address of memory region described by tensor.
12360
- void *GlobalAddress,
12361
- /// [in] Array containing tensor size (number of elements) along each of
12362
- /// the TensorRank dimensions.
12363
- const uint64_t *GlobalDim,
12364
- /// [in] Array containing stride size (in bytes) along each of the
12365
- /// TensorRank - 1 dimensions.
12366
- const uint64_t *GlobalStrides,
12367
- /// [in] Array containing traversal box size (number of elments) along
12368
- /// each of the TensorRank dimensions. Specifies how many elements to be
12369
- /// traversed along each tensor dimension.
12370
- const uint32_t *BoxDim,
12371
- /// [in] Array containing traversal stride in each of the TensorRank
12372
- /// dimensions.
12373
- const uint32_t *ElementStrides,
12374
- /// [in] Type of interleaved layout the tensor addresses
12375
- ur_exp_tensor_map_interleave_flags_t Interleave,
12376
- /// [in] Bank swizzling pattern inside shared memory
12377
- ur_exp_tensor_map_swizzle_flags_t Swizzle,
12378
- /// [in] L2 promotion size.
12379
- ur_exp_tensor_map_l2_promotion_flags_t L2Promotion,
12380
- /// [in] Indicates whether zero or special NaN constant will be used to
12381
- /// fill out-of-bounds elements.
12382
- ur_exp_tensor_map_oob_fill_flags_t OobFill,
12383
- /// [out] Handle of the tensor map object.
12384
- ur_exp_tensor_map_handle_t *hTensorMap);
12385
-
12386
12130
#if !defined(__GNUC__)
12387
12131
#pragma endregion
12388
12132
#endif
@@ -14572,49 +14316,6 @@ typedef struct ur_command_buffer_command_get_info_exp_params_t {
14572
14316
size_t **ppPropSizeRet;
14573
14317
} ur_command_buffer_command_get_info_exp_params_t;
14574
14318
14575
- ///////////////////////////////////////////////////////////////////////////////
14576
- /// @brief Function parameters for urTensorMapEncodeIm2ColExp
14577
- /// @details Each entry is a pointer to the parameter passed to the function;
14578
- /// allowing the callback the ability to modify the parameter's value
14579
- typedef struct ur_tensor_map_encode_im_2_col_exp_params_t {
14580
- ur_device_handle_t *phDevice;
14581
- ur_exp_tensor_map_data_type_flags_t *pTensorMapType;
14582
- uint32_t *pTensorRank;
14583
- void **pGlobalAddress;
14584
- const uint64_t **pGlobalDim;
14585
- const uint64_t **pGlobalStrides;
14586
- const int **pPixelBoxLowerCorner;
14587
- const int **pPixelBoxUpperCorner;
14588
- uint32_t *pChannelsPerPixel;
14589
- uint32_t *pPixelsPerColumn;
14590
- const uint32_t **pElementStrides;
14591
- ur_exp_tensor_map_interleave_flags_t *pInterleave;
14592
- ur_exp_tensor_map_swizzle_flags_t *pSwizzle;
14593
- ur_exp_tensor_map_l2_promotion_flags_t *pL2Promotion;
14594
- ur_exp_tensor_map_oob_fill_flags_t *pOobFill;
14595
- ur_exp_tensor_map_handle_t **phTensorMap;
14596
- } ur_tensor_map_encode_im_2_col_exp_params_t;
14597
-
14598
- ///////////////////////////////////////////////////////////////////////////////
14599
- /// @brief Function parameters for urTensorMapEncodeTiledExp
14600
- /// @details Each entry is a pointer to the parameter passed to the function;
14601
- /// allowing the callback the ability to modify the parameter's value
14602
- typedef struct ur_tensor_map_encode_tiled_exp_params_t {
14603
- ur_device_handle_t *phDevice;
14604
- ur_exp_tensor_map_data_type_flags_t *pTensorMapType;
14605
- uint32_t *pTensorRank;
14606
- void **pGlobalAddress;
14607
- const uint64_t **pGlobalDim;
14608
- const uint64_t **pGlobalStrides;
14609
- const uint32_t **pBoxDim;
14610
- const uint32_t **pElementStrides;
14611
- ur_exp_tensor_map_interleave_flags_t *pInterleave;
14612
- ur_exp_tensor_map_swizzle_flags_t *pSwizzle;
14613
- ur_exp_tensor_map_l2_promotion_flags_t *pL2Promotion;
14614
- ur_exp_tensor_map_oob_fill_flags_t *pOobFill;
14615
- ur_exp_tensor_map_handle_t **phTensorMap;
14616
- } ur_tensor_map_encode_tiled_exp_params_t;
14617
-
14618
14319
///////////////////////////////////////////////////////////////////////////////
14619
14320
/// @brief Function parameters for urUsmP2PEnablePeerAccessExp
14620
14321
/// @details Each entry is a pointer to the parameter passed to the function;
0 commit comments