@@ -2566,6 +2566,46 @@ ulong4 intel_subgroup_block_read_transpose_u64_k4(__global void *base_address,
2566
2566
2567
2567
#endif //defined(cl_intel_subgroup_extended_block_read)
2568
2568
2569
+ #ifdef cl_intel_subgroup_extended_block_read_cacheopts
2570
+ extern enum LSC_LDCC ;
2571
+ extern enum LSC_STCC ;
2572
+
2573
+ ushort2 intel_subgroup_block_read_cacheopts_u8_m1k32v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2574
+ ushort4 intel_subgroup_block_read_cacheopts_u8_m2k32v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2575
+ ushort8 intel_subgroup_block_read_cacheopts_u8_m4k32v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2576
+ ushort16 intel_subgroup_block_read_cacheopts_u8_m8k32v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2577
+ ushort2 intel_subgroup_block_read_cacheopts_u16_m1k16v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2578
+ ushort4 intel_subgroup_block_read_cacheopts_u16_m2k16v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2579
+ ushort8 intel_subgroup_block_read_cacheopts_u16_m4k16v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2580
+ ushort16 intel_subgroup_block_read_cacheopts_u16_m8k16v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2581
+ uint8 intel_subgroup_block_read_cacheopts_transform_u8_k32 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2582
+ uint8 intel_subgroup_block_read_cacheopts_transform_u16_k16 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2583
+ uint8 intel_subgroup_block_read_cacheopts_transpose_u32_k8 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2584
+ ulong4 intel_subgroup_block_read_cacheopts_transpose_u64_k4 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2585
+
2586
+ void intel_subgroup_block_write_cacheopts_u8_m1k32v1 (__global void * base_address , int width , int height , int pitch , int2 coord , ushort val , enum LSC_STCC cache_control );
2587
+ void intel_subgroup_block_write_cacheopts_u8_m2k32v1 (__global void * base_address , int width , int height , int pitch , int2 coord , ushort2 val , enum LSC_STCC cache_control );
2588
+ void intel_subgroup_block_write_cacheopts_u8_m4k32v1 (__global void * base_address , int width , int height , int pitch , int2 coord , ushort4 val , enum LSC_STCC cache_control );
2589
+ void intel_subgroup_block_write_cacheopts_u8_m8k32v1 (__global void * base_address , int width , int height , int pitch , int2 coord , ushort8 val , enum LSC_STCC cache_control );
2590
+ void intel_subgroup_block_write_cacheopts_u16_m1k16v1 (__global void * base_address , int width , int height , int pitch , int2 coord , ushort val , enum LSC_STCC cache_control );
2591
+ void intel_subgroup_block_write_cacheopts_u16_m2k16v1 (__global void * base_address , int width , int height , int pitch , int2 coord , ushort2 val , enum LSC_STCC cache_control );
2592
+ void intel_subgroup_block_write_cacheopts_u16_m4k16v1 (__global void * base_address , int width , int height , int pitch , int2 coord , ushort4 val , enum LSC_STCC cache_control );
2593
+ void intel_subgroup_block_write_cacheopts_u16_m8k16v1 (__global void * base_address , int width , int height , int pitch , int2 coord , ushort8 val , enum LSC_STCC cache_control );
2594
+
2595
+ void intel_subgroup_block_prefetch_u8_m1k32v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2596
+ void intel_subgroup_block_prefetch_u8_m2k32v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2597
+ void intel_subgroup_block_prefetch_u8_m4k32v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2598
+ void intel_subgroup_block_prefetch_u8_m8k32v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2599
+ void intel_subgroup_block_prefetch_u16_m1k16v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2600
+ void intel_subgroup_block_prefetch_u16_m2k16v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2601
+ void intel_subgroup_block_prefetch_u16_m4k16v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2602
+ void intel_subgroup_block_prefetch_u16_m8k16v2 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2603
+ void intel_subgroup_block_prefetch_transform_u8_k32 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2604
+ void intel_subgroup_block_prefetch_transform_u16_k16 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2605
+ void intel_subgroup_block_prefetch_transpose_u32_k8 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2606
+ void intel_subgroup_block_prefetch_transpose_u64_k4 (__global void * base_address , int width , int height , int pitch , int2 coord , enum LSC_LDCC cache_control );
2607
+ #endif //defined(cl_intel_subgroup_extended_block_read_cacheopts)
2608
+
2569
2609
void global_barrier ();
2570
2610
2571
2611
//
0 commit comments