@@ -500,19 +500,19 @@ entry:
500
500
;
501
501
; @llvm.nvvm.suld.<NDims>.array.v<NChannels><DType>.clamp
502
502
;
503
- ; <NDims> = { 1d, 2d, 3d }
503
+ ; <NDims> = { 1d, 2d }
504
504
; <NChannels> = { 2, 4 }
505
505
; <DType> = { i8, i16, i32 }
506
506
;
507
- ; Note: The case of NChannels=1 doesn't need to be handled here as it can be
507
+ ; Note: The case of NChannels=1 does not need to be handled here as it can be
508
508
; called directly.
509
509
510
510
511
511
; @llvm.nvvm.suld.<NDims>.array.v<NChannels>{i8, i16, i32}.clamp
512
512
513
513
; - @llvm.nvvm.suld.<NDims>.array.v{2, 4}i8.clamp
514
514
515
- ; - - @llvm.nvvm.suld.{1d, 2d, 3d }.array.v2i8.clamp
515
+ ; - - @llvm.nvvm.suld.{1d, 2d}.array.v2i8.clamp
516
516
517
517
declare {i16 ,i16 } @llvm.nvvm.suld.1d.array.v2i8.clamp (i64 , i32 , i32 )
518
518
define <2 x i16 > @__clc_llvm_nvvm_suld_1d_array_v2i8_clamp (i64 %img , i32 %idx , i32 %x ) nounwind alwaysinline {
@@ -530,15 +530,7 @@ entry:
530
530
ret <2 x i16 > %1
531
531
}
532
532
533
- declare {i16 ,i16 } @llvm.nvvm.suld.3d.array.v2i8.clamp (i64 , i32 , i32 , i32 , i32 )
534
- define <2 x i16 > @__clc_llvm_nvvm_suld_3d_array_v2i8_clamp (i64 %img , i32 %idx , i32 %x , i32 %y , i32 %z ) nounwind alwaysinline {
535
- entry:
536
- %0 = tail call {i16 ,i16 } @llvm.nvvm.suld.3d.array.v2i8.clamp (i64 %img , i32 %idx , i32 %x , i32 %y , i32 %z );
537
- %1 = tail call <2 x i16 > @__clc_struct16_to_vector2 ({i16 ,i16 } %0 )
538
- ret <2 x i16 > %1
539
- }
540
-
541
- ; - - @llvm.nvvm.suld.{1d, 2d, 3d}.array.v4i8.clamp
533
+ ; - - @llvm.nvvm.suld.{1d, 2d}.array.v4i8.clamp
542
534
543
535
declare {i16 ,i16 ,i16 ,i16 } @llvm.nvvm.suld.1d.array.v4i8.clamp (i64 , i32 , i32 )
544
536
define <4 x i16 > @__clc_llvm_nvvm_suld_1d_array_v4i8_clamp (i64 %img , i32 %idx , i32 %x ) nounwind alwaysinline {
@@ -556,17 +548,9 @@ entry:
556
548
ret <4 x i16 > %1
557
549
}
558
550
559
- declare {i16 ,i16 ,i16 ,i16 } @llvm.nvvm.suld.3d.array.v4i8.clamp (i64 , i32 , i32 , i32 , i32 )
560
- define <4 x i16 > @__clc_llvm_nvvm_suld_3d_array_v4i8_clamp (i64 %img , i32 %idx , i32 %x , i32 %y , i32 %z ) nounwind alwaysinline {
561
- entry:
562
- %0 = tail call {i16 ,i16 ,i16 ,i16 } @llvm.nvvm.suld.3d.array.v4i8.clamp (i64 %img , i32 %idx , i32 %x , i32 %y , i32 %z );
563
- %1 = tail call <4 x i16 > @__clc_struct16_to_vector ({i16 ,i16 ,i16 ,i16 } %0 )
564
- ret <4 x i16 > %1
565
- }
566
-
567
551
; - @llvm.nvvm.suld.<NDims>.array.v{2, 4}i16.clamp
568
552
569
- ; - - @llvm.nvvm.suld.{1d, 2d, 3d }.array.v2i16.clamp
553
+ ; - - @llvm.nvvm.suld.{1d, 2d}.array.v2i16.clamp
570
554
571
555
declare {i16 ,i16 } @llvm.nvvm.suld.1d.array.v2i16.clamp (i64 , i32 , i32 )
572
556
define <2 x i16 > @__clc_llvm_nvvm_suld_1d_array_v2i16_clamp (i64 %img , i32 %idx , i32 %x ) nounwind alwaysinline {
@@ -584,15 +568,7 @@ entry:
584
568
ret <2 x i16 > %1
585
569
}
586
570
587
- declare {i16 ,i16 } @llvm.nvvm.suld.3d.array.v2i16.clamp (i64 , i32 , i32 , i32 , i32 )
588
- define <2 x i16 > @__clc_llvm_nvvm_suld_3d_array_v2i16_clamp (i64 %img , i32 %idx , i32 %x , i32 %y , i32 %z ) nounwind alwaysinline {
589
- entry:
590
- %0 = tail call {i16 ,i16 } @llvm.nvvm.suld.3d.array.v2i16.clamp (i64 %img , i32 %idx , i32 %x , i32 %y , i32 %z );
591
- %1 = tail call <2 x i16 > @__clc_struct16_to_vector2 ({i16 ,i16 } %0 )
592
- ret <2 x i16 > %1
593
- }
594
-
595
- ; - - @llvm.nvvm.suld.{1d, 2d, 3d}.array.v4i16.clamp
571
+ ; - - @llvm.nvvm.suld.{1d, 2d}.array.v4i16.clamp
596
572
597
573
declare {i16 ,i16 ,i16 ,i16 } @llvm.nvvm.suld.1d.array.v4i16.clamp (i64 , i32 , i32 )
598
574
define <4 x i16 > @__clc_llvm_nvvm_suld_1d_array_v4i16_clamp (i64 %img , i32 %idx , i32 %x ) nounwind alwaysinline {
@@ -610,17 +586,9 @@ entry:
610
586
ret <4 x i16 > %1
611
587
}
612
588
613
- declare {i16 ,i16 ,i16 ,i16 } @llvm.nvvm.suld.3d.array.v4i16.clamp (i64 , i32 , i32 , i32 , i32 )
614
- define <4 x i16 > @__clc_llvm_nvvm_suld_3d_array_v4i16_clamp (i64 %img , i32 %idx , i32 %x , i32 %y , i32 %z ) nounwind alwaysinline {
615
- entry:
616
- %0 = tail call {i16 ,i16 ,i16 ,i16 } @llvm.nvvm.suld.3d.array.v4i16.clamp (i64 %img , i32 %idx , i32 %x , i32 %y , i32 %z );
617
- %1 = tail call <4 x i16 > @__clc_struct16_to_vector ({i16 ,i16 ,i16 ,i16 } %0 )
618
- ret <4 x i16 > %1
619
- }
620
-
621
589
; - @llvm.nvvm.suld.<NDims>.array.v{2, 4}i32.clamp
622
590
623
- ; - - @llvm.nvvm.suld.{1d, 2d, 3d }.array.v2i32.clamp
591
+ ; - - @llvm.nvvm.suld.{1d, 2d}.array.v2i32.clamp
624
592
625
593
declare {i32 ,i32 } @llvm.nvvm.suld.1d.array.v2i32.clamp (i64 , i32 , i32 )
626
594
define <2 x i32 > @__clc_llvm_nvvm_suld_1d_array_v2i32_clamp (i64 %img , i32 %idx , i32 %x ) nounwind alwaysinline {
@@ -638,17 +606,9 @@ entry:
638
606
ret <2 x i32 > %1
639
607
}
640
608
641
- declare {i32 ,i32 } @llvm.nvvm.suld.3d.array.v2i32.clamp (i64 , i32 , i32 , i32 , i32 )
642
- define <2 x i32 > @__clc_llvm_nvvm_suld_3d_array_v2i32_clamp (i64 %img , i32 %idx , i32 %x , i32 %y , i32 %z ) nounwind alwaysinline {
643
- entry:
644
- %0 = tail call {i32 ,i32 } @llvm.nvvm.suld.3d.array.v2i32.clamp (i64 %img , i32 %idx , i32 %x , i32 %y , i32 %z );
645
- %1 = tail call <2 x i32 > @__clc_struct32_to_vector2 ({i32 ,i32 } %0 )
646
- ret <2 x i32 > %1
647
- }
648
-
649
609
; - @llvm.nvvm.suld.<NDims>.array.v4i32.clamp
650
610
651
- ; - - @llvm.nvvm.suld.{1d, 2d, 3d }.array.v4i32.clamp
611
+ ; - - @llvm.nvvm.suld.{1d, 2d}.array.v4i32.clamp
652
612
653
613
declare {i32 ,i32 ,i32 ,i32 } @llvm.nvvm.suld.1d.array.v4i32.clamp (i64 , i32 , i32 )
654
614
define <4 x i32 > @__clc_llvm_nvvm_suld_1d_array_v4i32_clamp (i64 %img , i32 %idx , i32 %x ) nounwind alwaysinline {
@@ -665,10 +625,3 @@ entry:
665
625
%1 = tail call <4 x i32 > @__clc_struct32_to_vector ({i32 ,i32 ,i32 ,i32 } %0 )
666
626
ret <4 x i32 > %1
667
627
}
668
-
669
- declare {i32 ,i32 ,i32 ,i32 } @llvm.nvvm.suld.3d.array.v4i32.clamp (i64 , i32 , i32 , i32 , i32 )
670
- define <4 x i32 > @__clc_llvm_nvvm_suld_3d_array_v4i32_clamp (i64 %img , i32 %idx , i32 %x , i32 %y , i32 %z ) nounwind alwaysinline {
671
- entry:
672
- %0 = tail call {i32 ,i32 ,i32 ,i32 } @llvm.nvvm.suld.3d.array.v4i32.clamp (i64 %img , i32 %idx , i32 %x , i32 %y , i32 %z );
673
- %1 = tail call <4 x i32 > @__clc_struct32_to_vector ({i32 ,i32 ,i32 ,i32 } %0 ) ret <4 x i32 > %1
674
- }
0 commit comments