@@ -1061,10 +1061,10 @@ define hidden void @eight_bytes_interleave_op(ptr noalias nocapture noundef writ
1061
1061
; CHECK: LV: Found an estimated cost of 14 for VF 2 For instruction: store i32
1062
1062
; CHECK: LV: Vector loop of width 2 costs: 44.
1063
1063
; CHECK: LV: Found an estimated cost of 18 for VF 4 For instruction: %10 = load i8
1064
- ; CHECK: LV: Found an estimated cost of 36 for VF 4 For instruction: %17 = load i32
1065
- ; CHECK: LV: Found an estimated cost of 36 for VF 4 For instruction: store i32
1066
- ; CHECK: LV: Vector loop of width 4 costs: 32.
1067
- ; CHECK: LV: Selecting VF: 1.
1064
+ ; CHECK: LV: Found an estimated cost of 24 for VF 4 For instruction: %17 = load i32
1065
+ ; CHECK: LV: Found an estimated cost of 24 for VF 4 For instruction: store i32
1066
+ ; CHECK: LV: Vector loop of width 4 costs: 26.
1067
+ ; CHECK: LV: Selecting VF: 4.
1068
1068
define hidden void @four_bytes_into_four_ints_same_op (ptr noalias nocapture noundef %0 , ptr nocapture noundef readonly %1 , ptr nocapture noundef readonly %2 , i32 noundef %3 ) {
1069
1069
%5 = icmp eq i32 %3 , 0
1070
1070
br i1 %5 , label %6 , label %7
@@ -1123,21 +1123,20 @@ define hidden void @four_bytes_into_four_ints_same_op(ptr noalias nocapture noun
1123
1123
br i1 %50 , label %6 , label %7
1124
1124
}
1125
1125
1126
- ; TODO: Should be able to vectorize?
1127
1126
; CHECK-LABEL: four_bytes_into_four_ints_vary_op
1128
1127
; CHECK: Cost of 14 for VF 2: INTERLEAVE-GROUP with factor 4
1129
1128
; CHECK: Cost of 18 for VF 4: INTERLEAVE-GROUP with factor 4
1130
- ; CHECK: Cost of 36 for VF 4: INTERLEAVE-GROUP with factor 4
1129
+ ; CHECK: Cost of 24 for VF 4: INTERLEAVE-GROUP with factor 4
1131
1130
; CHECK: LV: Scalar loop costs: 21.
1132
1131
; CHECK: LV: Found an estimated cost of 6 for VF 2 For instruction: %10 = load i8
1133
1132
; CHECK: LV: Found an estimated cost of 0 for VF 2 For instruction: %11 = zext i8
1134
1133
; CHECK: LV: Found an estimated cost of 14 for VF 2 For instruction: store i32
1135
1134
; CHECK: LV: Vector loop of width 2 costs: 35.
1136
1135
; CHECK: LV: Found an estimated cost of 18 for VF 4 For instruction: %10 = load i8
1137
1136
; CHECK: LV: Found an estimated cost of 2 for VF 4 For instruction: %11 = zext i8
1138
- ; CHECK: LV: Found an estimated cost of 36 for VF 4 For instruction: store i32
1139
- ; CHECK: LV: Vector loop of width 4 costs: 23.
1140
- ; CHECK: LV: Selecting VF: 1.
1137
+ ; CHECK: LV: Found an estimated cost of 24 for VF 4 For instruction: store i32
1138
+ ; CHECK: LV: Vector loop of width 4 costs: 20.
1139
+ ; CHECK: LV: Selecting VF: 4.
1141
1140
define hidden void @four_bytes_into_four_ints_vary_op (ptr noalias nocapture noundef writeonly %0 , ptr nocapture noundef readonly %1 , ptr nocapture noundef readonly %2 , i32 noundef %3 ) {
1142
1141
%5 = icmp eq i32 %3 , 0
1143
1142
br i1 %5 , label %6 , label %7
0 commit comments