1 /*
2  * Copyright (C) 2017 The Android Open Source Project
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *      http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 
/**
 * Tests for halving-add idiomatic vectorization on {@code char} arrays.
 *
 * Each kernel below computes {@code (a + b) >> 1} or {@code (a + b + 1) >> 1} in int
 * arithmetic and narrows the result back to {@code char}. The {@code /// CHECK} comment
 * lines in front of every kernel are test expectations on the compiler graph (scalar form
 * before loop optimization, VecHalvingAdd form afterwards), so the kernel loop bodies
 * must not be restructured without updating those expectations.
 */
public class HaddChar {

  // Base element count of the test arrays.
  private static final int N = 64 * 1024;
  // Actual array length: some extra elements beyond N so the cleanup loop is exercised too.
  private static final int M = N + 31;

  // Input operands (sB1, sB2) and shared output buffer (sBo) used by main().
  static char[] sB1 = new char[M];
  static char[] sB2 = new char[M];
  static char[] sBo = new char[M];

  /// CHECK-START: void HaddChar.halving_add_unsigned(char[], char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>>  Add [<<Get1>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add>>,<<I1>>]                loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM: void HaddChar.halving_add_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddChar.halving_add_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-IF:     hasIsaFeature("sve")
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  //
  // Truncating halving add: bo[i] = (b1[i] + b2[i]) >> 1 over the common prefix of the
  // three arrays. The sum is formed in int, so it cannot wrap before the shift.
  //
  private static void halving_add_unsigned(char[] b1, char[] b2, char[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) ((b1[i] + b2[i]) >> 1);
    }
  }

  /// CHECK-START: void HaddChar.halving_add_also_unsigned(char[], char[], char[]) instruction_simplifier (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<IMAX:i\d+>> IntConstant 65535                   loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<And1:i\d+>> And [<<Get1>>,<<IMAX>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<And2:i\d+>> And [<<IMAX>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>>  Add [<<And1>>,<<And2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add>>,<<I1>>]                loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START: void HaddChar.halving_add_also_unsigned(char[], char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>>  Add [<<Get1>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add>>,<<I1>>]                loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM: void HaddChar.halving_add_also_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddChar.halving_add_also_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-IF:     hasIsaFeature("sve")
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  //
  // Same computation as halving_add_unsigned, with an explicit "& 0xffff" on each operand.
  // Note: HAnd has no impact (already a zero extension).
  //
  private static void halving_add_also_unsigned(char[] b1, char[] b2, char[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) (((b1[i] & 0xffff) + (b2[i] & 0xffff)) >> 1);
    }
  }

  /// CHECK-START: void HaddChar.rounding_halving_add_unsigned(char[], char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add2>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM: void HaddChar.rounding_halving_add_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddChar.rounding_halving_add_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-IF:     hasIsaFeature("sve")
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  //
  // Rounding halving add: bo[i] = (b1[i] + b2[i] + 1) >> 1 over the common prefix of the
  // three arrays.
  //
  private static void rounding_halving_add_unsigned(char[] b1, char[] b2, char[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) ((b1[i] + b2[i] + 1) >> 1);
    }
  }

  /// CHECK-START: void HaddChar.rounding_halving_add_also_unsigned(char[], char[], char[]) instruction_simplifier (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<IMAX:i\d+>> IntConstant 65535                   loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<And1:i\d+>> And [<<Get1>>,<<IMAX>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<And2:i\d+>> And [<<IMAX>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add1:i\d+>> Add [<<And1>>,<<And2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add2>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START: void HaddChar.rounding_halving_add_also_unsigned(char[], char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add2>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM: void HaddChar.rounding_halving_add_also_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddChar.rounding_halving_add_also_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-IF:     hasIsaFeature("sve")
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  //
  // Same computation as rounding_halving_add_unsigned, with an explicit "& 0xffff" on each
  // operand.
  // Note: HAnd has no impact (already a zero extension).
  //
  private static void rounding_halving_add_also_unsigned(char[] b1, char[] b2, char[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) (((b1[i] & 0xffff) + (b2[i] & 0xffff) + 1) >> 1);
    }
  }

  /// CHECK-START: void HaddChar.halving_add_unsigned_constant(char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                   loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get:c\d+>>  ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>>  Add [<<Get>>,<<UMAX>>]              loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add>>,<<I1>>]                loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM: void HaddChar.halving_add_unsigned_constant(char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                     loop:none
  /// CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>]         loop:none
  /// CHECK-DAG: <<Get:d\d+>>  VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddChar.halving_add_unsigned_constant(char[], char[]) loop_optimization (after)
  /// CHECK-IF:     hasIsaFeature("sve")
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                     loop:none
  ///     CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>]         loop:none
  ///     CHECK-DAG: <<Get:d\d+>>  VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  //
  // Truncating halving add against the constant 0xffff: bo[i] = (b1[i] + 0xffff) >> 1 over
  // the common prefix of both arrays.
  //
  private static void halving_add_unsigned_constant(char[] b1, char[] bo) {
    int min_length = Math.min(bo.length, b1.length);
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) ((b1[i] + 0xffff) >> 1);
    }
  }

  /// CHECK-START: void HaddChar.halving_add_also_unsigned_constant(char[], char[]) instruction_simplifier (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                   loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get:c\d+>>  ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<And:i\d+>>  And [<<Get>>,<<UMAX>>]              loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>>  Add [<<And>>,<<UMAX>>]              loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add>>,<<I1>>]                loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START: void HaddChar.halving_add_also_unsigned_constant(char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                   loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get:c\d+>>  ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>>  Add [<<Get>>,<<UMAX>>]              loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add>>,<<I1>>]                loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM: void HaddChar.halving_add_also_unsigned_constant(char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                     loop:none
  /// CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>]         loop:none
  /// CHECK-DAG: <<Get:d\d+>>  VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddChar.halving_add_also_unsigned_constant(char[], char[]) loop_optimization (after)
  /// CHECK-IF:     hasIsaFeature("sve")
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                     loop:none
  ///     CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>]         loop:none
  ///     CHECK-DAG: <<Get:d\d+>>  VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  //
  // Same computation as halving_add_unsigned_constant, with an explicit "& 0xffff" on the
  // array operand.
  // Note: HAnd has no impact (already a zero extension).
  //
  private static void halving_add_also_unsigned_constant(char[] b1, char[] bo) {
    int min_length = Math.min(bo.length, b1.length);
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) (((b1[i] & 0xffff) + 0xffff) >> 1);
    }
  }

  // Overwrites the shared output buffer with a filler value. Consecutive kernels in main()
  // have identical expected results, so without this a kernel that stored nothing would
  // still pass on the values left behind by the previous kernel.
  private static void resetOutput() {
    java.util.Arrays.fill(sBo, (char) 0x5a5a);
  }

  /**
   * Runs every kernel over the static test arrays and compares each output element with
   * the same expression evaluated element by element here.
   *
   * Prints "HaddChar passed" on success; throws {@link Error} (via expectEquals) on the
   * first mismatch.
   */
  public static void main() {
    // Some interesting values.
    char[] interesting = {
      (char) 0x0000,
      (char) 0x0001,
      (char) 0x0002,
      (char) 0x1234,
      (char) 0x8000,
      (char) 0x8001,
      (char) 0x7fff,
      (char) 0xffff
    };
    // Initialize cross-values to test all cases, and also
    // set up some extra values to exercise the cleanup loop.
    for (int i = 0; i < M; i++) {
      sB1[i] = (char) i;
      sB2[i] = interesting[i & 7];
    }

    // Test halving add idioms.
    resetOutput();
    halving_add_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + sB2[i]) >> 1);
      expectEquals(e, sBo[i]);
    }
    resetOutput();
    halving_add_also_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + sB2[i]) >> 1);
      expectEquals(e, sBo[i]);
    }
    resetOutput();
    rounding_halving_add_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + sB2[i] + 1) >> 1);
      expectEquals(e, sBo[i]);
    }
    resetOutput();
    rounding_halving_add_also_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + sB2[i] + 1) >> 1);
      expectEquals(e, sBo[i]);
    }
    resetOutput();
    halving_add_unsigned_constant(sB1, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + 0xffff) >> 1);
      expectEquals(e, sBo[i]);
    }
    resetOutput();
    halving_add_also_unsigned_constant(sB1, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + 0xffff) >> 1);
      expectEquals(e, sBo[i]);
    }

    System.out.println("HaddChar passed");
  }

  // Throws an Error naming both values when they differ; does nothing otherwise.
  private static void expectEquals(int expected, int result) {
    if (expected != result) {
      throw new Error("Expected: " + expected + ", found: " + result);
    }
  }
}
363