1.1 --- /dev/null Thu Jan 01 00:00:00 1970 +0000 1.2 +++ b/test/compiler/6340864/TestShortVect.java Wed Apr 27 01:25:04 2016 +0800 1.3 @@ -0,0 +1,1340 @@ 1.4 +/* 1.5 + * Copyright (c) 2012, Oracle and/or its affiliates. All rights reserved. 1.6 + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. 1.7 + * 1.8 + * This code is free software; you can redistribute it and/or modify it 1.9 + * under the terms of the GNU General Public License version 2 only, as 1.10 + * published by the Free Software Foundation. 1.11 + * 1.12 + * This code is distributed in the hope that it will be useful, but WITHOUT 1.13 + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 1.14 + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License 1.15 + * version 2 for more details (a copy is included in the LICENSE file that 1.16 + * accompanied this code). 1.17 + * 1.18 + * You should have received a copy of the GNU General Public License version 1.19 + * 2 along with this work; if not, write to the Free Software Foundation, 1.20 + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. 1.21 + * 1.22 + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA 1.23 + * or visit www.oracle.com if you need additional information or have any 1.24 + * questions. 1.25 + * 1.26 + */ 1.27 + 1.28 +/** 1.29 + * @test 1.30 + * @bug 6340864 1.31 + * @summary Implement vectorization optimizations in hotspot-server 1.32 + * 1.33 + * @run main/othervm/timeout=400 -Xbatch -Xmx64m TestShortVect 1.34 + */ 1.35 + 1.36 +public class TestShortVect { 1.37 + private static final int ARRLEN = 997; 1.38 + private static final int ITERS = 11000; 1.39 + private static final int ADD_INIT = Short.MAX_VALUE-500; 1.40 + private static final int BIT_MASK = 0xB731; 1.41 + private static final int VALUE = 7; 1.42 + private static final int SHIFT = 16; 1.43 + 1.44 + public static void main(String args[]) { 1.45 + System.out.println("Testing Short vectors"); 1.46 + int errn = test(); 1.47 + if (errn > 0) { 1.48 + System.err.println("FAILED: " + errn + " errors"); 1.49 + System.exit(97); 1.50 + } 1.51 + System.out.println("PASSED"); 1.52 + } 1.53 + 1.54 + static int test() { 1.55 + short[] a0 = new short[ARRLEN]; 1.56 + short[] a1 = new short[ARRLEN]; 1.57 + short[] a2 = new short[ARRLEN]; 1.58 + short[] a3 = new short[ARRLEN]; 1.59 + short[] a4 = new short[ARRLEN]; 1.60 + int[] p2 = new int[ARRLEN/2]; 1.61 + long[] p4 = new long[ARRLEN/4]; 1.62 + // Initialize 1.63 + int gold_sum = 0; 1.64 + for (int i=0; i<ARRLEN; i++) { 1.65 + short val = (short)(ADD_INIT+i); 1.66 + gold_sum += val; 1.67 + a1[i] = val; 1.68 + a2[i] = (short)VALUE; 1.69 + a3[i] = (short)-VALUE; 1.70 + a4[i] = (short)BIT_MASK; 1.71 + } 1.72 + System.out.println("Warmup"); 1.73 + for (int i=0; i<ITERS; i++) { 1.74 + test_sum(a1); 1.75 + test_addc(a0, a1); 1.76 + test_addv(a0, a1, (short)VALUE); 1.77 + test_adda(a0, a1, a2); 1.78 + test_subc(a0, a1); 1.79 + test_subv(a0, a1, (short)VALUE); 1.80 + test_suba(a0, a1, a2); 1.81 + 1.82 + test_mulc(a0, a1); 1.83 + test_mulv(a0, a1, (short)VALUE); 1.84 + test_mula(a0, a1, a2); 1.85 + test_divc(a0, a1); 1.86 + test_divv(a0, a1, (short)VALUE); 1.87 + test_diva(a0, a1, a2); 1.88 + test_mulc_n(a0, a1); 1.89 + test_mulv(a0, a1, (short)-VALUE); 1.90 + test_mula(a0, a1, a3); 1.91 + test_divc_n(a0, a1); 1.92 + test_divv(a0, a1, (short)-VALUE); 1.93 + test_diva(a0, a1, a3); 1.94 + 1.95 + test_andc(a0, a1); 1.96 + test_andv(a0, a1, (short)BIT_MASK); 1.97 + test_anda(a0, a1, a4); 1.98 + test_orc(a0, a1); 1.99 + test_orv(a0, a1, (short)BIT_MASK); 1.100 + test_ora(a0, a1, a4); 1.101 + test_xorc(a0, a1); 1.102 + test_xorv(a0, a1, (short)BIT_MASK); 1.103 + test_xora(a0, a1, a4); 1.104 + 1.105 + test_sllc(a0, a1); 1.106 + test_sllv(a0, a1, VALUE); 1.107 + test_srlc(a0, a1); 1.108 + test_srlv(a0, a1, VALUE); 1.109 + test_srac(a0, a1); 1.110 + test_srav(a0, a1, VALUE); 1.111 + 1.112 + test_sllc_n(a0, a1); 1.113 + test_sllv(a0, a1, -VALUE); 1.114 + test_srlc_n(a0, a1); 1.115 + test_srlv(a0, a1, -VALUE); 1.116 + test_srac_n(a0, a1); 1.117 + test_srav(a0, a1, -VALUE); 1.118 + 1.119 + test_sllc_o(a0, a1); 1.120 + test_sllv(a0, a1, SHIFT); 1.121 + test_srlc_o(a0, a1); 1.122 + test_srlv(a0, a1, SHIFT); 1.123 + test_srac_o(a0, a1); 1.124 + test_srav(a0, a1, SHIFT); 1.125 + 1.126 + test_sllc_on(a0, a1); 1.127 + test_sllv(a0, a1, -SHIFT); 1.128 + test_srlc_on(a0, a1); 1.129 + test_srlv(a0, a1, -SHIFT); 1.130 + test_srac_on(a0, a1); 1.131 + test_srav(a0, a1, -SHIFT); 1.132 + 1.133 + test_sllc_add(a0, a1); 1.134 + test_sllv_add(a0, a1, ADD_INIT); 1.135 + test_srlc_add(a0, a1); 1.136 + test_srlv_add(a0, a1, ADD_INIT); 1.137 + test_srac_add(a0, a1); 1.138 + test_srav_add(a0, a1, ADD_INIT); 1.139 + 1.140 + test_sllc_and(a0, a1); 1.141 + test_sllv_and(a0, a1, BIT_MASK); 1.142 + test_srlc_and(a0, a1); 1.143 + test_srlv_and(a0, a1, BIT_MASK); 1.144 + test_srac_and(a0, a1); 1.145 + test_srav_and(a0, a1, BIT_MASK); 1.146 + 1.147 + test_pack2(p2, a1); 1.148 + test_unpack2(a0, p2); 1.149 + test_pack2_swap(p2, a1); 1.150 + test_unpack2_swap(a0, p2); 1.151 + test_pack4(p4, a1); 1.152 + test_unpack4(a0, p4); 1.153 + test_pack4_swap(p4, a1); 1.154 + test_unpack4_swap(a0, p4); 1.155 + } 1.156 + // Test and verify results 1.157 + System.out.println("Verification"); 1.158 + int errn = 0; 1.159 + { 1.160 + int sum = test_sum(a1); 1.161 + if (sum != gold_sum) { 1.162 + System.err.println("test_sum: " + sum + " != " + gold_sum); 1.163 + errn++; 1.164 + } 1.165 + 1.166 + test_addc(a0, a1); 1.167 + for (int i=0; i<ARRLEN; i++) { 1.168 + errn += verify("test_addc: ", i, a0[i], (short)((short)(ADD_INIT+i)+VALUE)); 1.169 + } 1.170 + test_addv(a0, a1, (short)VALUE); 1.171 + for (int i=0; i<ARRLEN; i++) { 1.172 + errn += verify("test_addv: ", i, a0[i], (short)((short)(ADD_INIT+i)+VALUE)); 1.173 + } 1.174 + test_adda(a0, a1, a2); 1.175 + for (int i=0; i<ARRLEN; i++) { 1.176 + errn += verify("test_adda: ", i, a0[i], (short)((short)(ADD_INIT+i)+VALUE)); 1.177 + } 1.178 + 1.179 + test_subc(a0, a1); 1.180 + for (int i=0; i<ARRLEN; i++) { 1.181 + errn += verify("test_subc: ", i, a0[i], (short)((short)(ADD_INIT+i)-VALUE)); 1.182 + } 1.183 + test_subv(a0, a1, (short)VALUE); 1.184 + for (int i=0; i<ARRLEN; i++) { 1.185 + errn += verify("test_subv: ", i, a0[i], (short)((short)(ADD_INIT+i)-VALUE)); 1.186 + } 1.187 + test_suba(a0, a1, a2); 1.188 + for (int i=0; i<ARRLEN; i++) { 1.189 + errn += verify("test_suba: ", i, a0[i], (short)((short)(ADD_INIT+i)-VALUE)); 1.190 + } 1.191 + 1.192 + test_mulc(a0, a1); 1.193 + for (int i=0; i<ARRLEN; i++) { 1.194 + errn += verify("test_mulc: ", i, a0[i], (short)((short)(ADD_INIT+i)*VALUE)); 1.195 + } 1.196 + test_mulv(a0, a1, (short)VALUE); 1.197 + for (int i=0; i<ARRLEN; i++) { 1.198 + errn += verify("test_mulv: ", i, a0[i], (short)((short)(ADD_INIT+i)*VALUE)); 1.199 + } 1.200 + test_mula(a0, a1, a2); 1.201 + for (int i=0; i<ARRLEN; i++) { 1.202 + errn += verify("test_mula: ", i, a0[i], (short)((short)(ADD_INIT+i)*VALUE)); 1.203 + } 1.204 + 1.205 + test_divc(a0, a1); 1.206 + for (int i=0; i<ARRLEN; i++) { 1.207 + errn += verify("test_divc: ", i, a0[i], (short)((short)(ADD_INIT+i)/VALUE)); 1.208 + } 1.209 + test_divv(a0, a1, (short)VALUE); 1.210 + for (int i=0; i<ARRLEN; i++) { 1.211 + errn += verify("test_divv: ", i, a0[i], (short)((short)(ADD_INIT+i)/VALUE)); 1.212 + } 1.213 + test_diva(a0, a1, a2); 1.214 + for (int i=0; i<ARRLEN; i++) { 1.215 + errn += verify("test_diva: ", i, a0[i], (short)((short)(ADD_INIT+i)/VALUE)); 1.216 + } 1.217 + 1.218 + test_mulc_n(a0, a1); 1.219 + for (int i=0; i<ARRLEN; i++) { 1.220 + errn += verify("test_mulc_n: ", i, a0[i], (short)((short)(ADD_INIT+i)*(-VALUE))); 1.221 + } 1.222 + test_mulv(a0, a1, (short)-VALUE); 1.223 + for (int i=0; i<ARRLEN; i++) { 1.224 + errn += verify("test_mulv_n: ", i, a0[i], (short)((short)(ADD_INIT+i)*(-VALUE))); 1.225 + } 1.226 + test_mula(a0, a1, a3); 1.227 + for (int i=0; i<ARRLEN; i++) { 1.228 + errn += verify("test_mula_n: ", i, a0[i], (short)((short)(ADD_INIT+i)*(-VALUE))); 1.229 + } 1.230 + 1.231 + test_divc_n(a0, a1); 1.232 + for (int i=0; i<ARRLEN; i++) { 1.233 + errn += verify("test_divc_n: ", i, a0[i], (short)((short)(ADD_INIT+i)/(-VALUE))); 1.234 + } 1.235 + test_divv(a0, a1, (short)-VALUE); 1.236 + for (int i=0; i<ARRLEN; i++) { 1.237 + errn += verify("test_divv_n: ", i, a0[i], (short)((short)(ADD_INIT+i)/(-VALUE))); 1.238 + } 1.239 + test_diva(a0, a1, a3); 1.240 + for (int i=0; i<ARRLEN; i++) { 1.241 + errn += verify("test_diva_n: ", i, a0[i], (short)((short)(ADD_INIT+i)/(-VALUE))); 1.242 + } 1.243 + 1.244 + test_andc(a0, a1); 1.245 + for (int i=0; i<ARRLEN; i++) { 1.246 + errn += verify("test_andc: ", i, a0[i], (short)((short)(ADD_INIT+i)&BIT_MASK)); 1.247 + } 1.248 + test_andv(a0, a1, (short)BIT_MASK); 1.249 + for (int i=0; i<ARRLEN; i++) { 1.250 + errn += verify("test_andv: ", i, a0[i], (short)((short)(ADD_INIT+i)&BIT_MASK)); 1.251 + } 1.252 + test_anda(a0, a1, a4); 1.253 + for (int i=0; i<ARRLEN; i++) { 1.254 + errn += verify("test_anda: ", i, a0[i], (short)((short)(ADD_INIT+i)&BIT_MASK)); 1.255 + } 1.256 + 1.257 + test_orc(a0, a1); 1.258 + for (int i=0; i<ARRLEN; i++) { 1.259 + errn += verify("test_orc: ", i, a0[i], (short)((short)(ADD_INIT+i)|BIT_MASK)); 1.260 + } 1.261 + test_orv(a0, a1, (short)BIT_MASK); 1.262 + for (int i=0; i<ARRLEN; i++) { 1.263 + errn += verify("test_orv: ", i, a0[i], (short)((short)(ADD_INIT+i)|BIT_MASK)); 1.264 + } 1.265 + test_ora(a0, a1, a4); 1.266 + for (int i=0; i<ARRLEN; i++) { 1.267 + errn += verify("test_ora: ", i, a0[i], (short)((short)(ADD_INIT+i)|BIT_MASK)); 1.268 + } 1.269 + 1.270 + test_xorc(a0, a1); 1.271 + for (int i=0; i<ARRLEN; i++) { 1.272 + errn += verify("test_xorc: ", i, a0[i], (short)((short)(ADD_INIT+i)^BIT_MASK)); 1.273 + } 1.274 + test_xorv(a0, a1, (short)BIT_MASK); 1.275 + for (int i=0; i<ARRLEN; i++) { 1.276 + errn += verify("test_xorv: ", i, a0[i], (short)((short)(ADD_INIT+i)^BIT_MASK)); 1.277 + } 1.278 + test_xora(a0, a1, a4); 1.279 + for (int i=0; i<ARRLEN; i++) { 1.280 + errn += verify("test_xora: ", i, a0[i], (short)((short)(ADD_INIT+i)^BIT_MASK)); 1.281 + } 1.282 + 1.283 + test_sllc(a0, a1); 1.284 + for (int i=0; i<ARRLEN; i++) { 1.285 + errn += verify("test_sllc: ", i, a0[i], (short)((short)(ADD_INIT+i)<<VALUE)); 1.286 + } 1.287 + test_sllv(a0, a1, VALUE); 1.288 + for (int i=0; i<ARRLEN; i++) { 1.289 + errn += verify("test_sllv: ", i, a0[i], (short)((short)(ADD_INIT+i)<<VALUE)); 1.290 + } 1.291 + 1.292 + test_srlc(a0, a1); 1.293 + for (int i=0; i<ARRLEN; i++) { 1.294 + errn += verify("test_srlc: ", i, a0[i], (short)((short)(ADD_INIT+i)>>>VALUE)); 1.295 + } 1.296 + test_srlv(a0, a1, VALUE); 1.297 + for (int i=0; i<ARRLEN; i++) { 1.298 + errn += verify("test_srlv: ", i, a0[i], (short)((short)(ADD_INIT+i)>>>VALUE)); 1.299 + } 1.300 + 1.301 + test_srac(a0, a1); 1.302 + for (int i=0; i<ARRLEN; i++) { 1.303 + errn += verify("test_srac: ", i, a0[i], (short)((short)(ADD_INIT+i)>>VALUE)); 1.304 + } 1.305 + test_srav(a0, a1, VALUE); 1.306 + for (int i=0; i<ARRLEN; i++) { 1.307 + errn += verify("test_srav: ", i, a0[i], (short)((short)(ADD_INIT+i)>>VALUE)); 1.308 + } 1.309 + 1.310 + test_sllc_n(a0, a1); 1.311 + for (int i=0; i<ARRLEN; i++) { 1.312 + errn += verify("test_sllc_n: ", i, a0[i], (short)((short)(ADD_INIT+i)<<(-VALUE))); 1.313 + } 1.314 + test_sllv(a0, a1, -VALUE); 1.315 + for (int i=0; i<ARRLEN; i++) { 1.316 + errn += verify("test_sllv_n: ", i, a0[i], (short)((short)(ADD_INIT+i)<<(-VALUE))); 1.317 + } 1.318 + 1.319 + test_srlc_n(a0, a1); 1.320 + for (int i=0; i<ARRLEN; i++) { 1.321 + errn += verify("test_srlc_n: ", i, a0[i], (short)((short)(ADD_INIT+i)>>>(-VALUE))); 1.322 + } 1.323 + test_srlv(a0, a1, -VALUE); 1.324 + for (int i=0; i<ARRLEN; i++) { 1.325 + errn += verify("test_srlv_n: ", i, a0[i], (short)((short)(ADD_INIT+i)>>>(-VALUE))); 1.326 + } 1.327 + 1.328 + test_srac_n(a0, a1); 1.329 + for (int i=0; i<ARRLEN; i++) { 1.330 + errn += verify("test_srac_n: ", i, a0[i], (short)((short)(ADD_INIT+i)>>(-VALUE))); 1.331 + } 1.332 + test_srav(a0, a1, -VALUE); 1.333 + for (int i=0; i<ARRLEN; i++) { 1.334 + errn += verify("test_srav_n: ", i, a0[i], (short)((short)(ADD_INIT+i)>>(-VALUE))); 1.335 + } 1.336 + 1.337 + test_sllc_o(a0, a1); 1.338 + for (int i=0; i<ARRLEN; i++) { 1.339 + errn += verify("test_sllc_o: ", i, a0[i], (short)((short)(ADD_INIT+i)<<SHIFT)); 1.340 + } 1.341 + test_sllv(a0, a1, SHIFT); 1.342 + for (int i=0; i<ARRLEN; i++) { 1.343 + errn += verify("test_sllv_o: ", i, a0[i], (short)((short)(ADD_INIT+i)<<SHIFT)); 1.344 + } 1.345 + 1.346 + test_srlc_o(a0, a1); 1.347 + for (int i=0; i<ARRLEN; i++) { 1.348 + errn += verify("test_srlc_o: ", i, a0[i], (short)((short)(ADD_INIT+i)>>>SHIFT)); 1.349 + } 1.350 + test_srlv(a0, a1, SHIFT); 1.351 + for (int i=0; i<ARRLEN; i++) { 1.352 + errn += verify("test_srlv_o: ", i, a0[i], (short)((short)(ADD_INIT+i)>>>SHIFT)); 1.353 + } 1.354 + 1.355 + test_srac_o(a0, a1); 1.356 + for (int i=0; i<ARRLEN; i++) { 1.357 + errn += verify("test_srac_o: ", i, a0[i], (short)((short)(ADD_INIT+i)>>SHIFT)); 1.358 + } 1.359 + test_srav(a0, a1, SHIFT); 1.360 + for (int i=0; i<ARRLEN; i++) { 1.361 + errn += verify("test_srav_o: ", i, a0[i], (short)((short)(ADD_INIT+i)>>SHIFT)); 1.362 + } 1.363 + 1.364 + test_sllc_on(a0, a1); 1.365 + for (int i=0; i<ARRLEN; i++) { 1.366 + errn += verify("test_sllc_on: ", i, a0[i], (short)((short)(ADD_INIT+i)<<(-SHIFT))); 1.367 + } 1.368 + test_sllv(a0, a1, -SHIFT); 1.369 + for (int i=0; i<ARRLEN; i++) { 1.370 + errn += verify("test_sllv_on: ", i, a0[i], (short)((short)(ADD_INIT+i)<<(-SHIFT))); 1.371 + } 1.372 + 1.373 + test_srlc_on(a0, a1); 1.374 + for (int i=0; i<ARRLEN; i++) { 1.375 + errn += verify("test_srlc_on: ", i, a0[i], (short)((short)(ADD_INIT+i)>>>(-SHIFT))); 1.376 + } 1.377 + test_srlv(a0, a1, -SHIFT); 1.378 + for (int i=0; i<ARRLEN; i++) { 1.379 + errn += verify("test_srlv_on: ", i, a0[i], (short)((short)(ADD_INIT+i)>>>(-SHIFT))); 1.380 + } 1.381 + 1.382 + test_srac_on(a0, a1); 1.383 + for (int i=0; i<ARRLEN; i++) { 1.384 + errn += verify("test_srac_on: ", i, a0[i], (short)((short)(ADD_INIT+i)>>(-SHIFT))); 1.385 + } 1.386 + test_srav(a0, a1, -SHIFT); 1.387 + for (int i=0; i<ARRLEN; i++) { 1.388 + errn += verify("test_srav_on: ", i, a0[i], (short)((short)(ADD_INIT+i)>>(-SHIFT))); 1.389 + } 1.390 + 1.391 + test_sllc_add(a0, a1); 1.392 + for (int i=0; i<ARRLEN; i++) { 1.393 + errn += verify("test_sllc_add: ", i, a0[i], (short)(((short)(ADD_INIT+i) + ADD_INIT)<<VALUE)); 1.394 + } 1.395 + test_sllv_add(a0, a1, ADD_INIT); 1.396 + for (int i=0; i<ARRLEN; i++) { 1.397 + errn += verify("test_sllv_add: ", i, a0[i], (short)(((short)(ADD_INIT+i) + ADD_INIT)<<VALUE)); 1.398 + } 1.399 + 1.400 + test_srlc_add(a0, a1); 1.401 + for (int i=0; i<ARRLEN; i++) { 1.402 + errn += verify("test_srlc_add: ", i, a0[i], (short)(((short)(ADD_INIT+i) + ADD_INIT)>>>VALUE)); 1.403 + } 1.404 + test_srlv_add(a0, a1, ADD_INIT); 1.405 + for (int i=0; i<ARRLEN; i++) { 1.406 + errn += verify("test_srlv_add: ", i, a0[i], (short)(((short)(ADD_INIT+i) + ADD_INIT)>>>VALUE)); 1.407 + } 1.408 + 1.409 + test_srac_add(a0, a1); 1.410 + for (int i=0; i<ARRLEN; i++) { 1.411 + errn += verify("test_srac_add: ", i, a0[i], (short)(((short)(ADD_INIT+i) + ADD_INIT)>>VALUE)); 1.412 + } 1.413 + test_srav_add(a0, a1, ADD_INIT); 1.414 + for (int i=0; i<ARRLEN; i++) { 1.415 + errn += verify("test_srav_add: ", i, a0[i], (short)(((short)(ADD_INIT+i) + ADD_INIT)>>VALUE)); 1.416 + } 1.417 + 1.418 + test_sllc_and(a0, a1); 1.419 + for (int i=0; i<ARRLEN; i++) { 1.420 + errn += verify("test_sllc_and: ", i, a0[i], (short)(((short)(ADD_INIT+i) & BIT_MASK)<<VALUE)); 1.421 + } 1.422 + test_sllv_and(a0, a1, BIT_MASK); 1.423 + for (int i=0; i<ARRLEN; i++) { 1.424 + errn += verify("test_sllv_and: ", i, a0[i], (short)(((short)(ADD_INIT+i) & BIT_MASK)<<VALUE)); 1.425 + } 1.426 + 1.427 + test_srlc_and(a0, a1); 1.428 + for (int i=0; i<ARRLEN; i++) { 1.429 + errn += verify("test_srlc_and: ", i, a0[i], (short)(((short)(ADD_INIT+i) & BIT_MASK)>>>VALUE)); 1.430 + } 1.431 + test_srlv_and(a0, a1, BIT_MASK); 1.432 + for (int i=0; i<ARRLEN; i++) { 1.433 + errn += verify("test_srlv_and: ", i, a0[i], (short)(((short)(ADD_INIT+i) & BIT_MASK)>>>VALUE)); 1.434 + } 1.435 + 1.436 + test_srac_and(a0, a1); 1.437 + for (int i=0; i<ARRLEN; i++) { 1.438 + errn += verify("test_srac_and: ", i, a0[i], (short)(((short)(ADD_INIT+i) & BIT_MASK)>>VALUE)); 1.439 + } 1.440 + test_srav_and(a0, a1, BIT_MASK); 1.441 + for (int i=0; i<ARRLEN; i++) { 1.442 + errn += verify("test_srav_and: ", i, a0[i], (short)(((short)(ADD_INIT+i) & BIT_MASK)>>VALUE)); 1.443 + } 1.444 + 1.445 + test_pack2(p2, a1); 1.446 + for (int i=0; i<ARRLEN/2; i++) { 1.447 + errn += verify("test_pack2: ", i, p2[i], ((int)(ADD_INIT+2*i) & 0xFFFF) | ((int)(ADD_INIT+2*i+1) << 16)); 1.448 + } 1.449 + for (int i=0; i<ARRLEN; i++) { 1.450 + a0[i] = -1; 1.451 + } 1.452 + test_unpack2(a0, p2); 1.453 + for (int i=0; i<(ARRLEN&(-2)); i++) { 1.454 + errn += verify("test_unpack2: ", i, a0[i], (short)(ADD_INIT+i)); 1.455 + } 1.456 + 1.457 + test_pack2_swap(p2, a1); 1.458 + for (int i=0; i<ARRLEN/2; i++) { 1.459 + errn += verify("test_pack2_swap: ", i, p2[i], ((int)(ADD_INIT+2*i+1) & 0xFFFF) | ((int)(ADD_INIT+2*i) << 16)); 1.460 + } 1.461 + for (int i=0; i<ARRLEN; i++) { 1.462 + a0[i] = -1; 1.463 + } 1.464 + test_unpack2_swap(a0, p2); 1.465 + for (int i=0; i<(ARRLEN&(-2)); i++) { 1.466 + errn += verify("test_unpack2_swap: ", i, a0[i], (short)(ADD_INIT+i)); 1.467 + } 1.468 + 1.469 + test_pack4(p4, a1); 1.470 + for (int i=0; i<ARRLEN/4; i++) { 1.471 + errn += verify("test_pack4: ", i, p4[i], ((long)(ADD_INIT+4*i+0) & 0xFFFFl) | 1.472 + (((long)(ADD_INIT+4*i+1) & 0xFFFFl) << 16) | 1.473 + (((long)(ADD_INIT+4*i+2) & 0xFFFFl) << 32) | 1.474 + (((long)(ADD_INIT+4*i+3) & 0xFFFFl) << 48)); 1.475 + } 1.476 + for (int i=0; i<ARRLEN; i++) { 1.477 + a0[i] = -1; 1.478 + } 1.479 + test_unpack4(a0, p4); 1.480 + for (int i=0; i<(ARRLEN&(-4)); i++) { 1.481 + errn += verify("test_unpack4: ", i, a0[i], (short)(ADD_INIT+i)); 1.482 + } 1.483 + 1.484 + test_pack4_swap(p4, a1); 1.485 + for (int i=0; i<ARRLEN/4; i++) { 1.486 + errn += verify("test_pack4_swap: ", i, p4[i], ((long)(ADD_INIT+4*i+3) & 0xFFFFl) | 1.487 + (((long)(ADD_INIT+4*i+2) & 0xFFFFl) << 16) | 1.488 + (((long)(ADD_INIT+4*i+1) & 0xFFFFl) << 32) | 1.489 + (((long)(ADD_INIT+4*i+0) & 0xFFFFl) << 48)); 1.490 + } 1.491 + for (int i=0; i<ARRLEN; i++) { 1.492 + a0[i] = -1; 1.493 + } 1.494 + test_unpack4_swap(a0, p4); 1.495 + for (int i=0; i<(ARRLEN&(-4)); i++) { 1.496 + errn += verify("test_unpack4_swap: ", i, a0[i], (short)(ADD_INIT+i)); 1.497 + } 1.498 + 1.499 + } 1.500 + 1.501 + if (errn > 0) 1.502 + return errn; 1.503 + 1.504 + System.out.println("Time"); 1.505 + long start, end; 1.506 + 1.507 + start = System.currentTimeMillis(); 1.508 + for (int i=0; i<ITERS; i++) { 1.509 + test_sum(a1); 1.510 + } 1.511 + end = System.currentTimeMillis(); 1.512 + System.out.println("test_sum: " + (end - start)); 1.513 + 1.514 + start = System.currentTimeMillis(); 1.515 + for (int i=0; i<ITERS; i++) { 1.516 + test_addc(a0, a1); 1.517 + } 1.518 + end = System.currentTimeMillis(); 1.519 + System.out.println("test_addc: " + (end - start)); 1.520 + start = System.currentTimeMillis(); 1.521 + for (int i=0; i<ITERS; i++) { 1.522 + test_addv(a0, a1, (short)VALUE); 1.523 + } 1.524 + end = System.currentTimeMillis(); 1.525 + System.out.println("test_addv: " + (end - start)); 1.526 + start = System.currentTimeMillis(); 1.527 + for (int i=0; i<ITERS; i++) { 1.528 + test_adda(a0, a1, a2); 1.529 + } 1.530 + end = System.currentTimeMillis(); 1.531 + System.out.println("test_adda: " + (end - start)); 1.532 + 1.533 + start = System.currentTimeMillis(); 1.534 + for (int i=0; i<ITERS; i++) { 1.535 + test_subc(a0, a1); 1.536 + } 1.537 + end = System.currentTimeMillis(); 1.538 + System.out.println("test_subc: " + (end - start)); 1.539 + start = System.currentTimeMillis(); 1.540 + for (int i=0; i<ITERS; i++) { 1.541 + test_subv(a0, a1, (short)VALUE); 1.542 + } 1.543 + end = System.currentTimeMillis(); 1.544 + System.out.println("test_subv: " + (end - start)); 1.545 + start = System.currentTimeMillis(); 1.546 + for (int i=0; i<ITERS; i++) { 1.547 + test_suba(a0, a1, a2); 1.548 + } 1.549 + end = System.currentTimeMillis(); 1.550 + System.out.println("test_suba: " + (end - start)); 1.551 + 1.552 + start = System.currentTimeMillis(); 1.553 + for (int i=0; i<ITERS; i++) { 1.554 + test_mulc(a0, a1); 1.555 + } 1.556 + end = System.currentTimeMillis(); 1.557 + System.out.println("test_mulc: " + (end - start)); 1.558 + start = System.currentTimeMillis(); 1.559 + for (int i=0; i<ITERS; i++) { 1.560 + test_mulv(a0, a1, (short)VALUE); 1.561 + } 1.562 + end = System.currentTimeMillis(); 1.563 + System.out.println("test_mulv: " + (end - start)); 1.564 + start = System.currentTimeMillis(); 1.565 + for (int i=0; i<ITERS; i++) { 1.566 + test_mula(a0, a1, a2); 1.567 + } 1.568 + end = System.currentTimeMillis(); 1.569 + System.out.println("test_mula: " + (end - start)); 1.570 + 1.571 + start = System.currentTimeMillis(); 1.572 + for (int i=0; i<ITERS; i++) { 1.573 + test_divc(a0, a1); 1.574 + } 1.575 + end = System.currentTimeMillis(); 1.576 + System.out.println("test_divc: " + (end - start)); 1.577 + start = System.currentTimeMillis(); 1.578 + for (int i=0; i<ITERS; i++) { 1.579 + test_divv(a0, a1, (short)VALUE); 1.580 + } 1.581 + end = System.currentTimeMillis(); 1.582 + System.out.println("test_divv: " + (end - start)); 1.583 + start = System.currentTimeMillis(); 1.584 + for (int i=0; i<ITERS; i++) { 1.585 + test_diva(a0, a1, a2); 1.586 + } 1.587 + end = System.currentTimeMillis(); 1.588 + System.out.println("test_diva: " + (end - start)); 1.589 + 1.590 + start = System.currentTimeMillis(); 1.591 + for (int i=0; i<ITERS; i++) { 1.592 + test_mulc_n(a0, a1); 1.593 + } 1.594 + end = System.currentTimeMillis(); 1.595 + System.out.println("test_mulc_n: " + (end - start)); 1.596 + start = System.currentTimeMillis(); 1.597 + for (int i=0; i<ITERS; i++) { 1.598 + test_mulv(a0, a1, (short)-VALUE); 1.599 + } 1.600 + end = System.currentTimeMillis(); 1.601 + System.out.println("test_mulv_n: " + (end - start)); 1.602 + start = System.currentTimeMillis(); 1.603 + for (int i=0; i<ITERS; i++) { 1.604 + test_mula(a0, a1, a3); 1.605 + } 1.606 + end = System.currentTimeMillis(); 1.607 + System.out.println("test_mula_n: " + (end - start)); 1.608 + 1.609 + start = System.currentTimeMillis(); 1.610 + for (int i=0; i<ITERS; i++) { 1.611 + test_divc_n(a0, a1); 1.612 + } 1.613 + end = System.currentTimeMillis(); 1.614 + System.out.println("test_divc_n: " + (end - start)); 1.615 + start = System.currentTimeMillis(); 1.616 + for (int i=0; i<ITERS; i++) { 1.617 + test_divv(a0, a1, (short)-VALUE); 1.618 + } 1.619 + end = System.currentTimeMillis(); 1.620 + System.out.println("test_divv_n: " + (end - start)); 1.621 + start = System.currentTimeMillis(); 1.622 + for (int i=0; i<ITERS; i++) { 1.623 + test_diva(a0, a1, a3); 1.624 + } 1.625 + end = System.currentTimeMillis(); 1.626 + System.out.println("test_diva_n: " + (end - start)); 1.627 + 1.628 + start = System.currentTimeMillis(); 1.629 + for (int i=0; i<ITERS; i++) { 1.630 + test_andc(a0, a1); 1.631 + } 1.632 + end = System.currentTimeMillis(); 1.633 + System.out.println("test_andc: " + (end - start)); 1.634 + start = System.currentTimeMillis(); 1.635 + for (int i=0; i<ITERS; i++) { 1.636 + test_andv(a0, a1, (short)BIT_MASK); 1.637 + } 1.638 + end = System.currentTimeMillis(); 1.639 + System.out.println("test_andv: " + (end - start)); 1.640 + start = System.currentTimeMillis(); 1.641 + for (int i=0; i<ITERS; i++) { 1.642 + test_anda(a0, a1, a4); 1.643 + } 1.644 + end = System.currentTimeMillis(); 1.645 + System.out.println("test_anda: " + (end - start)); 1.646 + 1.647 + start = System.currentTimeMillis(); 1.648 + for (int i=0; i<ITERS; i++) { 1.649 + test_orc(a0, a1); 1.650 + } 1.651 + end = System.currentTimeMillis(); 1.652 + System.out.println("test_orc: " + (end - start)); 1.653 + start = System.currentTimeMillis(); 1.654 + for (int i=0; i<ITERS; i++) { 1.655 + test_orv(a0, a1, (short)BIT_MASK); 1.656 + } 1.657 + end = System.currentTimeMillis(); 1.658 + System.out.println("test_orv: " + (end - start)); 1.659 + start = System.currentTimeMillis(); 1.660 + for (int i=0; i<ITERS; i++) { 1.661 + test_ora(a0, a1, a4); 1.662 + } 1.663 + end = System.currentTimeMillis(); 1.664 + System.out.println("test_ora: " + (end - start)); 1.665 + 1.666 + start = System.currentTimeMillis(); 1.667 + for (int i=0; i<ITERS; i++) { 1.668 + test_xorc(a0, a1); 1.669 + } 1.670 + end = System.currentTimeMillis(); 1.671 + System.out.println("test_xorc: " + (end - start)); 1.672 + start = System.currentTimeMillis(); 1.673 + for (int i=0; i<ITERS; i++) { 1.674 + test_xorv(a0, a1, (short)BIT_MASK); 1.675 + } 1.676 + end = System.currentTimeMillis(); 1.677 + System.out.println("test_xorv: " + (end - start)); 1.678 + start = System.currentTimeMillis(); 1.679 + for (int i=0; i<ITERS; i++) { 1.680 + test_xora(a0, a1, a4); 1.681 + } 1.682 + end = System.currentTimeMillis(); 1.683 + System.out.println("test_xora: " + (end - start)); 1.684 + 1.685 + start = System.currentTimeMillis(); 1.686 + for (int i=0; i<ITERS; i++) { 1.687 + test_sllc(a0, a1); 1.688 + } 1.689 + end = System.currentTimeMillis(); 1.690 + System.out.println("test_sllc: " + (end - start)); 1.691 + start = System.currentTimeMillis(); 1.692 + for (int i=0; i<ITERS; i++) { 1.693 + test_sllv(a0, a1, VALUE); 1.694 + } 1.695 + end = System.currentTimeMillis(); 1.696 + System.out.println("test_sllv: " + (end - start)); 1.697 + 1.698 + start = System.currentTimeMillis(); 1.699 + for (int i=0; i<ITERS; i++) { 1.700 + test_srlc(a0, a1); 1.701 + } 1.702 + end = System.currentTimeMillis(); 1.703 + System.out.println("test_srlc: " + (end - start)); 1.704 + start = System.currentTimeMillis(); 1.705 + for (int i=0; i<ITERS; i++) { 1.706 + test_srlv(a0, a1, VALUE); 1.707 + } 1.708 + end = System.currentTimeMillis(); 1.709 + System.out.println("test_srlv: " + (end - start)); 1.710 + 1.711 + start = System.currentTimeMillis(); 1.712 + for (int i=0; i<ITERS; i++) { 1.713 + test_srac(a0, a1); 1.714 + } 1.715 + end = System.currentTimeMillis(); 1.716 + System.out.println("test_srac: " + (end - start)); 1.717 + start = System.currentTimeMillis(); 1.718 + for (int i=0; i<ITERS; i++) { 1.719 + test_srav(a0, a1, VALUE); 1.720 + } 1.721 + end = System.currentTimeMillis(); 1.722 + System.out.println("test_srav: " + (end - start)); 1.723 + 1.724 + start = System.currentTimeMillis(); 1.725 + for (int i=0; i<ITERS; i++) { 1.726 + test_sllc_n(a0, a1); 1.727 + } 1.728 + end = System.currentTimeMillis(); 1.729 + System.out.println("test_sllc_n: " + (end - start)); 1.730 + start = System.currentTimeMillis(); 1.731 + for (int i=0; i<ITERS; i++) { 1.732 + test_sllv(a0, a1, -VALUE); 1.733 + } 1.734 + end = System.currentTimeMillis(); 1.735 + System.out.println("test_sllv_n: " + (end - start)); 1.736 + 1.737 + start = System.currentTimeMillis(); 1.738 + for (int i=0; i<ITERS; i++) { 1.739 + test_srlc_n(a0, a1); 1.740 + } 1.741 + end = System.currentTimeMillis(); 1.742 + System.out.println("test_srlc_n: " + (end - start)); 1.743 + start = System.currentTimeMillis(); 1.744 + for (int i=0; i<ITERS; i++) { 1.745 + test_srlv(a0, a1, -VALUE); 1.746 + } 1.747 + end = System.currentTimeMillis(); 1.748 + System.out.println("test_srlv_n: " + (end - start)); 1.749 + 1.750 + start = System.currentTimeMillis(); 1.751 + for (int i=0; i<ITERS; i++) { 1.752 + test_srac_n(a0, a1); 1.753 + } 1.754 + end = System.currentTimeMillis(); 1.755 + System.out.println("test_srac_n: " + (end - start)); 1.756 + start = System.currentTimeMillis(); 1.757 + for (int i=0; i<ITERS; i++) { 1.758 + test_srav(a0, a1, -VALUE); 1.759 + } 1.760 + end = System.currentTimeMillis(); 1.761 + System.out.println("test_srav_n: " + (end - start)); 1.762 + 1.763 + start = System.currentTimeMillis(); 1.764 + for (int i=0; i<ITERS; i++) { 1.765 + test_sllc_o(a0, a1); 1.766 + } 1.767 + end = System.currentTimeMillis(); 1.768 + System.out.println("test_sllc_o: " + (end - start)); 1.769 + start = System.currentTimeMillis(); 1.770 + for (int i=0; i<ITERS; i++) { 1.771 + test_sllv(a0, a1, SHIFT); 1.772 + } 1.773 + end = System.currentTimeMillis(); 1.774 + System.out.println("test_sllv_o: " + (end - start)); 1.775 + 1.776 + start = System.currentTimeMillis(); 1.777 + for (int i=0; i<ITERS; i++) { 1.778 + test_srlc_o(a0, a1); 1.779 + } 1.780 + end = System.currentTimeMillis(); 1.781 + System.out.println("test_srlc_o: " + (end - start)); 1.782 + start = System.currentTimeMillis(); 1.783 + for (int i=0; i<ITERS; i++) { 1.784 + test_srlv(a0, a1, SHIFT); 1.785 + } 1.786 + end = System.currentTimeMillis(); 1.787 + System.out.println("test_srlv_o: " + (end - start)); 1.788 + 1.789 + start = System.currentTimeMillis(); 1.790 + for (int i=0; i<ITERS; i++) { 1.791 + test_srac_o(a0, a1); 1.792 + } 1.793 + end = System.currentTimeMillis(); 1.794 + System.out.println("test_srac_o: " + (end - start)); 1.795 + start = System.currentTimeMillis(); 1.796 + for (int i=0; i<ITERS; i++) { 1.797 + test_srav(a0, a1, SHIFT); 1.798 + } 1.799 + end = System.currentTimeMillis(); 1.800 + System.out.println("test_srav_o: " + (end - start)); 1.801 + 1.802 + start = System.currentTimeMillis(); 1.803 + for (int i=0; i<ITERS; i++) { 1.804 + test_sllc_on(a0, a1); 1.805 + } 1.806 + end = System.currentTimeMillis(); 1.807 + System.out.println("test_sllc_on: " + (end - start)); 1.808 + start = System.currentTimeMillis(); 1.809 + for (int i=0; i<ITERS; i++) { 1.810 + test_sllv(a0, a1, -SHIFT); 1.811 + } 1.812 + end = System.currentTimeMillis(); 1.813 + System.out.println("test_sllv_on: " + (end - start)); 1.814 + 1.815 + start = System.currentTimeMillis(); 1.816 + for (int i=0; i<ITERS; i++) { 1.817 + test_srlc_on(a0, a1); 1.818 + } 1.819 + end = System.currentTimeMillis(); 1.820 + System.out.println("test_srlc_on: " + (end - start)); 1.821 + start = System.currentTimeMillis(); 1.822 + for (int i=0; i<ITERS; i++) { 1.823 + test_srlv(a0, a1, -SHIFT); 1.824 + } 1.825 + end = System.currentTimeMillis(); 1.826 + System.out.println("test_srlv_on: " + (end - start)); 1.827 + 1.828 + start = System.currentTimeMillis(); 1.829 + for (int i=0; i<ITERS; i++) { 1.830 + test_srac_on(a0, a1); 1.831 + } 1.832 + end = System.currentTimeMillis(); 1.833 + System.out.println("test_srac_on: " + (end - start)); 1.834 + start = System.currentTimeMillis(); 1.835 + for (int i=0; i<ITERS; i++) { 1.836 + test_srav(a0, a1, -SHIFT); 1.837 + } 1.838 + end = System.currentTimeMillis(); 1.839 + System.out.println("test_srav_on: " + (end - start)); 1.840 + 1.841 + start = System.currentTimeMillis(); 1.842 + for (int i=0; i<ITERS; i++) { 1.843 + test_sllc_add(a0, a1); 1.844 + } 1.845 + end = System.currentTimeMillis(); 1.846 + System.out.println("test_sllc_add: " + (end - start)); 1.847 + start = System.currentTimeMillis(); 1.848 + for (int i=0; i<ITERS; i++) { 1.849 + test_sllv_add(a0, a1, ADD_INIT); 1.850 + } 1.851 + end = System.currentTimeMillis(); 1.852 + System.out.println("test_sllv_add: " + (end - start)); 1.853 + 1.854 + start = System.currentTimeMillis(); 1.855 + for (int i=0; i<ITERS; i++) { 1.856 + test_srlc_add(a0, a1); 1.857 + } 1.858 + end = System.currentTimeMillis(); 1.859 + System.out.println("test_srlc_add: " + (end - start)); 1.860 + start = System.currentTimeMillis(); 1.861 + for (int i=0; i<ITERS; i++) { 1.862 + test_srlv_add(a0, a1, ADD_INIT); 1.863 + } 1.864 + end = System.currentTimeMillis(); 1.865 + System.out.println("test_srlv_add: " + (end - start)); 1.866 + 1.867 + start = System.currentTimeMillis(); 1.868 + for (int i=0; i<ITERS; i++) { 1.869 + test_srac_add(a0, a1); 1.870 + } 1.871 + end = System.currentTimeMillis(); 1.872 + System.out.println("test_srac_add: " + (end - start)); 1.873 + start = System.currentTimeMillis(); 1.874 + for (int i=0; i<ITERS; i++) { 1.875 + test_srav_add(a0, a1, ADD_INIT); 1.876 + } 1.877 + end = System.currentTimeMillis(); 1.878 + System.out.println("test_srav_add: " + (end - start)); 1.879 + 1.880 + start = System.currentTimeMillis(); 1.881 + for (int i=0; i<ITERS; i++) { 1.882 + test_sllc_and(a0, a1); 1.883 + } 1.884 + end = System.currentTimeMillis(); 1.885 + System.out.println("test_sllc_and: " + (end - start)); 1.886 + start = System.currentTimeMillis(); 1.887 + for (int i=0; i<ITERS; i++) { 1.888 + test_sllv_and(a0, a1, BIT_MASK); 1.889 + } 1.890 + end = System.currentTimeMillis(); 1.891 + System.out.println("test_sllv_and: " + (end - start)); 1.892 + 1.893 + start = System.currentTimeMillis(); 1.894 + for (int i=0; i<ITERS; i++) { 1.895 + test_srlc_and(a0, a1); 1.896 + } 1.897 + end = System.currentTimeMillis(); 1.898 + System.out.println("test_srlc_and: " + (end - start)); 1.899 + start = System.currentTimeMillis(); 1.900 + for (int i=0; i<ITERS; i++) { 1.901 + test_srlv_and(a0, a1, BIT_MASK); 1.902 + } 1.903 + end = System.currentTimeMillis(); 1.904 + System.out.println("test_srlv_and: " + (end - start)); 1.905 + 1.906 + start = System.currentTimeMillis(); 1.907 + for (int i=0; i<ITERS; i++) { 1.908 + test_srac_and(a0, a1); 1.909 + } 1.910 + end = System.currentTimeMillis(); 1.911 + System.out.println("test_srac_and: " + (end - start)); 1.912 + start = System.currentTimeMillis(); 1.913 + for (int i=0; i<ITERS; i++) { 1.914 + test_srav_and(a0, a1, BIT_MASK); 1.915 + } 1.916 + end = System.currentTimeMillis(); 1.917 + System.out.println("test_srav_and: " + (end - start)); 1.918 + 1.919 + start = System.currentTimeMillis(); 1.920 + for (int i=0; i<ITERS; i++) { 1.921 + test_pack2(p2, a1); 1.922 + } 1.923 + end = System.currentTimeMillis(); 1.924 + System.out.println("test_pack2: " + (end - start)); 1.925 + start = System.currentTimeMillis(); 1.926 + for (int i=0; i<ITERS; i++) { 1.927 + test_unpack2(a0, p2); 1.928 + } 1.929 + end = System.currentTimeMillis(); 1.930 + System.out.println("test_unpack2: " + (end - start)); 1.931 + start = System.currentTimeMillis(); 1.932 + for (int i=0; i<ITERS; i++) { 1.933 + test_pack2_swap(p2, a1); 1.934 + } 1.935 + end = System.currentTimeMillis(); 1.936 + System.out.println("test_pack2_swap: " + (end - start)); 1.937 + start = System.currentTimeMillis(); 1.938 + for (int i=0; i<ITERS; i++) { 1.939 + test_unpack2_swap(a0, p2); 1.940 + } 1.941 + end = System.currentTimeMillis(); 1.942 + System.out.println("test_unpack2_swap: " + (end - start)); 1.943 + 1.944 + start = System.currentTimeMillis(); 1.945 + for (int i=0; i<ITERS; i++) { 1.946 + test_pack4(p4, a1); 1.947 + } 1.948 + end = System.currentTimeMillis(); 1.949 + System.out.println("test_pack4: " + (end - start)); 1.950 + start = System.currentTimeMillis(); 1.951 + for (int i=0; i<ITERS; i++) { 1.952 + test_unpack4(a0, p4); 1.953 + } 1.954 + end = System.currentTimeMillis(); 1.955 + System.out.println("test_unpack4: " + (end - start)); 1.956 + start = System.currentTimeMillis(); 1.957 + for (int i=0; i<ITERS; i++) { 1.958 + test_pack4_swap(p4, a1); 1.959 + } 1.960 + end = System.currentTimeMillis(); 1.961 + System.out.println("test_pack4_swap: " + (end - start)); 1.962 + start = System.currentTimeMillis(); 1.963 + for (int i=0; i<ITERS; i++) { 1.964 + test_unpack4_swap(a0, p4); 1.965 + } 1.966 + end = System.currentTimeMillis(); 1.967 + System.out.println("test_unpack4_swap: " + (end - start)); 1.968 + 1.969 + return errn; 1.970 + } 1.971 + 1.972 + static int test_sum(short[] a1) { 1.973 + int sum = 0; 1.974 + for (int i = 0; i < a1.length; i+=1) { 1.975 + sum += a1[i]; 1.976 + } 1.977 + return sum; 1.978 + } 1.979 + 1.980 + static void test_addc(short[] a0, short[] a1) { 1.981 + for (int i = 0; i < a0.length; i+=1) { 1.982 + a0[i] = (short)(a1[i]+VALUE); 1.983 + } 1.984 + } 1.985 + static void test_addv(short[] a0, short[] a1, short b) { 1.986 + for (int i = 0; i < a0.length; i+=1) { 1.987 + a0[i] = (short)(a1[i]+b); 1.988 + } 1.989 + } 1.990 + static void test_adda(short[] a0, short[] a1, short[] a2) { 1.991 + for (int i = 0; i < a0.length; i+=1) { 1.992 + a0[i] = (short)(a1[i]+a2[i]); 1.993 + } 1.994 + } 1.995 + 1.996 + static void test_subc(short[] a0, short[] a1) { 1.997 + for (int i = 0; i < a0.length; i+=1) { 1.998 + a0[i] = (short)(a1[i]-VALUE); 1.999 + } 1.1000 + } 1.1001 + static void test_subv(short[] a0, short[] a1, short b) { 1.1002 + for (int i = 0; i < a0.length; i+=1) { 1.1003 + a0[i] = (short)(a1[i]-b); 1.1004 + } 1.1005 + } 1.1006 + static void test_suba(short[] a0, short[] a1, short[] a2) { 1.1007 + for (int i = 0; i < a0.length; i+=1) { 1.1008 + a0[i] = (short)(a1[i]-a2[i]); 1.1009 + } 1.1010 + } 1.1011 + 1.1012 + static void test_mulc(short[] a0, short[] a1) { 1.1013 + for (int i = 0; i < a0.length; i+=1) { 1.1014 + a0[i] = (short)(a1[i]*VALUE); 1.1015 + } 1.1016 + } 1.1017 + static void test_mulc_n(short[] a0, short[] a1) { 1.1018 + for (int i = 0; i < a0.length; i+=1) { 1.1019 + a0[i] = (short)(a1[i]*(-VALUE)); 1.1020 + } 1.1021 + } 1.1022 + static void test_mulv(short[] a0, short[] a1, short b) { 1.1023 + for (int i = 0; i < a0.length; i+=1) { 1.1024 + a0[i] = (short)(a1[i]*b); 1.1025 + } 1.1026 + } 1.1027 + static void test_mula(short[] a0, short[] a1, short[] a2) { 1.1028 + for (int i = 0; i < a0.length; i+=1) { 1.1029 + a0[i] = (short)(a1[i]*a2[i]); 1.1030 + } 1.1031 + } 1.1032 + 1.1033 + static void test_divc(short[] a0, short[] a1) { 1.1034 + for (int i = 0; i < a0.length; i+=1) { 1.1035 + a0[i] = (short)(a1[i]/VALUE); 1.1036 + } 1.1037 + } 1.1038 + static void test_divc_n(short[] a0, short[] a1) { 1.1039 + for (int i = 0; i < a0.length; i+=1) { 1.1040 + a0[i] = (short)(a1[i]/(-VALUE)); 1.1041 + } 1.1042 + } 1.1043 + static void test_divv(short[] a0, short[] a1, short b) { 1.1044 + for (int i = 0; i < a0.length; i+=1) { 1.1045 + a0[i] = (short)(a1[i]/b); 1.1046 + } 1.1047 + } 1.1048 + static void test_diva(short[] a0, short[] a1, short[] a2) { 1.1049 + for (int i = 0; i < a0.length; i+=1) { 1.1050 + a0[i] = (short)(a1[i]/a2[i]); 1.1051 + } 1.1052 + } 1.1053 + 1.1054 + static void test_andc(short[] a0, short[] a1) { 1.1055 + for (int i = 0; i < a0.length; i+=1) { 1.1056 + a0[i] = (short)(a1[i]&BIT_MASK); 1.1057 + } 1.1058 + } 1.1059 + static void test_andv(short[] a0, short[] a1, short b) { 1.1060 + for (int i = 0; i < a0.length; i+=1) { 1.1061 + a0[i] = (short)(a1[i]&b); 1.1062 + } 1.1063 + } 1.1064 + static void test_anda(short[] a0, short[] a1, short[] a2) { 1.1065 + for (int i = 0; i < a0.length; i+=1) { 1.1066 + a0[i] = (short)(a1[i]&a2[i]); 1.1067 + } 1.1068 + } 1.1069 + 1.1070 + static void test_orc(short[] a0, short[] a1) { 1.1071 + for (int i = 0; i < a0.length; i+=1) { 1.1072 + a0[i] = (short)(a1[i]|BIT_MASK); 1.1073 + } 1.1074 + } 1.1075 + static void test_orv(short[] a0, short[] a1, short b) { 1.1076 + for (int i = 0; i < a0.length; i+=1) { 1.1077 + a0[i] = (short)(a1[i]|b); 1.1078 + } 1.1079 + } 1.1080 + static void test_ora(short[] a0, short[] a1, short[] a2) { 1.1081 + for (int i = 0; i < a0.length; i+=1) { 1.1082 + a0[i] = (short)(a1[i]|a2[i]); 1.1083 + } 1.1084 + } 1.1085 + 1.1086 + static void test_xorc(short[] a0, short[] a1) { 1.1087 + for (int i = 0; i < a0.length; i+=1) { 1.1088 + a0[i] = (short)(a1[i]^BIT_MASK); 1.1089 + } 1.1090 + } 1.1091 + static void test_xorv(short[] a0, short[] a1, short b) { 1.1092 + for (int i = 0; i < a0.length; i+=1) { 1.1093 + a0[i] = (short)(a1[i]^b); 1.1094 + } 1.1095 + } 1.1096 + static void test_xora(short[] a0, short[] a1, short[] a2) { 1.1097 + for (int i = 0; i < a0.length; i+=1) { 1.1098 + a0[i] = (short)(a1[i]^a2[i]); 1.1099 + } 1.1100 + } 1.1101 + 1.1102 + static void test_sllc(short[] a0, short[] a1) { 1.1103 + for (int i = 0; i < a0.length; i+=1) { 1.1104 + a0[i] = (short)(a1[i]<<VALUE); 1.1105 + } 1.1106 + } 1.1107 + static void test_sllc_n(short[] a0, short[] a1) { 1.1108 + for (int i = 0; i < a0.length; i+=1) { 1.1109 + a0[i] = (short)(a1[i]<<(-VALUE)); 1.1110 + } 1.1111 + } 1.1112 + static void test_sllc_o(short[] a0, short[] a1) { 1.1113 + for (int i = 0; i < a0.length; i+=1) { 1.1114 + a0[i] = (short)(a1[i]<<SHIFT); 1.1115 + } 1.1116 + } 1.1117 + static void test_sllc_on(short[] a0, short[] a1) { 1.1118 + for (int i = 0; i < a0.length; i+=1) { 1.1119 + a0[i] = (short)(a1[i]<<(-SHIFT)); 1.1120 + } 1.1121 + } 1.1122 + static void test_sllv(short[] a0, short[] a1, int b) { 1.1123 + for (int i = 0; i < a0.length; i+=1) { 1.1124 + a0[i] = (short)(a1[i]<<b); 1.1125 + } 1.1126 + } 1.1127 + static void test_sllc_add(short[] a0, short[] a1) { 1.1128 + for (int i = 0; i < a0.length; i+=1) { 1.1129 + a0[i] = (short)((a1[i] + ADD_INIT)<<VALUE); 1.1130 + } 1.1131 + } 1.1132 + static void test_sllv_add(short[] a0, short[] a1, int b) { 1.1133 + for (int i = 0; i < a0.length; i+=1) { 1.1134 + a0[i] = (short)((a1[i] + b)<<VALUE); 1.1135 + } 1.1136 + } 1.1137 + static void test_sllc_and(short[] a0, short[] a1) { 1.1138 + for (int i = 0; i < a0.length; i+=1) { 1.1139 + a0[i] = (short)((a1[i] & BIT_MASK)<<VALUE); 1.1140 + } 1.1141 + } 1.1142 + static void test_sllv_and(short[] a0, short[] a1, int b) { 1.1143 + for (int i = 0; i < a0.length; i+=1) { 1.1144 + a0[i] = (short)((a1[i] & b)<<VALUE); 1.1145 + } 1.1146 + } 1.1147 + 1.1148 + static void test_srlc(short[] a0, short[] a1) { 1.1149 + for (int i = 0; i < a0.length; i+=1) { 1.1150 + a0[i] = (short)(a1[i]>>>VALUE); 1.1151 + } 1.1152 + } 1.1153 + static void test_srlc_n(short[] a0, short[] a1) { 1.1154 + for (int i = 0; i < a0.length; i+=1) { 1.1155 + a0[i] = (short)(a1[i]>>>(-VALUE)); 1.1156 + } 1.1157 + } 1.1158 + static void test_srlc_o(short[] a0, short[] a1) { 1.1159 + for (int i = 0; i < a0.length; i+=1) { 1.1160 + a0[i] = (short)(a1[i]>>>SHIFT); 1.1161 + } 1.1162 + } 1.1163 + static void test_srlc_on(short[] a0, short[] a1) { 1.1164 + for (int i = 0; i < a0.length; i+=1) { 1.1165 + a0[i] = (short)(a1[i]>>>(-SHIFT)); 1.1166 + } 1.1167 + } 1.1168 + static void test_srlv(short[] a0, short[] a1, int b) { 1.1169 + for (int i = 0; i < a0.length; i+=1) { 1.1170 + a0[i] = (short)(a1[i]>>>b); 1.1171 + } 1.1172 + } 1.1173 + static void test_srlc_add(short[] a0, short[] a1) { 1.1174 + for (int i = 0; i < a0.length; i+=1) { 1.1175 + a0[i] = (short)((a1[i] + ADD_INIT)>>>VALUE); 1.1176 + } 1.1177 + } 1.1178 + static void test_srlv_add(short[] a0, short[] a1, int b) { 1.1179 + for (int i = 0; i < a0.length; i+=1) { 1.1180 + a0[i] = (short)((a1[i] + b)>>>VALUE); 1.1181 + } 1.1182 + } 1.1183 + static void test_srlc_and(short[] a0, short[] a1) { 1.1184 + for (int i = 0; i < a0.length; i+=1) { 1.1185 + a0[i] = (short)((a1[i] & BIT_MASK)>>>VALUE); 1.1186 + } 1.1187 + } 1.1188 + static void test_srlv_and(short[] a0, short[] a1, int b) { 1.1189 + for (int i = 0; i < a0.length; i+=1) { 1.1190 + a0[i] = (short)((a1[i] & b)>>>VALUE); 1.1191 + } 1.1192 + } 1.1193 + 1.1194 + static void test_srac(short[] a0, short[] a1) { 1.1195 + for (int i = 0; i < a0.length; i+=1) { 1.1196 + a0[i] = (short)(a1[i]>>VALUE); 1.1197 + } 1.1198 + } 1.1199 + static void test_srac_n(short[] a0, short[] a1) { 1.1200 + for (int i = 0; i < a0.length; i+=1) { 1.1201 + a0[i] = (short)(a1[i]>>(-VALUE)); 1.1202 + } 1.1203 + } 1.1204 + static void test_srac_o(short[] a0, short[] a1) { 1.1205 + for (int i = 0; i < a0.length; i+=1) { 1.1206 + a0[i] = (short)(a1[i]>>SHIFT); 1.1207 + } 1.1208 + } 1.1209 + static void test_srac_on(short[] a0, short[] a1) { 1.1210 + for (int i = 0; i < a0.length; i+=1) { 1.1211 + a0[i] = (short)(a1[i]>>(-SHIFT)); 1.1212 + } 1.1213 + } 1.1214 + static void test_srav(short[] a0, short[] a1, int b) { 1.1215 + for (int i = 0; i < a0.length; i+=1) { 1.1216 + a0[i] = (short)(a1[i]>>b); 1.1217 + } 1.1218 + } 1.1219 + static void test_srac_add(short[] a0, short[] a1) { 1.1220 + for (int i = 0; i < a0.length; i+=1) { 1.1221 + a0[i] = (short)((a1[i] + ADD_INIT)>>VALUE); 1.1222 + } 1.1223 + } 1.1224 + static void test_srav_add(short[] a0, short[] a1, int b) { 1.1225 + for (int i = 0; i < a0.length; i+=1) { 1.1226 + a0[i] = (short)((a1[i] + b)>>VALUE); 1.1227 + } 1.1228 + } 1.1229 + static void test_srac_and(short[] a0, short[] a1) { 1.1230 + for (int i = 0; i < a0.length; i+=1) { 1.1231 + a0[i] = (short)((a1[i] & BIT_MASK)>>VALUE); 1.1232 + } 1.1233 + } 1.1234 + static void test_srav_and(short[] a0, short[] a1, int b) { 1.1235 + for (int i = 0; i < a0.length; i+=1) { 1.1236 + a0[i] = (short)((a1[i] & b)>>VALUE); 1.1237 + } 1.1238 + } 1.1239 + 1.1240 + static void test_pack2(int[] p2, short[] a1) { 1.1241 + if (p2.length*2 > a1.length) return; 1.1242 + for (int i = 0; i < p2.length; i+=1) { 1.1243 + int l0 = (int)a1[i*2+0]; 1.1244 + int l1 = (int)a1[i*2+1]; 1.1245 + p2[i] = (l1 << 16) | (l0 & 0xFFFF); 1.1246 + } 1.1247 + } 1.1248 + static void test_unpack2(short[] a0, int[] p2) { 1.1249 + if (p2.length*2 > a0.length) return; 1.1250 + for (int i = 0; i < p2.length; i+=1) { 1.1251 + int l = p2[i]; 1.1252 + a0[i*2+0] = (short)(l & 0xFFFF); 1.1253 + a0[i*2+1] = (short)(l >> 16); 1.1254 + } 1.1255 + } 1.1256 + static void test_pack2_swap(int[] p2, short[] a1) { 1.1257 + if (p2.length*2 > a1.length) return; 1.1258 + for (int i = 0; i < p2.length; i+=1) { 1.1259 + int l0 = (int)a1[i*2+0]; 1.1260 + int l1 = (int)a1[i*2+1]; 1.1261 + p2[i] = (l0 << 16) | (l1 & 0xFFFF); 1.1262 + } 1.1263 + } 1.1264 + static void test_unpack2_swap(short[] a0, int[] p2) { 1.1265 + if (p2.length*2 > a0.length) return; 1.1266 + for (int i = 0; i < p2.length; i+=1) { 1.1267 + int l = p2[i]; 1.1268 + a0[i*2+0] = (short)(l >> 16); 1.1269 + a0[i*2+1] = (short)(l & 0xFFFF); 1.1270 + } 1.1271 + } 1.1272 + 1.1273 + static void test_pack4(long[] p4, short[] a1) { 1.1274 + if (p4.length*4 > a1.length) return; 1.1275 + for (int i = 0; i < p4.length; i+=1) { 1.1276 + long l0 = (long)a1[i*4+0]; 1.1277 + long l1 = (long)a1[i*4+1]; 1.1278 + long l2 = (long)a1[i*4+2]; 1.1279 + long l3 = (long)a1[i*4+3]; 1.1280 + p4[i] = (l0 & 0xFFFFl) | 1.1281 + ((l1 & 0xFFFFl) << 16) | 1.1282 + ((l2 & 0xFFFFl) << 32) | 1.1283 + ((l3 & 0xFFFFl) << 48); 1.1284 + } 1.1285 + } 1.1286 + static void test_unpack4(short[] a0, long[] p4) { 1.1287 + if (p4.length*4 > a0.length) return; 1.1288 + for (int i = 0; i < p4.length; i+=1) { 1.1289 + long l = p4[i]; 1.1290 + a0[i*4+0] = (short)(l & 0xFFFFl); 1.1291 + a0[i*4+1] = (short)(l >> 16); 1.1292 + a0[i*4+2] = (short)(l >> 32); 1.1293 + a0[i*4+3] = (short)(l >> 48); 1.1294 + } 1.1295 + } 1.1296 + static void test_pack4_swap(long[] p4, short[] a1) { 1.1297 + if (p4.length*4 > a1.length) return; 1.1298 + for (int i = 0; i < p4.length; i+=1) { 1.1299 + long l0 = (long)a1[i*4+0]; 1.1300 + long l1 = (long)a1[i*4+1]; 1.1301 + long l2 = (long)a1[i*4+2]; 1.1302 + long l3 = (long)a1[i*4+3]; 1.1303 + p4[i] = (l3 & 0xFFFFl) | 1.1304 + ((l2 & 0xFFFFl) << 16) | 1.1305 + ((l1 & 0xFFFFl) << 32) | 1.1306 + ((l0 & 0xFFFFl) << 48); 1.1307 + } 1.1308 + } 1.1309 + static void test_unpack4_swap(short[] a0, long[] p4) { 1.1310 + if (p4.length*4 > a0.length) return; 1.1311 + for (int i = 0; i < p4.length; i+=1) { 1.1312 + long l = p4[i]; 1.1313 + a0[i*4+0] = (short)(l >> 48); 1.1314 + a0[i*4+1] = (short)(l >> 32); 1.1315 + a0[i*4+2] = (short)(l >> 16); 1.1316 + a0[i*4+3] = (short)(l & 0xFFFFl); 1.1317 + } 1.1318 + } 1.1319 + 1.1320 + static int verify(String text, int i, short elem, short val) { 1.1321 + if (elem != val) { 1.1322 + System.err.println(text + "[" + i + "] = " + elem + " != " + val); 1.1323 + return 1; 1.1324 + } 1.1325 + return 0; 1.1326 + } 1.1327 + 1.1328 + static int verify(String text, int i, int elem, int val) { 1.1329 + if (elem != val) { 1.1330 + System.err.println(text + "[" + i + "] = " + Integer.toHexString(elem) + " != " + Integer.toHexString(val)); 1.1331 + return 1; 1.1332 + } 1.1333 + return 0; 1.1334 + } 1.1335 + 1.1336 + static int verify(String text, int i, long elem, long val) { 1.1337 + if (elem != val) { 1.1338 + System.err.println(text + "[" + i + "] = " + Long.toHexString(elem) + " != " + Long.toHexString(val)); 1.1339 + return 1; 1.1340 + } 1.1341 + return 0; 1.1342 + } 1.1343 +}