1.1 --- /dev/null Thu Jan 01 00:00:00 1970 +0000 1.2 +++ b/test/compiler/7119644/TestShortVect.java Wed Apr 27 01:25:04 2016 +0800 1.3 @@ -0,0 +1,953 @@ 1.4 +/* 1.5 + * Copyright (c) 2012, Oracle and/or its affiliates. All rights reserved. 1.6 + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. 1.7 + * 1.8 + * This code is free software; you can redistribute it and/or modify it 1.9 + * under the terms of the GNU General Public License version 2 only, as 1.10 + * published by the Free Software Foundation. 1.11 + * 1.12 + * This code is distributed in the hope that it will be useful, but WITHOUT 1.13 + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 1.14 + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License 1.15 + * version 2 for more details (a copy is included in the LICENSE file that 1.16 + * accompanied this code). 1.17 + * 1.18 + * You should have received a copy of the GNU General Public License version 1.19 + * 2 along with this work; if not, write to the Free Software Foundation, 1.20 + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. 1.21 + * 1.22 + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA 1.23 + * or visit www.oracle.com if you need additional information or have any 1.24 + * questions. 1.25 + * 1.26 + */ 1.27 + 1.28 +/** 1.29 + * @test 1.30 + * @bug 7119644 1.31 + * @summary Increase superword's vector size up to 256 bits 1.32 + * 1.33 + * @run main/othervm/timeout=300 -Xbatch -XX:+IgnoreUnrecognizedVMOptions -XX:-TieredCompilation -XX:-OptimizeFill TestShortVect 1.34 + */ 1.35 + 1.36 +public class TestShortVect { 1.37 + private static final int ARRLEN = 997; 1.38 + private static final int ITERS = 11000; 1.39 + private static final int OFFSET = 3; 1.40 + private static final int SCALE = 2; 1.41 + private static final int ALIGN_OFF = 8; 1.42 + private static final int UNALIGN_OFF = 5; 1.43 + 1.44 + public static void main(String args[]) { 1.45 + System.out.println("Testing Short vectors"); 1.46 + int errn = test(); 1.47 + if (errn > 0) { 1.48 + System.err.println("FAILED: " + errn + " errors"); 1.49 + System.exit(97); 1.50 + } 1.51 + System.out.println("PASSED"); 1.52 + } 1.53 + 1.54 + static int test() { 1.55 + short[] a1 = new short[ARRLEN]; 1.56 + short[] a2 = new short[ARRLEN]; 1.57 + System.out.println("Warmup"); 1.58 + for (int i=0; i<ITERS; i++) { 1.59 + test_ci(a1); 1.60 + test_vi(a2, (short)123); 1.61 + test_cp(a1, a2); 1.62 + test_2ci(a1, a2); 1.63 + test_2vi(a1, a2, (short)123, (short)103); 1.64 + test_ci_neg(a1); 1.65 + test_vi_neg(a2, (short)123); 1.66 + test_cp_neg(a1, a2); 1.67 + test_2ci_neg(a1, a2); 1.68 + test_2vi_neg(a1, a2, (short)123, (short)103); 1.69 + test_ci_oppos(a1); 1.70 + test_vi_oppos(a2, (short)123); 1.71 + test_cp_oppos(a1, a2); 1.72 + test_2ci_oppos(a1, a2); 1.73 + test_2vi_oppos(a1, a2, (short)123, (short)103); 1.74 + test_ci_off(a1); 1.75 + test_vi_off(a2, (short)123); 1.76 + test_cp_off(a1, a2); 1.77 + test_2ci_off(a1, a2); 1.78 + test_2vi_off(a1, a2, (short)123, (short)103); 1.79 + test_ci_inv(a1, OFFSET); 1.80 + test_vi_inv(a2, (short)123, OFFSET); 1.81 + test_cp_inv(a1, a2, OFFSET); 1.82 + test_2ci_inv(a1, a2, OFFSET); 1.83 + test_2vi_inv(a1, a2, (short)123, (short)103, OFFSET); 1.84 + test_ci_scl(a1); 1.85 + test_vi_scl(a2, (short)123); 1.86 + test_cp_scl(a1, a2); 1.87 + test_2ci_scl(a1, a2); 1.88 + test_2vi_scl(a1, a2, (short)123, (short)103); 1.89 + test_cp_alndst(a1, a2); 1.90 + test_cp_alnsrc(a1, a2); 1.91 + test_2ci_aln(a1, a2); 1.92 + test_2vi_aln(a1, a2, (short)123, (short)103); 1.93 + test_cp_unalndst(a1, a2); 1.94 + test_cp_unalnsrc(a1, a2); 1.95 + test_2ci_unaln(a1, a2); 1.96 + test_2vi_unaln(a1, a2, (short)123, (short)103); 1.97 + } 1.98 + // Initialize 1.99 + for (int i=0; i<ARRLEN; i++) { 1.100 + a1[i] = -1; 1.101 + a2[i] = -1; 1.102 + } 1.103 + // Test and verify results 1.104 + System.out.println("Verification"); 1.105 + int errn = 0; 1.106 + { 1.107 + test_ci(a1); 1.108 + for (int i=0; i<ARRLEN; i++) { 1.109 + errn += verify("test_ci: a1", i, a1[i], (short)-123); 1.110 + } 1.111 + test_vi(a2, (short)123); 1.112 + for (int i=0; i<ARRLEN; i++) { 1.113 + errn += verify("test_vi: a2", i, a2[i], (short)123); 1.114 + } 1.115 + test_cp(a1, a2); 1.116 + for (int i=0; i<ARRLEN; i++) { 1.117 + errn += verify("test_cp: a1", i, a1[i], (short)123); 1.118 + } 1.119 + test_2ci(a1, a2); 1.120 + for (int i=0; i<ARRLEN; i++) { 1.121 + errn += verify("test_2ci: a1", i, a1[i], (short)-123); 1.122 + errn += verify("test_2ci: a2", i, a2[i], (short)-103); 1.123 + } 1.124 + test_2vi(a1, a2, (short)123, (short)103); 1.125 + for (int i=0; i<ARRLEN; i++) { 1.126 + errn += verify("test_2vi: a1", i, a1[i], (short)123); 1.127 + errn += verify("test_2vi: a2", i, a2[i], (short)103); 1.128 + } 1.129 + // Reset for negative stride 1.130 + for (int i=0; i<ARRLEN; i++) { 1.131 + a1[i] = -1; 1.132 + a2[i] = -1; 1.133 + } 1.134 + test_ci_neg(a1); 1.135 + for (int i=0; i<ARRLEN; i++) { 1.136 + errn += verify("test_ci_neg: a1", i, a1[i], (short)-123); 1.137 + } 1.138 + test_vi_neg(a2, (short)123); 1.139 + for (int i=0; i<ARRLEN; i++) { 1.140 + errn += verify("test_vi_neg: a2", i, a2[i], (short)123); 1.141 + } 1.142 + test_cp_neg(a1, a2); 1.143 + for (int i=0; i<ARRLEN; i++) { 1.144 + errn += verify("test_cp_neg: a1", i, a1[i], (short)123); 1.145 + } 1.146 + test_2ci_neg(a1, a2); 1.147 + for (int i=0; i<ARRLEN; i++) { 1.148 + errn += verify("test_2ci_neg: a1", i, a1[i], (short)-123); 1.149 + errn += verify("test_2ci_neg: a2", i, a2[i], (short)-103); 1.150 + } 1.151 + test_2vi_neg(a1, a2, (short)123, (short)103); 1.152 + for (int i=0; i<ARRLEN; i++) { 1.153 + errn += verify("test_2vi_neg: a1", i, a1[i], (short)123); 1.154 + errn += verify("test_2vi_neg: a2", i, a2[i], (short)103); 1.155 + } 1.156 + // Reset for opposite stride 1.157 + for (int i=0; i<ARRLEN; i++) { 1.158 + a1[i] = -1; 1.159 + a2[i] = -1; 1.160 + } 1.161 + test_ci_oppos(a1); 1.162 + for (int i=0; i<ARRLEN; i++) { 1.163 + errn += verify("test_ci_oppos: a1", i, a1[i], (short)-123); 1.164 + } 1.165 + test_vi_oppos(a2, (short)123); 1.166 + for (int i=0; i<ARRLEN; i++) { 1.167 + errn += verify("test_vi_oppos: a2", i, a2[i], (short)123); 1.168 + } 1.169 + test_cp_oppos(a1, a2); 1.170 + for (int i=0; i<ARRLEN; i++) { 1.171 + errn += verify("test_cp_oppos: a1", i, a1[i], (short)123); 1.172 + } 1.173 + test_2ci_oppos(a1, a2); 1.174 + for (int i=0; i<ARRLEN; i++) { 1.175 + errn += verify("test_2ci_oppos: a1", i, a1[i], (short)-123); 1.176 + errn += verify("test_2ci_oppos: a2", i, a2[i], (short)-103); 1.177 + } 1.178 + test_2vi_oppos(a1, a2, (short)123, (short)103); 1.179 + for (int i=0; i<ARRLEN; i++) { 1.180 + errn += verify("test_2vi_oppos: a1", i, a1[i], (short)123); 1.181 + errn += verify("test_2vi_oppos: a2", i, a2[i], (short)103); 1.182 + } 1.183 + // Reset for indexing with offset 1.184 + for (int i=0; i<ARRLEN; i++) { 1.185 + a1[i] = -1; 1.186 + a2[i] = -1; 1.187 + } 1.188 + test_ci_off(a1); 1.189 + for (int i=OFFSET; i<ARRLEN; i++) { 1.190 + errn += verify("test_ci_off: a1", i, a1[i], (short)-123); 1.191 + } 1.192 + test_vi_off(a2, (short)123); 1.193 + for (int i=OFFSET; i<ARRLEN; i++) { 1.194 + errn += verify("test_vi_off: a2", i, a2[i], (short)123); 1.195 + } 1.196 + test_cp_off(a1, a2); 1.197 + for (int i=OFFSET; i<ARRLEN; i++) { 1.198 + errn += verify("test_cp_off: a1", i, a1[i], (short)123); 1.199 + } 1.200 + test_2ci_off(a1, a2); 1.201 + for (int i=OFFSET; i<ARRLEN; i++) { 1.202 + errn += verify("test_2ci_off: a1", i, a1[i], (short)-123); 1.203 + errn += verify("test_2ci_off: a2", i, a2[i], (short)-103); 1.204 + } 1.205 + test_2vi_off(a1, a2, (short)123, (short)103); 1.206 + for (int i=OFFSET; i<ARRLEN; i++) { 1.207 + errn += verify("test_2vi_off: a1", i, a1[i], (short)123); 1.208 + errn += verify("test_2vi_off: a2", i, a2[i], (short)103); 1.209 + } 1.210 + for (int i=0; i<OFFSET; i++) { 1.211 + errn += verify("test_2vi_off: a1", i, a1[i], (short)-1); 1.212 + errn += verify("test_2vi_off: a2", i, a2[i], (short)-1); 1.213 + } 1.214 + // Reset for indexing with invariant offset 1.215 + for (int i=0; i<ARRLEN; i++) { 1.216 + a1[i] = -1; 1.217 + a2[i] = -1; 1.218 + } 1.219 + test_ci_inv(a1, OFFSET); 1.220 + for (int i=OFFSET; i<ARRLEN; i++) { 1.221 + errn += verify("test_ci_inv: a1", i, a1[i], (short)-123); 1.222 + } 1.223 + test_vi_inv(a2, (short)123, OFFSET); 1.224 + for (int i=OFFSET; i<ARRLEN; i++) { 1.225 + errn += verify("test_vi_inv: a2", i, a2[i], (short)123); 1.226 + } 1.227 + test_cp_inv(a1, a2, OFFSET); 1.228 + for (int i=OFFSET; i<ARRLEN; i++) { 1.229 + errn += verify("test_cp_inv: a1", i, a1[i], (short)123); 1.230 + } 1.231 + test_2ci_inv(a1, a2, OFFSET); 1.232 + for (int i=OFFSET; i<ARRLEN; i++) { 1.233 + errn += verify("test_2ci_inv: a1", i, a1[i], (short)-123); 1.234 + errn += verify("test_2ci_inv: a2", i, a2[i], (short)-103); 1.235 + } 1.236 + test_2vi_inv(a1, a2, (short)123, (short)103, OFFSET); 1.237 + for (int i=OFFSET; i<ARRLEN; i++) { 1.238 + errn += verify("test_2vi_inv: a1", i, a1[i], (short)123); 1.239 + errn += verify("test_2vi_inv: a2", i, a2[i], (short)103); 1.240 + } 1.241 + for (int i=0; i<OFFSET; i++) { 1.242 + errn += verify("test_2vi_inv: a1", i, a1[i], (short)-1); 1.243 + errn += verify("test_2vi_inv: a2", i, a2[i], (short)-1); 1.244 + } 1.245 + // Reset for indexing with scale 1.246 + for (int i=0; i<ARRLEN; i++) { 1.247 + a1[i] = -1; 1.248 + a2[i] = -1; 1.249 + } 1.250 + test_ci_scl(a1); 1.251 + for (int i=0; i<ARRLEN; i++) { 1.252 + int val = (i%SCALE != 0) ? -1 : -123; 1.253 + errn += verify("test_ci_scl: a1", i, a1[i], (short)val); 1.254 + } 1.255 + test_vi_scl(a2, (short)123); 1.256 + for (int i=0; i<ARRLEN; i++) { 1.257 + int val = (i%SCALE != 0) ? -1 : 123; 1.258 + errn += verify("test_vi_scl: a2", i, a2[i], (short)val); 1.259 + } 1.260 + test_cp_scl(a1, a2); 1.261 + for (int i=0; i<ARRLEN; i++) { 1.262 + int val = (i%SCALE != 0) ? -1 : 123; 1.263 + errn += verify("test_cp_scl: a1", i, a1[i], (short)val); 1.264 + } 1.265 + test_2ci_scl(a1, a2); 1.266 + for (int i=0; i<ARRLEN; i++) { 1.267 + if (i%SCALE != 0) { 1.268 + errn += verify("test_2ci_scl: a1", i, a1[i], (short)-1); 1.269 + } else if (i*SCALE < ARRLEN) { 1.270 + errn += verify("test_2ci_scl: a1", i*SCALE, a1[i*SCALE], (short)-123); 1.271 + } 1.272 + if (i%SCALE != 0) { 1.273 + errn += verify("test_2ci_scl: a2", i, a2[i], (short)-1); 1.274 + } else if (i*SCALE < ARRLEN) { 1.275 + errn += verify("test_2ci_scl: a2", i*SCALE, a2[i*SCALE], (short)-103); 1.276 + } 1.277 + } 1.278 + test_2vi_scl(a1, a2, (short)123, (short)103); 1.279 + for (int i=0; i<ARRLEN; i++) { 1.280 + if (i%SCALE != 0) { 1.281 + errn += verify("test_2vi_scl: a1", i, a1[i], (short)-1); 1.282 + } else if (i*SCALE < ARRLEN) { 1.283 + errn += verify("test_2vi_scl: a1", i*SCALE, a1[i*SCALE], (short)123); 1.284 + } 1.285 + if (i%SCALE != 0) { 1.286 + errn += verify("test_2vi_scl: a2", i, a2[i], (short)-1); 1.287 + } else if (i*SCALE < ARRLEN) { 1.288 + errn += verify("test_2vi_scl: a2", i*SCALE, a2[i*SCALE], (short)103); 1.289 + } 1.290 + } 1.291 + // Reset for 2 arrays with relative aligned offset 1.292 + for (int i=0; i<ARRLEN; i++) { 1.293 + a1[i] = -1; 1.294 + a2[i] = -1; 1.295 + } 1.296 + test_vi(a2, (short)123); 1.297 + test_cp_alndst(a1, a2); 1.298 + for (int i=0; i<ALIGN_OFF; i++) { 1.299 + errn += verify("test_cp_alndst: a1", i, a1[i], (short)-1); 1.300 + } 1.301 + for (int i=ALIGN_OFF; i<ARRLEN; i++) { 1.302 + errn += verify("test_cp_alndst: a1", i, a1[i], (short)123); 1.303 + } 1.304 + test_vi(a2, (short)-123); 1.305 + test_cp_alnsrc(a1, a2); 1.306 + for (int i=0; i<ARRLEN-ALIGN_OFF; i++) { 1.307 + errn += verify("test_cp_alnsrc: a1", i, a1[i], (short)-123); 1.308 + } 1.309 + for (int i=ARRLEN-ALIGN_OFF; i<ARRLEN; i++) { 1.310 + errn += verify("test_cp_alnsrc: a1", i, a1[i], (short)123); 1.311 + } 1.312 + for (int i=0; i<ARRLEN; i++) { 1.313 + a1[i] = -1; 1.314 + a2[i] = -1; 1.315 + } 1.316 + test_2ci_aln(a1, a2); 1.317 + for (int i=0; i<ALIGN_OFF; i++) { 1.318 + errn += verify("test_2ci_aln: a1", i, a1[i], (short)-1); 1.319 + } 1.320 + for (int i=ALIGN_OFF; i<ARRLEN; i++) { 1.321 + errn += verify("test_2ci_aln: a1", i, a1[i], (short)-123); 1.322 + } 1.323 + for (int i=0; i<ARRLEN-ALIGN_OFF; i++) { 1.324 + errn += verify("test_2ci_aln: a2", i, a2[i], (short)-103); 1.325 + } 1.326 + for (int i=ARRLEN-ALIGN_OFF; i<ARRLEN; i++) { 1.327 + errn += verify("test_2ci_aln: a2", i, a2[i], (short)-1); 1.328 + } 1.329 + for (int i=0; i<ARRLEN; i++) { 1.330 + a1[i] = -1; 1.331 + a2[i] = -1; 1.332 + } 1.333 + test_2vi_aln(a1, a2, (short)123, (short)103); 1.334 + for (int i=0; i<ARRLEN-ALIGN_OFF; i++) { 1.335 + errn += verify("test_2vi_aln: a1", i, a1[i], (short)123); 1.336 + } 1.337 + for (int i=ARRLEN-ALIGN_OFF; i<ARRLEN; i++) { 1.338 + errn += verify("test_2vi_aln: a1", i, a1[i], (short)-1); 1.339 + } 1.340 + for (int i=0; i<ALIGN_OFF; i++) { 1.341 + errn += verify("test_2vi_aln: a2", i, a2[i], (short)-1); 1.342 + } 1.343 + for (int i=ALIGN_OFF; i<ARRLEN; i++) { 1.344 + errn += verify("test_2vi_aln: a2", i, a2[i], (short)103); 1.345 + } 1.346 + 1.347 + // Reset for 2 arrays with relative unaligned offset 1.348 + for (int i=0; i<ARRLEN; i++) { 1.349 + a1[i] = -1; 1.350 + a2[i] = -1; 1.351 + } 1.352 + test_vi(a2, (short)123); 1.353 + test_cp_unalndst(a1, a2); 1.354 + for (int i=0; i<UNALIGN_OFF; i++) { 1.355 + errn += verify("test_cp_unalndst: a1", i, a1[i], (short)-1); 1.356 + } 1.357 + for (int i=UNALIGN_OFF; i<ARRLEN; i++) { 1.358 + errn += verify("test_cp_unalndst: a1", i, a1[i], (short)123); 1.359 + } 1.360 + test_vi(a2, (short)-123); 1.361 + test_cp_unalnsrc(a1, a2); 1.362 + for (int i=0; i<ARRLEN-UNALIGN_OFF; i++) { 1.363 + errn += verify("test_cp_unalnsrc: a1", i, a1[i], (short)-123); 1.364 + } 1.365 + for (int i=ARRLEN-UNALIGN_OFF; i<ARRLEN; i++) { 1.366 + errn += verify("test_cp_unalnsrc: a1", i, a1[i], (short)123); 1.367 + } 1.368 + for (int i=0; i<ARRLEN; i++) { 1.369 + a1[i] = -1; 1.370 + a2[i] = -1; 1.371 + } 1.372 + test_2ci_unaln(a1, a2); 1.373 + for (int i=0; i<UNALIGN_OFF; i++) { 1.374 + errn += verify("test_2ci_unaln: a1", i, a1[i], (short)-1); 1.375 + } 1.376 + for (int i=UNALIGN_OFF; i<ARRLEN; i++) { 1.377 + errn += verify("test_2ci_unaln: a1", i, a1[i], (short)-123); 1.378 + } 1.379 + for (int i=0; i<ARRLEN-UNALIGN_OFF; i++) { 1.380 + errn += verify("test_2ci_unaln: a2", i, a2[i], (short)-103); 1.381 + } 1.382 + for (int i=ARRLEN-UNALIGN_OFF; i<ARRLEN; i++) { 1.383 + errn += verify("test_2ci_unaln: a2", i, a2[i], (short)-1); 1.384 + } 1.385 + for (int i=0; i<ARRLEN; i++) { 1.386 + a1[i] = -1; 1.387 + a2[i] = -1; 1.388 + } 1.389 + test_2vi_unaln(a1, a2, (short)123, (short)103); 1.390 + for (int i=0; i<ARRLEN-UNALIGN_OFF; i++) { 1.391 + errn += verify("test_2vi_unaln: a1", i, a1[i], (short)123); 1.392 + } 1.393 + for (int i=ARRLEN-UNALIGN_OFF; i<ARRLEN; i++) { 1.394 + errn += verify("test_2vi_unaln: a1", i, a1[i], (short)-1); 1.395 + } 1.396 + for (int i=0; i<UNALIGN_OFF; i++) { 1.397 + errn += verify("test_2vi_unaln: a2", i, a2[i], (short)-1); 1.398 + } 1.399 + for (int i=UNALIGN_OFF; i<ARRLEN; i++) { 1.400 + errn += verify("test_2vi_unaln: a2", i, a2[i], (short)103); 1.401 + } 1.402 + 1.403 + // Reset for aligned overlap initialization 1.404 + for (int i=0; i<ALIGN_OFF; i++) { 1.405 + a1[i] = (short)i; 1.406 + } 1.407 + for (int i=ALIGN_OFF; i<ARRLEN; i++) { 1.408 + a1[i] = -1; 1.409 + } 1.410 + test_cp_alndst(a1, a1); 1.411 + for (int i=0; i<ARRLEN; i++) { 1.412 + int v = i%ALIGN_OFF; 1.413 + errn += verify("test_cp_alndst_overlap: a1", i, a1[i], (short)v); 1.414 + } 1.415 + for (int i=0; i<ALIGN_OFF; i++) { 1.416 + a1[i+ALIGN_OFF] = -1; 1.417 + } 1.418 + test_cp_alnsrc(a1, a1); 1.419 + for (int i=0; i<ALIGN_OFF; i++) { 1.420 + errn += verify("test_cp_alnsrc_overlap: a1", i, a1[i], (short)-1); 1.421 + } 1.422 + for (int i=ALIGN_OFF; i<ARRLEN; i++) { 1.423 + int v = i%ALIGN_OFF; 1.424 + errn += verify("test_cp_alnsrc_overlap: a1", i, a1[i], (short)v); 1.425 + } 1.426 + for (int i=0; i<ARRLEN; i++) { 1.427 + a1[i] = -1; 1.428 + } 1.429 + test_2ci_aln(a1, a1); 1.430 + for (int i=0; i<ARRLEN-ALIGN_OFF; i++) { 1.431 + errn += verify("test_2ci_aln_overlap: a1", i, a1[i], (short)-103); 1.432 + } 1.433 + for (int i=ARRLEN-ALIGN_OFF; i<ARRLEN; i++) { 1.434 + errn += verify("test_2ci_aln_overlap: a1", i, a1[i], (short)-123); 1.435 + } 1.436 + for (int i=0; i<ARRLEN; i++) { 1.437 + a1[i] = -1; 1.438 + } 1.439 + test_2vi_aln(a1, a1, (short)123, (short)103); 1.440 + for (int i=0; i<ARRLEN-ALIGN_OFF; i++) { 1.441 + errn += verify("test_2vi_aln_overlap: a1", i, a1[i], (short)123); 1.442 + } 1.443 + for (int i=ARRLEN-ALIGN_OFF; i<ARRLEN; i++) { 1.444 + errn += verify("test_2vi_aln_overlap: a1", i, a1[i], (short)103); 1.445 + } 1.446 + 1.447 + // Reset for unaligned overlap initialization 1.448 + for (int i=0; i<UNALIGN_OFF; i++) { 1.449 + a1[i] = (short)i; 1.450 + } 1.451 + for (int i=UNALIGN_OFF; i<ARRLEN; i++) { 1.452 + a1[i] = -1; 1.453 + } 1.454 + test_cp_unalndst(a1, a1); 1.455 + for (int i=0; i<ARRLEN; i++) { 1.456 + int v = i%UNALIGN_OFF; 1.457 + errn += verify("test_cp_unalndst_overlap: a1", i, a1[i], (short)v); 1.458 + } 1.459 + for (int i=0; i<UNALIGN_OFF; i++) { 1.460 + a1[i+UNALIGN_OFF] = -1; 1.461 + } 1.462 + test_cp_unalnsrc(a1, a1); 1.463 + for (int i=0; i<UNALIGN_OFF; i++) { 1.464 + errn += verify("test_cp_unalnsrc_overlap: a1", i, a1[i], (short)-1); 1.465 + } 1.466 + for (int i=UNALIGN_OFF; i<ARRLEN; i++) { 1.467 + int v = i%UNALIGN_OFF; 1.468 + errn += verify("test_cp_unalnsrc_overlap: a1", i, a1[i], (short)v); 1.469 + } 1.470 + for (int i=0; i<ARRLEN; i++) { 1.471 + a1[i] = -1; 1.472 + } 1.473 + test_2ci_unaln(a1, a1); 1.474 + for (int i=0; i<ARRLEN-UNALIGN_OFF; i++) { 1.475 + errn += verify("test_2ci_unaln_overlap: a1", i, a1[i], (short)-103); 1.476 + } 1.477 + for (int i=ARRLEN-UNALIGN_OFF; i<ARRLEN; i++) { 1.478 + errn += verify("test_2ci_unaln_overlap: a1", i, a1[i], (short)-123); 1.479 + } 1.480 + for (int i=0; i<ARRLEN; i++) { 1.481 + a1[i] = -1; 1.482 + } 1.483 + test_2vi_unaln(a1, a1, (short)123, (short)103); 1.484 + for (int i=0; i<ARRLEN-UNALIGN_OFF; i++) { 1.485 + errn += verify("test_2vi_unaln_overlap: a1", i, a1[i], (short)123); 1.486 + } 1.487 + for (int i=ARRLEN-UNALIGN_OFF; i<ARRLEN; i++) { 1.488 + errn += verify("test_2vi_unaln_overlap: a1", i, a1[i], (short)103); 1.489 + } 1.490 + 1.491 + } 1.492 + 1.493 + if (errn > 0) 1.494 + return errn; 1.495 + 1.496 + System.out.println("Time"); 1.497 + long start, end; 1.498 + start = System.currentTimeMillis(); 1.499 + for (int i=0; i<ITERS; i++) { 1.500 + test_ci(a1); 1.501 + } 1.502 + end = System.currentTimeMillis(); 1.503 + System.out.println("test_ci: " + (end - start)); 1.504 + start = System.currentTimeMillis(); 1.505 + for (int i=0; i<ITERS; i++) { 1.506 + test_vi(a2, (short)123); 1.507 + } 1.508 + end = System.currentTimeMillis(); 1.509 + System.out.println("test_vi: " + (end - start)); 1.510 + start = System.currentTimeMillis(); 1.511 + for (int i=0; i<ITERS; i++) { 1.512 + test_cp(a1, a2); 1.513 + } 1.514 + end = System.currentTimeMillis(); 1.515 + System.out.println("test_cp: " + (end - start)); 1.516 + start = System.currentTimeMillis(); 1.517 + for (int i=0; i<ITERS; i++) { 1.518 + test_2ci(a1, a2); 1.519 + } 1.520 + end = System.currentTimeMillis(); 1.521 + System.out.println("test_2ci: " + (end - start)); 1.522 + start = System.currentTimeMillis(); 1.523 + for (int i=0; i<ITERS; i++) { 1.524 + test_2vi(a1, a2, (short)123, (short)103); 1.525 + } 1.526 + end = System.currentTimeMillis(); 1.527 + System.out.println("test_2vi: " + (end - start)); 1.528 + 1.529 + start = System.currentTimeMillis(); 1.530 + for (int i=0; i<ITERS; i++) { 1.531 + test_ci_neg(a1); 1.532 + } 1.533 + end = System.currentTimeMillis(); 1.534 + System.out.println("test_ci_neg: " + (end - start)); 1.535 + start = System.currentTimeMillis(); 1.536 + for (int i=0; i<ITERS; i++) { 1.537 + test_vi_neg(a2, (short)123); 1.538 + } 1.539 + end = System.currentTimeMillis(); 1.540 + System.out.println("test_vi_neg: " + (end - start)); 1.541 + start = System.currentTimeMillis(); 1.542 + for (int i=0; i<ITERS; i++) { 1.543 + test_cp_neg(a1, a2); 1.544 + } 1.545 + end = System.currentTimeMillis(); 1.546 + System.out.println("test_cp_neg: " + (end - start)); 1.547 + start = System.currentTimeMillis(); 1.548 + for (int i=0; i<ITERS; i++) { 1.549 + test_2ci_neg(a1, a2); 1.550 + } 1.551 + end = System.currentTimeMillis(); 1.552 + System.out.println("test_2ci_neg: " + (end - start)); 1.553 + start = System.currentTimeMillis(); 1.554 + for (int i=0; i<ITERS; i++) { 1.555 + test_2vi_neg(a1, a2, (short)123, (short)103); 1.556 + } 1.557 + end = System.currentTimeMillis(); 1.558 + System.out.println("test_2vi_neg: " + (end - start)); 1.559 + 1.560 + start = System.currentTimeMillis(); 1.561 + for (int i=0; i<ITERS; i++) { 1.562 + test_ci_oppos(a1); 1.563 + } 1.564 + end = System.currentTimeMillis(); 1.565 + System.out.println("test_ci_oppos: " + (end - start)); 1.566 + start = System.currentTimeMillis(); 1.567 + for (int i=0; i<ITERS; i++) { 1.568 + test_vi_oppos(a2, (short)123); 1.569 + } 1.570 + end = System.currentTimeMillis(); 1.571 + System.out.println("test_vi_oppos: " + (end - start)); 1.572 + start = System.currentTimeMillis(); 1.573 + for (int i=0; i<ITERS; i++) { 1.574 + test_cp_oppos(a1, a2); 1.575 + } 1.576 + end = System.currentTimeMillis(); 1.577 + System.out.println("test_cp_oppos: " + (end - start)); 1.578 + start = System.currentTimeMillis(); 1.579 + for (int i=0; i<ITERS; i++) { 1.580 + test_2ci_oppos(a1, a2); 1.581 + } 1.582 + end = System.currentTimeMillis(); 1.583 + System.out.println("test_2ci_oppos: " + (end - start)); 1.584 + start = System.currentTimeMillis(); 1.585 + for (int i=0; i<ITERS; i++) { 1.586 + test_2vi_oppos(a1, a2, (short)123, (short)103); 1.587 + } 1.588 + end = System.currentTimeMillis(); 1.589 + System.out.println("test_2vi_oppos: " + (end - start)); 1.590 + 1.591 + start = System.currentTimeMillis(); 1.592 + for (int i=0; i<ITERS; i++) { 1.593 + test_ci_off(a1); 1.594 + } 1.595 + end = System.currentTimeMillis(); 1.596 + System.out.println("test_ci_off: " + (end - start)); 1.597 + start = System.currentTimeMillis(); 1.598 + for (int i=0; i<ITERS; i++) { 1.599 + test_vi_off(a2, (short)123); 1.600 + } 1.601 + end = System.currentTimeMillis(); 1.602 + System.out.println("test_vi_off: " + (end - start)); 1.603 + start = System.currentTimeMillis(); 1.604 + for (int i=0; i<ITERS; i++) { 1.605 + test_cp_off(a1, a2); 1.606 + } 1.607 + end = System.currentTimeMillis(); 1.608 + System.out.println("test_cp_off: " + (end - start)); 1.609 + start = System.currentTimeMillis(); 1.610 + for (int i=0; i<ITERS; i++) { 1.611 + test_2ci_off(a1, a2); 1.612 + } 1.613 + end = System.currentTimeMillis(); 1.614 + System.out.println("test_2ci_off: " + (end - start)); 1.615 + start = System.currentTimeMillis(); 1.616 + for (int i=0; i<ITERS; i++) { 1.617 + test_2vi_off(a1, a2, (short)123, (short)103); 1.618 + } 1.619 + end = System.currentTimeMillis(); 1.620 + System.out.println("test_2vi_off: " + (end - start)); 1.621 + 1.622 + start = System.currentTimeMillis(); 1.623 + for (int i=0; i<ITERS; i++) { 1.624 + test_ci_inv(a1, OFFSET); 1.625 + } 1.626 + end = System.currentTimeMillis(); 1.627 + System.out.println("test_ci_inv: " + (end - start)); 1.628 + start = System.currentTimeMillis(); 1.629 + for (int i=0; i<ITERS; i++) { 1.630 + test_vi_inv(a2, (short)123, OFFSET); 1.631 + } 1.632 + end = System.currentTimeMillis(); 1.633 + System.out.println("test_vi_inv: " + (end - start)); 1.634 + start = System.currentTimeMillis(); 1.635 + for (int i=0; i<ITERS; i++) { 1.636 + test_cp_inv(a1, a2, OFFSET); 1.637 + } 1.638 + end = System.currentTimeMillis(); 1.639 + System.out.println("test_cp_inv: " + (end - start)); 1.640 + start = System.currentTimeMillis(); 1.641 + for (int i=0; i<ITERS; i++) { 1.642 + test_2ci_inv(a1, a2, OFFSET); 1.643 + } 1.644 + end = System.currentTimeMillis(); 1.645 + System.out.println("test_2ci_inv: " + (end - start)); 1.646 + start = System.currentTimeMillis(); 1.647 + for (int i=0; i<ITERS; i++) { 1.648 + test_2vi_inv(a1, a2, (short)123, (short)103, OFFSET); 1.649 + } 1.650 + end = System.currentTimeMillis(); 1.651 + System.out.println("test_2vi_inv: " + (end - start)); 1.652 + 1.653 + start = System.currentTimeMillis(); 1.654 + for (int i=0; i<ITERS; i++) { 1.655 + test_ci_scl(a1); 1.656 + } 1.657 + end = System.currentTimeMillis(); 1.658 + System.out.println("test_ci_scl: " + (end - start)); 1.659 + start = System.currentTimeMillis(); 1.660 + for (int i=0; i<ITERS; i++) { 1.661 + test_vi_scl(a2, (short)123); 1.662 + } 1.663 + end = System.currentTimeMillis(); 1.664 + System.out.println("test_vi_scl: " + (end - start)); 1.665 + start = System.currentTimeMillis(); 1.666 + for (int i=0; i<ITERS; i++) { 1.667 + test_cp_scl(a1, a2); 1.668 + } 1.669 + end = System.currentTimeMillis(); 1.670 + System.out.println("test_cp_scl: " + (end - start)); 1.671 + start = System.currentTimeMillis(); 1.672 + for (int i=0; i<ITERS; i++) { 1.673 + test_2ci_scl(a1, a2); 1.674 + } 1.675 + end = System.currentTimeMillis(); 1.676 + System.out.println("test_2ci_scl: " + (end - start)); 1.677 + start = System.currentTimeMillis(); 1.678 + for (int i=0; i<ITERS; i++) { 1.679 + test_2vi_scl(a1, a2, (short)123, (short)103); 1.680 + } 1.681 + end = System.currentTimeMillis(); 1.682 + System.out.println("test_2vi_scl: " + (end - start)); 1.683 + 1.684 + start = System.currentTimeMillis(); 1.685 + for (int i=0; i<ITERS; i++) { 1.686 + test_cp_alndst(a1, a2); 1.687 + } 1.688 + end = System.currentTimeMillis(); 1.689 + System.out.println("test_cp_alndst: " + (end - start)); 1.690 + start = System.currentTimeMillis(); 1.691 + for (int i=0; i<ITERS; i++) { 1.692 + test_cp_alnsrc(a1, a2); 1.693 + } 1.694 + end = System.currentTimeMillis(); 1.695 + System.out.println("test_cp_alnsrc: " + (end - start)); 1.696 + start = System.currentTimeMillis(); 1.697 + for (int i=0; i<ITERS; i++) { 1.698 + test_2ci_aln(a1, a2); 1.699 + } 1.700 + end = System.currentTimeMillis(); 1.701 + System.out.println("test_2ci_aln: " + (end - start)); 1.702 + start = System.currentTimeMillis(); 1.703 + for (int i=0; i<ITERS; i++) { 1.704 + test_2vi_aln(a1, a2, (short)123, (short)103); 1.705 + } 1.706 + end = System.currentTimeMillis(); 1.707 + System.out.println("test_2vi_aln: " + (end - start)); 1.708 + 1.709 + start = System.currentTimeMillis(); 1.710 + for (int i=0; i<ITERS; i++) { 1.711 + test_cp_unalndst(a1, a2); 1.712 + } 1.713 + end = System.currentTimeMillis(); 1.714 + System.out.println("test_cp_unalndst: " + (end - start)); 1.715 + start = System.currentTimeMillis(); 1.716 + for (int i=0; i<ITERS; i++) { 1.717 + test_cp_unalnsrc(a1, a2); 1.718 + } 1.719 + end = System.currentTimeMillis(); 1.720 + System.out.println("test_cp_unalnsrc: " + (end - start)); 1.721 + start = System.currentTimeMillis(); 1.722 + for (int i=0; i<ITERS; i++) { 1.723 + test_2ci_unaln(a1, a2); 1.724 + } 1.725 + end = System.currentTimeMillis(); 1.726 + System.out.println("test_2ci_unaln: " + (end - start)); 1.727 + start = System.currentTimeMillis(); 1.728 + for (int i=0; i<ITERS; i++) { 1.729 + test_2vi_unaln(a1, a2, (short)123, (short)103); 1.730 + } 1.731 + end = System.currentTimeMillis(); 1.732 + System.out.println("test_2vi_unaln: " + (end - start)); 1.733 + 1.734 + return errn; 1.735 + } 1.736 + 1.737 + static void test_ci(short[] a) { 1.738 + for (int i = 0; i < a.length; i+=1) { 1.739 + a[i] = -123; 1.740 + } 1.741 + } 1.742 + static void test_vi(short[] a, short b) { 1.743 + for (int i = 0; i < a.length; i+=1) { 1.744 + a[i] = b; 1.745 + } 1.746 + } 1.747 + static void test_cp(short[] a, short[] b) { 1.748 + for (int i = 0; i < a.length; i+=1) { 1.749 + a[i] = b[i]; 1.750 + } 1.751 + } 1.752 + static void test_2ci(short[] a, short[] b) { 1.753 + for (int i = 0; i < a.length; i+=1) { 1.754 + a[i] = -123; 1.755 + b[i] = -103; 1.756 + } 1.757 + } 1.758 + static void test_2vi(short[] a, short[] b, short c, short d) { 1.759 + for (int i = 0; i < a.length; i+=1) { 1.760 + a[i] = c; 1.761 + b[i] = d; 1.762 + } 1.763 + } 1.764 + static void test_ci_neg(short[] a) { 1.765 + for (int i = a.length-1; i >= 0; i-=1) { 1.766 + a[i] = -123; 1.767 + } 1.768 + } 1.769 + static void test_vi_neg(short[] a, short b) { 1.770 + for (int i = a.length-1; i >= 0; i-=1) { 1.771 + a[i] = b; 1.772 + } 1.773 + } 1.774 + static void test_cp_neg(short[] a, short[] b) { 1.775 + for (int i = a.length-1; i >= 0; i-=1) { 1.776 + a[i] = b[i]; 1.777 + } 1.778 + } 1.779 + static void test_2ci_neg(short[] a, short[] b) { 1.780 + for (int i = a.length-1; i >= 0; i-=1) { 1.781 + a[i] = -123; 1.782 + b[i] = -103; 1.783 + } 1.784 + } 1.785 + static void test_2vi_neg(short[] a, short[] b, short c, short d) { 1.786 + for (int i = a.length-1; i >= 0; i-=1) { 1.787 + a[i] = c; 1.788 + b[i] = d; 1.789 + } 1.790 + } 1.791 + static void test_ci_oppos(short[] a) { 1.792 + int limit = a.length-1; 1.793 + for (int i = 0; i < a.length; i+=1) { 1.794 + a[limit-i] = -123; 1.795 + } 1.796 + } 1.797 + static void test_vi_oppos(short[] a, short b) { 1.798 + int limit = a.length-1; 1.799 + for (int i = limit; i >= 0; i-=1) { 1.800 + a[limit-i] = b; 1.801 + } 1.802 + } 1.803 + static void test_cp_oppos(short[] a, short[] b) { 1.804 + int limit = a.length-1; 1.805 + for (int i = 0; i < a.length; i+=1) { 1.806 + a[i] = b[limit-i]; 1.807 + } 1.808 + } 1.809 + static void test_2ci_oppos(short[] a, short[] b) { 1.810 + int limit = a.length-1; 1.811 + for (int i = 0; i < a.length; i+=1) { 1.812 + a[limit-i] = -123; 1.813 + b[i] = -103; 1.814 + } 1.815 + } 1.816 + static void test_2vi_oppos(short[] a, short[] b, short c, short d) { 1.817 + int limit = a.length-1; 1.818 + for (int i = limit; i >= 0; i-=1) { 1.819 + a[i] = c; 1.820 + b[limit-i] = d; 1.821 + } 1.822 + } 1.823 + static void test_ci_off(short[] a) { 1.824 + for (int i = 0; i < a.length-OFFSET; i+=1) { 1.825 + a[i+OFFSET] = -123; 1.826 + } 1.827 + } 1.828 + static void test_vi_off(short[] a, short b) { 1.829 + for (int i = 0; i < a.length-OFFSET; i+=1) { 1.830 + a[i+OFFSET] = b; 1.831 + } 1.832 + } 1.833 + static void test_cp_off(short[] a, short[] b) { 1.834 + for (int i = 0; i < a.length-OFFSET; i+=1) { 1.835 + a[i+OFFSET] = b[i+OFFSET]; 1.836 + } 1.837 + } 1.838 + static void test_2ci_off(short[] a, short[] b) { 1.839 + for (int i = 0; i < a.length-OFFSET; i+=1) { 1.840 + a[i+OFFSET] = -123; 1.841 + b[i+OFFSET] = -103; 1.842 + } 1.843 + } 1.844 + static void test_2vi_off(short[] a, short[] b, short c, short d) { 1.845 + for (int i = 0; i < a.length-OFFSET; i+=1) { 1.846 + a[i+OFFSET] = c; 1.847 + b[i+OFFSET] = d; 1.848 + } 1.849 + } 1.850 + static void test_ci_inv(short[] a, int k) { 1.851 + for (int i = 0; i < a.length-k; i+=1) { 1.852 + a[i+k] = -123; 1.853 + } 1.854 + } 1.855 + static void test_vi_inv(short[] a, short b, int k) { 1.856 + for (int i = 0; i < a.length-k; i+=1) { 1.857 + a[i+k] = b; 1.858 + } 1.859 + } 1.860 + static void test_cp_inv(short[] a, short[] b, int k) { 1.861 + for (int i = 0; i < a.length-k; i+=1) { 1.862 + a[i+k] = b[i+k]; 1.863 + } 1.864 + } 1.865 + static void test_2ci_inv(short[] a, short[] b, int k) { 1.866 + for (int i = 0; i < a.length-k; i+=1) { 1.867 + a[i+k] = -123; 1.868 + b[i+k] = -103; 1.869 + } 1.870 + } 1.871 + static void test_2vi_inv(short[] a, short[] b, short c, short d, int k) { 1.872 + for (int i = 0; i < a.length-k; i+=1) { 1.873 + a[i+k] = c; 1.874 + b[i+k] = d; 1.875 + } 1.876 + } 1.877 + static void test_ci_scl(short[] a) { 1.878 + for (int i = 0; i*SCALE < a.length; i+=1) { 1.879 + a[i*SCALE] = -123; 1.880 + } 1.881 + } 1.882 + static void test_vi_scl(short[] a, short b) { 1.883 + for (int i = 0; i*SCALE < a.length; i+=1) { 1.884 + a[i*SCALE] = b; 1.885 + } 1.886 + } 1.887 + static void test_cp_scl(short[] a, short[] b) { 1.888 + for (int i = 0; i*SCALE < a.length; i+=1) { 1.889 + a[i*SCALE] = b[i*SCALE]; 1.890 + } 1.891 + } 1.892 + static void test_2ci_scl(short[] a, short[] b) { 1.893 + for (int i = 0; i*SCALE < a.length; i+=1) { 1.894 + a[i*SCALE] = -123; 1.895 + b[i*SCALE] = -103; 1.896 + } 1.897 + } 1.898 + static void test_2vi_scl(short[] a, short[] b, short c, short d) { 1.899 + for (int i = 0; i*SCALE < a.length; i+=1) { 1.900 + a[i*SCALE] = c; 1.901 + b[i*SCALE] = d; 1.902 + } 1.903 + } 1.904 + static void test_cp_alndst(short[] a, short[] b) { 1.905 + for (int i = 0; i < a.length-ALIGN_OFF; i+=1) { 1.906 + a[i+ALIGN_OFF] = b[i]; 1.907 + } 1.908 + } 1.909 + static void test_cp_alnsrc(short[] a, short[] b) { 1.910 + for (int i = 0; i < a.length-ALIGN_OFF; i+=1) { 1.911 + a[i] = b[i+ALIGN_OFF]; 1.912 + } 1.913 + } 1.914 + static void test_2ci_aln(short[] a, short[] b) { 1.915 + for (int i = 0; i < a.length-ALIGN_OFF; i+=1) { 1.916 + a[i+ALIGN_OFF] = -123; 1.917 + b[i] = -103; 1.918 + } 1.919 + } 1.920 + static void test_2vi_aln(short[] a, short[] b, short c, short d) { 1.921 + for (int i = 0; i < a.length-ALIGN_OFF; i+=1) { 1.922 + a[i] = c; 1.923 + b[i+ALIGN_OFF] = d; 1.924 + } 1.925 + } 1.926 + static void test_cp_unalndst(short[] a, short[] b) { 1.927 + for (int i = 0; i < a.length-UNALIGN_OFF; i+=1) { 1.928 + a[i+UNALIGN_OFF] = b[i]; 1.929 + } 1.930 + } 1.931 + static void test_cp_unalnsrc(short[] a, short[] b) { 1.932 + for (int i = 0; i < a.length-UNALIGN_OFF; i+=1) { 1.933 + a[i] = b[i+UNALIGN_OFF]; 1.934 + } 1.935 + } 1.936 + static void test_2ci_unaln(short[] a, short[] b) { 1.937 + for (int i = 0; i < a.length-UNALIGN_OFF; i+=1) { 1.938 + a[i+UNALIGN_OFF] = -123; 1.939 + b[i] = -103; 1.940 + } 1.941 + } 1.942 + static void test_2vi_unaln(short[] a, short[] b, short c, short d) { 1.943 + for (int i = 0; i < a.length-UNALIGN_OFF; i+=1) { 1.944 + a[i] = c; 1.945 + b[i+UNALIGN_OFF] = d; 1.946 + } 1.947 + } 1.948 + 1.949 + static int verify(String text, int i, short elem, short val) { 1.950 + if (elem != val) { 1.951 + System.err.println(text + "[" + i + "] = " + elem + " != " + val); 1.952 + return 1; 1.953 + } 1.954 + return 0; 1.955 + } 1.956 +}