Wed, 21 May 2014 10:56:41 -0700
Added tag jdk8u20-b15 for changeset 8c785f9bde6f
/*
 * Copyright (c) 2012, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 *
 */

/**
 * @test
 * @bug 7119644
 * @summary Increase superword's vector size up to 256 bits
 *
 * @run main/othervm/timeout=300 -Xbatch -XX:+IgnoreUnrecognizedVMOptions -XX:-TieredCompilation -XX:-OptimizeFill TestByteFloatVect
 */

/**
 * Runs a family of small counted loops ("kernels") that each touch a
 * {@code byte[]} and a {@code float[]} in the same iteration, then checks that
 * every array element holds the expected value.
 *
 * <p>Kernel naming, as established by the loop bodies below:
 * <ul>
 *   <li>{@code ci} stores compile-time constants, {@code vi} stores the values
 *       passed as arguments, {@code cp} copies from one array to another;</li>
 *   <li>{@code neg} walks the index downwards, {@code oppos} walks the two
 *       arrays in opposite directions;</li>
 *   <li>{@code aln}/{@code unaln} shift one side of the access by
 *       {@link #ALIGN_OFF} / {@link #UNALIGN_OFF} elements.</li>
 * </ul>
 *
 * <p>The program prints {@code PASSED} on success and exits with status 97
 * after printing the number of mismatches otherwise.
 */
public class TestByteFloatVect {
  /** Length of every working array. */
  private static final int ARRLEN = 997;
  /** Number of times each kernel is invoked during warmup and timing. */
  private static final int ITERS = 11000;
  /** Element offset used by the {@code aln} kernels. */
  private static final int ALIGN_OFF = 8;
  /** Element offset used by the {@code unaln} kernels. */
  private static final int UNALIGN_OFF = 5;

  public static void main(String[] args) {
    System.out.println("Testing Byte + Float vectors");
    int errn = test();
    if (errn > 0) {
      System.err.println("FAILED: " + errn + " errors");
      System.exit(97);
    }
    System.out.println("PASSED");
  }

  /**
   * Warms up every kernel, verifies the kernels' results and, if no mismatch
   * was found, prints a wall-clock timing line per kernel.
   *
   * @return the number of mismatching elements found (0 on success)
   */
  static int test() {
    byte[] a1 = new byte[ARRLEN];
    byte[] a2 = new byte[ARRLEN];
    float[] b1 = new float[ARRLEN];
    float[] b2 = new float[ARRLEN];

    System.out.println("Warmup");
    warmup(a1, a2, b1, b2);

    // Initialize
    fill(a1, (byte)-1, b1, -1.f);
    fill(a2, (byte)-1, b2, -1.f);

    // Test and verify results
    System.out.println("Verification");
    int errn = verifyResults(a1, a2, b1, b2);
    if (errn > 0) {
      return errn;
    }

    System.out.println("Time");
    timeKernels(a1, a2, b1, b2);
    return errn;
  }

  /** Invokes every kernel {@link #ITERS} times; the array contents are irrelevant here. */
  private static void warmup(byte[] a1, byte[] a2, float[] b1, float[] b2) {
    for (int i = 0; i < ITERS; i++) {
      test_ci(a1, b1);
      test_vi(a2, b2, (byte)123, 103.f);
      test_cp(a1, a2, b1, b2);
      test_ci_neg(a1, b1);
      test_vi_neg(a1, b1, (byte)123, 103.f);
      test_cp_neg(a1, a2, b1, b2);
      test_ci_oppos(a1, b1);
      test_vi_oppos(a1, b1, (byte)123, 103.f);
      test_cp_oppos(a1, a2, b1, b2);
      test_ci_aln(a1, b1);
      test_vi_aln(a1, b1, (byte)123, 103.f);
      test_cp_alndst(a1, a2, b1, b2);
      test_cp_alnsrc(a1, a2, b1, b2);
      test_ci_unaln(a1, b1);
      test_vi_unaln(a1, b1, (byte)123, 103.f);
      test_cp_unalndst(a1, a2, b1, b2);
      test_cp_unalnsrc(a1, a2, b1, b2);
    }
  }

  /**
   * Runs each kernel once on freshly prepared arrays and compares every
   * element with its expected value. Mismatches are reported on
   * {@code System.err} by {@link #verify(String, int, byte, byte)} and
   * {@link #verify(String, int, float, float)}.
   *
   * <p>All four arrays must have length {@link #ARRLEN}; the steps run in a
   * fixed order because later steps reuse values left behind by earlier ones
   * (for example {@code test_cp} copies what {@code test_vi} stored).
   *
   * @return the total number of mismatching elements
   */
  static int verifyResults(byte[] a1, byte[] a2, float[] b1, float[] b2) {
    int errn = 0;

    test_ci(a1, b1);
    errn += verifyPair("test_ci: a1", a1, (byte)-123, "test_ci: b1", b1, -103.f, 0, ARRLEN);
    test_vi(a2, b2, (byte)123, 103.f);
    errn += verifyPair("test_vi: a2", a2, (byte)123, "test_vi: b2", b2, 103.f, 0, ARRLEN);
    test_cp(a1, a2, b1, b2);
    errn += verifyPair("test_cp: a1", a1, (byte)123, "test_cp: b1", b1, 103.f, 0, ARRLEN);

    // Reset for negative stride
    fill(a1, (byte)-1, b1, -1.f);
    fill(a2, (byte)-1, b2, -1.f);
    test_ci_neg(a1, b1);
    errn += verifyPair("test_ci_neg: a1", a1, (byte)-123, "test_ci_neg: b1", b1, -103.f, 0, ARRLEN);
    test_vi_neg(a2, b2, (byte)123, 103.f);
    errn += verifyPair("test_vi_neg: a2", a2, (byte)123, "test_vi_neg: b2", b2, 103.f, 0, ARRLEN);
    test_cp_neg(a1, a2, b1, b2);
    errn += verifyPair("test_cp_neg: a1", a1, (byte)123, "test_cp_neg: b1", b1, 103.f, 0, ARRLEN);

    // Reset for opposite stride
    fill(a1, (byte)-1, b1, -1.f);
    fill(a2, (byte)-1, b2, -1.f);
    test_ci_oppos(a1, b1);
    errn += verifyPair("test_ci_oppos: a1", a1, (byte)-123, "test_ci_oppos: b1", b1, -103.f, 0, ARRLEN);
    test_vi_oppos(a2, b2, (byte)123, 103.f);
    errn += verifyPair("test_vi_oppos: a2", a2, (byte)123, "test_vi_oppos: b2", b2, 103.f, 0, ARRLEN);
    test_cp_oppos(a1, a2, b1, b2);
    errn += verifyPair("test_cp_oppos: a1", a1, (byte)123, "test_cp_oppos: b1", b1, 103.f, 0, ARRLEN);

    // Reset for 2 arrays with relative aligned offset
    fill(a1, (byte)-1, b1, -1.f);
    fill(a2, (byte)123, b2, 123.f);
    test_cp_alndst(a1, a2, b1, b2);
    // The first ALIGN_OFF destination slots are never written by the kernel.
    errn += verifyPair("test_cp_alndst: a1", a1, (byte)-1, "test_cp_alndst: b1", b1, -1.f, 0, ALIGN_OFF);
    errn += verifyPair("test_cp_alndst: a1", a1, (byte)123, "test_cp_alndst: b1", b1, 123.f, ALIGN_OFF, ARRLEN);
    fill(a2, (byte)-123, b2, -123.f);
    test_cp_alnsrc(a1, a2, b1, b2);
    // The last ALIGN_OFF destination slots keep the values of the previous step.
    errn += verifyPair("test_cp_alnsrc: a1", a1, (byte)-123, "test_cp_alnsrc: b1", b1, -123.f, 0, ARRLEN-ALIGN_OFF);
    errn += verifyPair("test_cp_alnsrc: a1", a1, (byte)123, "test_cp_alnsrc: b1", b1, 123.f, ARRLEN-ALIGN_OFF, ARRLEN);

    fill(a1, (byte)-1, b1, -1.f);
    test_ci_aln(a1, b1);
    errn += verifyRange("test_ci_aln: a1", a1, (byte)-1, 0, ALIGN_OFF);
    errn += verifyRange("test_ci_aln: a1", a1, (byte)-123, ALIGN_OFF, ARRLEN);
    errn += verifyRange("test_ci_aln: b1", b1, -103.f, 0, ARRLEN-ALIGN_OFF);
    errn += verifyRange("test_ci_aln: b1", b1, -1.f, ARRLEN-ALIGN_OFF, ARRLEN);

    fill(a1, (byte)-1, b1, -1.f);
    test_vi_aln(a1, b1, (byte)123, 103.f);
    errn += verifyRange("test_vi_aln: a1", a1, (byte)123, 0, ARRLEN-ALIGN_OFF);
    errn += verifyRange("test_vi_aln: a1", a1, (byte)-1, ARRLEN-ALIGN_OFF, ARRLEN);
    errn += verifyRange("test_vi_aln: b1", b1, -1.f, 0, ALIGN_OFF);
    errn += verifyRange("test_vi_aln: b1", b1, 103.f, ALIGN_OFF, ARRLEN);

    // Reset for 2 arrays with relative unaligned offset
    fill(a1, (byte)-1, b1, -1.f);
    fill(a2, (byte)123, b2, 123.f);
    test_cp_unalndst(a1, a2, b1, b2);
    errn += verifyPair("test_cp_unalndst: a1", a1, (byte)-1, "test_cp_unalndst: b1", b1, -1.f, 0, UNALIGN_OFF);
    errn += verifyPair("test_cp_unalndst: a1", a1, (byte)123, "test_cp_unalndst: b1", b1, 123.f, UNALIGN_OFF, ARRLEN);
    fill(a2, (byte)-123, b2, -123.f);
    test_cp_unalnsrc(a1, a2, b1, b2);
    errn += verifyPair("test_cp_unalnsrc: a1", a1, (byte)-123, "test_cp_unalnsrc: b1", b1, -123.f, 0, ARRLEN-UNALIGN_OFF);
    errn += verifyPair("test_cp_unalnsrc: a1", a1, (byte)123, "test_cp_unalnsrc: b1", b1, 123.f, ARRLEN-UNALIGN_OFF, ARRLEN);

    fill(a1, (byte)-1, b1, -1.f);
    test_ci_unaln(a1, b1);
    errn += verifyRange("test_ci_unaln: a1", a1, (byte)-1, 0, UNALIGN_OFF);
    errn += verifyRange("test_ci_unaln: a1", a1, (byte)-123, UNALIGN_OFF, ARRLEN);
    errn += verifyRange("test_ci_unaln: b1", b1, -103.f, 0, ARRLEN-UNALIGN_OFF);
    errn += verifyRange("test_ci_unaln: b1", b1, -1.f, ARRLEN-UNALIGN_OFF, ARRLEN);

    fill(a1, (byte)-1, b1, -1.f);
    test_vi_unaln(a1, b1, (byte)123, 103.f);
    errn += verifyRange("test_vi_unaln: a1", a1, (byte)123, 0, ARRLEN-UNALIGN_OFF);
    errn += verifyRange("test_vi_unaln: a1", a1, (byte)-1, ARRLEN-UNALIGN_OFF, ARRLEN);
    errn += verifyRange("test_vi_unaln: b1", b1, -1.f, 0, UNALIGN_OFF);
    errn += verifyRange("test_vi_unaln: b1", b1, 103.f, UNALIGN_OFF, ARRLEN);

    // Reset for aligned overlap initialization
    initOverlap(a1, b1, ALIGN_OFF);
    // Source and destination are the same array, so the leading ramp is
    // propagated through the whole array with period ALIGN_OFF.
    test_cp_alndst(a1, a1, b1, b1);
    errn += verifyCyclic("test_cp_alndst_overlap: a1", a1, "test_cp_alndst_overlap: b1", b1, 0, ARRLEN, ALIGN_OFF);
    fillRange(a1, (byte)-1, b1, -1.f, ALIGN_OFF, 2*ALIGN_OFF);
    test_cp_alnsrc(a1, a1, b1, b1);
    errn += verifyPair("test_cp_alnsrc_overlap: a1", a1, (byte)-1, "test_cp_alnsrc_overlap: b1", b1, -1.f, 0, ALIGN_OFF);
    errn += verifyCyclic("test_cp_alnsrc_overlap: a1", a1, "test_cp_alnsrc_overlap: b1", b1, ALIGN_OFF, ARRLEN, ALIGN_OFF);

    // Reset for unaligned overlap initialization
    initOverlap(a1, b1, UNALIGN_OFF);
    test_cp_unalndst(a1, a1, b1, b1);
    errn += verifyCyclic("test_cp_unalndst_overlap: a1", a1, "test_cp_unalndst_overlap: b1", b1, 0, ARRLEN, UNALIGN_OFF);
    fillRange(a1, (byte)-1, b1, -1.f, UNALIGN_OFF, 2*UNALIGN_OFF);
    test_cp_unalnsrc(a1, a1, b1, b1);
    errn += verifyPair("test_cp_unalnsrc_overlap: a1", a1, (byte)-1, "test_cp_unalnsrc_overlap: b1", b1, -1.f, 0, UNALIGN_OFF);
    errn += verifyCyclic("test_cp_unalnsrc_overlap: a1", a1, "test_cp_unalnsrc_overlap: b1", b1, UNALIGN_OFF, ARRLEN, UNALIGN_OFF);

    return errn;
  }

  /** Runs each kernel {@link #ITERS} times and prints the elapsed milliseconds per kernel. */
  private static void timeKernels(byte[] a1, byte[] a2, float[] b1, float[] b2) {
    long start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_ci(a1, b1);
    }
    printElapsed("test_ci", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_vi(a2, b2, (byte)123, 103.f);
    }
    printElapsed("test_vi", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_cp(a1, a2, b1, b2);
    }
    printElapsed("test_cp", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_ci_neg(a1, b1);
    }
    printElapsed("test_ci_neg", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_vi_neg(a1, b1, (byte)123, 103.f);
    }
    printElapsed("test_vi_neg", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_cp_neg(a1, a2, b1, b2);
    }
    printElapsed("test_cp_neg", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_ci_oppos(a1, b1);
    }
    printElapsed("test_ci_oppos", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_vi_oppos(a1, b1, (byte)123, 103.f);
    }
    printElapsed("test_vi_oppos", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_cp_oppos(a1, a2, b1, b2);
    }
    printElapsed("test_cp_oppos", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_ci_aln(a1, b1);
    }
    printElapsed("test_ci_aln", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_vi_aln(a1, b1, (byte)123, 103.f);
    }
    printElapsed("test_vi_aln", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_cp_alndst(a1, a2, b1, b2);
    }
    printElapsed("test_cp_alndst", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_cp_alnsrc(a1, a2, b1, b2);
    }
    printElapsed("test_cp_alnsrc", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_ci_unaln(a1, b1);
    }
    printElapsed("test_ci_unaln", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_vi_unaln(a1, b1, (byte)123, 103.f);
    }
    printElapsed("test_vi_unaln", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_cp_unalndst(a1, a2, b1, b2);
    }
    printElapsed("test_cp_unalndst", start);

    start = System.currentTimeMillis();
    for (int i = 0; i < ITERS; i++) {
      test_cp_unalnsrc(a1, a2, b1, b2);
    }
    printElapsed("test_cp_unalnsrc", start);
  }

  /** Prints {@code "<name>: <ms since start>"} on standard output. */
  private static void printElapsed(String name, long start) {
    long end = System.currentTimeMillis();
    System.out.println(name + ": " + (end - start));
  }

  /** Sets every element of {@code a} to {@code aVal} and of {@code b} to {@code bVal}. */
  private static void fill(byte[] a, byte aVal, float[] b, float bVal) {
    fillRange(a, aVal, b, bVal, 0, a.length);
  }

  /** Sets {@code a[i]} and {@code b[i]} for every {@code i} in {@code [from, to)}. */
  private static void fillRange(byte[] a, byte aVal, float[] b, float bVal, int from, int to) {
    for (int i = from; i < to; i++) {
      a[i] = aVal;
      b[i] = bVal;
    }
  }

  /**
   * Prepares both arrays for an overlapping-copy check: the first {@code off}
   * elements hold their own index, every later element holds -1.
   */
  private static void initOverlap(byte[] a, float[] b, int off) {
    for (int i = 0; i < off; i++) {
      a[i] = (byte)i;
      b[i] = (float)i;
    }
    fillRange(a, (byte)-1, b, -1.f, off, a.length);
  }

  /**
   * Checks {@code a[i] == aVal} and {@code b[i] == bVal} for every {@code i}
   * in {@code [from, to)}, byte element first, then float element, per index.
   *
   * @return the number of mismatches
   */
  private static int verifyPair(String aText, byte[] a, byte aVal,
                                String bText, float[] b, float bVal,
                                int from, int to) {
    int errn = 0;
    for (int i = from; i < to; i++) {
      errn += verify(aText, i, a[i], aVal);
      errn += verify(bText, i, b[i], bVal);
    }
    return errn;
  }

  /** Checks {@code a[i] == val} for every {@code i} in {@code [from, to)}. */
  private static int verifyRange(String text, byte[] a, byte val, int from, int to) {
    int errn = 0;
    for (int i = from; i < to; i++) {
      errn += verify(text, i, a[i], val);
    }
    return errn;
  }

  /** Checks {@code b[i] == val} for every {@code i} in {@code [from, to)}. */
  private static int verifyRange(String text, float[] b, float val, int from, int to) {
    int errn = 0;
    for (int i = from; i < to; i++) {
      errn += verify(text, i, b[i], val);
    }
    return errn;
  }

  /**
   * Checks that both arrays hold {@code i % period} at every index {@code i}
   * in {@code [from, to)}.
   */
  private static int verifyCyclic(String aText, byte[] a, String bText, float[] b,
                                  int from, int to, int period) {
    int errn = 0;
    for (int i = from; i < to; i++) {
      int v = i % period;
      errn += verify(aText, i, a[i], (byte)v);
      errn += verify(bText, i, b[i], (float)v);
    }
    return errn;
  }

  // ---- Kernels. Their loop shape is the subject of the test; keep as is. ----

  /** Stores the constants -123 / -103.f into every element, ascending index. */
  static void test_ci(byte[] a, float[] b) {
    for (int i = 0; i < a.length; i+=1) {
      a[i] = -123;
      b[i] = -103.f;
    }
  }

  /** Stores {@code c} / {@code d} into every element, ascending index. */
  static void test_vi(byte[] a, float[] b, byte c, float d) {
    for (int i = 0; i < a.length; i+=1) {
      a[i] = c;
      b[i] = d;
    }
  }

  /** Copies {@code b} into {@code a} and {@code d} into {@code c}, ascending index. */
  static void test_cp(byte[] a, byte[] b, float[] c, float[] d) {
    for (int i = 0; i < a.length; i+=1) {
      a[i] = b[i];
      c[i] = d[i];
    }
  }

  /** Same stores as {@link #test_ci}, descending index. */
  static void test_ci_neg(byte[] a, float[] b) {
    for (int i = a.length-1; i >= 0; i-=1) {
      a[i] = -123;
      b[i] = -103.f;
    }
  }

  /** Same stores as {@link #test_vi}, descending index. */
  static void test_vi_neg(byte[] a, float[] b, byte c, float d) {
    for (int i = a.length-1; i >= 0; i-=1) {
      a[i] = c;
      b[i] = d;
    }
  }

  /** Same copies as {@link #test_cp}, descending index. */
  static void test_cp_neg(byte[] a, byte[] b, float[] c, float[] d) {
    for (int i = a.length-1; i >= 0; i-=1) {
      a[i] = b[i];
      c[i] = d[i];
    }
  }

  /** Constant stores; {@code a} is written back-to-front while {@code b} is written front-to-back. */
  static void test_ci_oppos(byte[] a, float[] b) {
    int limit = a.length-1;
    for (int i = 0; i < a.length; i+=1) {
      a[limit-i] = -123;
      b[i] = -103.f;
    }
  }

  /** Variable stores; {@code a} is written back-to-front while {@code b} is written front-to-back. */
  static void test_vi_oppos(byte[] a, float[] b, byte c, float d) {
    int limit = a.length-1;
    for (int i = a.length-1; i >= 0; i-=1) {
      a[i] = c;
      b[limit-i] = d;
    }
  }

  /** Copies with source and destination of each pair indexed in opposite directions. */
  static void test_cp_oppos(byte[] a, byte[] b, float[] c, float[] d) {
    int limit = a.length-1;
    for (int i = 0; i < a.length; i+=1) {
      a[i] = b[limit-i];
      c[limit-i] = d[i];
    }
  }

  /** Constant stores; the byte store is shifted up by {@link #ALIGN_OFF}. */
  static void test_ci_aln(byte[] a, float[] b) {
    for (int i = 0; i < a.length-ALIGN_OFF; i+=1) {
      a[i+ALIGN_OFF] = -123;
      b[i] = -103.f;
    }
  }

  /** Variable stores; the float store is shifted up by {@link #ALIGN_OFF}. */
  static void test_vi_aln(byte[] a, float[] b, byte c, float d) {
    for (int i = 0; i < a.length-ALIGN_OFF; i+=1) {
      a[i] = c;
      b[i+ALIGN_OFF] = d;
    }
  }

  /** Copies with the destination index shifted up by {@link #ALIGN_OFF}. */
  static void test_cp_alndst(byte[] a, byte[] b, float[] c, float[] d) {
    for (int i = 0; i < a.length-ALIGN_OFF; i+=1) {
      a[i+ALIGN_OFF] = b[i];
      c[i+ALIGN_OFF] = d[i];
    }
  }

  /** Copies with the source index shifted up by {@link #ALIGN_OFF}. */
  static void test_cp_alnsrc(byte[] a, byte[] b, float[] c, float[] d) {
    for (int i = 0; i < a.length-ALIGN_OFF; i+=1) {
      a[i] = b[i+ALIGN_OFF];
      c[i] = d[i+ALIGN_OFF];
    }
  }

  /** Constant stores; the byte store is shifted up by {@link #UNALIGN_OFF}. */
  static void test_ci_unaln(byte[] a, float[] b) {
    for (int i = 0; i < a.length-UNALIGN_OFF; i+=1) {
      a[i+UNALIGN_OFF] = -123;
      b[i] = -103.f;
    }
  }

  /** Variable stores; the float store is shifted up by {@link #UNALIGN_OFF}. */
  static void test_vi_unaln(byte[] a, float[] b, byte c, float d) {
    for (int i = 0; i < a.length-UNALIGN_OFF; i+=1) {
      a[i] = c;
      b[i+UNALIGN_OFF] = d;
    }
  }

  /** Copies with the destination index shifted up by {@link #UNALIGN_OFF}. */
  static void test_cp_unalndst(byte[] a, byte[] b, float[] c, float[] d) {
    for (int i = 0; i < a.length-UNALIGN_OFF; i+=1) {
      a[i+UNALIGN_OFF] = b[i];
      c[i+UNALIGN_OFF] = d[i];
    }
  }

  /** Copies with the source index shifted up by {@link #UNALIGN_OFF}. */
  static void test_cp_unalnsrc(byte[] a, byte[] b, float[] c, float[] d) {
    for (int i = 0; i < a.length-UNALIGN_OFF; i+=1) {
      a[i] = b[i+UNALIGN_OFF];
      c[i] = d[i+UNALIGN_OFF];
    }
  }

  /**
   * Compares one byte element with its expected value.
   *
   * @param text label printed in front of the index when the values differ
   * @param i    index of the element, used only for the message
   * @param elem actual value
   * @param val  expected value
   * @return 1 if the values differ (a message is written to {@code System.err}), else 0
   */
  static int verify(String text, int i, byte elem, byte val) {
    if (elem != val) {
      System.err.println(text + "[" + i + "] = " + elem + " != " + val);
      return 1;
    }
    return 0;
  }

  /**
   * Compares one float element with its expected value using exact
   * ({@code !=}) comparison.
   *
   * @param text label printed in front of the index when the values differ
   * @param i    index of the element, used only for the message
   * @param elem actual value
   * @param val  expected value
   * @return 1 if the values differ (a message is written to {@code System.err}), else 0
   */
  static int verify(String text, int i, float elem, float val) {
    if (elem != val) {
      System.err.println(text + "[" + i + "] = " + elem + " != " + val);
      return 1;
    }
    return 0;
  }
}