/*

Copyright (c) 2009, 2010, 2011 STMicroelectronics
Written by Christophe Lyon

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.

*/
|  |  | 
|  | #ifdef __arm__ | 
|  | #include <arm_neon.h> | 
|  | #else | 
|  | #error Target not supported | 
|  | #endif | 
|  |  | 
|  | #include "stm-arm-neon-ref.h" | 
|  |  | 
/* Label printed in the reference output, and the intrinsic family
   exercised by this file.  */
#define TEST_MSG "VQSHRN_N"
#define INSN vqshrn_n

/* FNNAME(X) produces the function header `void exec_<X> (void)'.
   Going through FNNAME1 lets the preprocessor expand the argument
   first, so FNNAME(INSN) names exec_vqshrn_n rather than exec_INSN.  */
#define FNNAME(NAME) FNNAME1(NAME)
#define FNNAME1(NAME) void exec_ ## NAME (void)
|  |  | 
|  | FNNAME (INSN) | 
|  | { | 
|  | /* Basic test: y=vqshrn_n(x,v), then store the result.  */ | 
|  | #define TEST_VQSHRN_N2(INSN, T1, T2, W, W2, N, V)	\ | 
|  | Neon_Overflow = 0;					\ | 
|  | VECT_VAR(vector_res, T1, W2, N) =			\ | 
|  | INSN##_##T2##W(VECT_VAR(vector, T1, W, N),		\ | 
|  | V);					\ | 
|  | vst1_##T2##W2(VECT_VAR(result, T1, W2, N),		\ | 
|  | VECT_VAR(vector_res, T1, W2, N));	\ | 
|  | dump_neon_overflow(TEST_MSG, xSTR(INSN##_##T2##W)) | 
|  |  | 
|  | /* Two auxliary macros are necessary to expand INSN */ | 
|  | #define TEST_VQSHRN_N1(INSN, T1, T2, W, W2, N, V)	\ | 
|  | TEST_VQSHRN_N2(INSN, T1, T2, W, W2, N, V) | 
|  |  | 
|  | #define TEST_VQSHRN_N(T1, T2, W, W2, N, V)	\ | 
|  | TEST_VQSHRN_N1(INSN, T1, T2, W, W2, N, V) | 
|  |  | 
|  |  | 
|  | /* With ARM RVCT, we need to declare variables before any executable | 
|  | statement */ | 
|  |  | 
|  | /* vector is twice as large as vector_res */ | 
|  | DECL_VARIABLE(vector, int, 16, 8); | 
|  | DECL_VARIABLE(vector, int, 32, 4); | 
|  | DECL_VARIABLE(vector, int, 64, 2); | 
|  | DECL_VARIABLE(vector, uint, 16, 8); | 
|  | DECL_VARIABLE(vector, uint, 32, 4); | 
|  | DECL_VARIABLE(vector, uint, 64, 2); | 
|  |  | 
|  | DECL_VARIABLE(vector_res, int, 8, 8); | 
|  | DECL_VARIABLE(vector_res, int, 16, 4); | 
|  | DECL_VARIABLE(vector_res, int, 32, 2); | 
|  | DECL_VARIABLE(vector_res, uint, 8, 8); | 
|  | DECL_VARIABLE(vector_res, uint, 16, 4); | 
|  | DECL_VARIABLE(vector_res, uint, 32, 2); | 
|  |  | 
|  | clean_results (); | 
|  |  | 
|  | TEST_VLOAD(vector, buffer, q, int, s, 16, 8); | 
|  | TEST_VLOAD(vector, buffer, q, int, s, 32, 4); | 
|  | TEST_VLOAD(vector, buffer, q, int, s, 64, 2); | 
|  | TEST_VLOAD(vector, buffer, q, uint, u, 16, 8); | 
|  | TEST_VLOAD(vector, buffer, q, uint, u, 32, 4); | 
|  | TEST_VLOAD(vector, buffer, q, uint, u, 64, 2); | 
|  |  | 
|  | /* Choose shift amount arbitrarily  */ | 
|  | fprintf(ref_file, "\n%s overflow output:\n", TEST_MSG); | 
|  | TEST_VQSHRN_N(int, s, 16, 8, 8, 1); | 
|  | TEST_VQSHRN_N(int, s, 32, 16, 4, 1); | 
|  | TEST_VQSHRN_N(int, s, 64, 32, 2, 2); | 
|  | TEST_VQSHRN_N(uint, u, 16, 8, 8, 2); | 
|  | TEST_VQSHRN_N(uint, u, 32, 16, 4, 3); | 
|  | TEST_VQSHRN_N(uint, u, 64, 32, 2, 3); | 
|  |  | 
|  | /* FIXME: only a few result buffers are used, but we output all of them */ | 
|  | dump_results_hex (TEST_MSG); | 
|  |  | 
|  |  | 
|  | /* Another set of tests */ | 
|  | TEST_VDUP(vector, q, int, s, 16, 8, 0x7FFF); | 
|  | TEST_VDUP(vector, q, int, s, 32, 4, 0x7FFFFFFF); | 
|  | TEST_VDUP(vector, q, int, s, 64, 2, 0x7FFFFFFFFFFFFFFFLL); | 
|  | TEST_VDUP(vector, q, uint, u, 16, 8, 0xFFFF); | 
|  | TEST_VDUP(vector, q, uint, u, 32, 4, 0xFFFFFFFF); | 
|  | TEST_VDUP(vector, q, uint, u, 64, 2, 0xFFFFFFFFFFFFFFFFULL); | 
|  |  | 
|  | /* shift by 3 to exercise saturation code in the lib  */ | 
|  | fprintf(ref_file, "\n%s overflow output:\n", | 
|  | TEST_MSG " (check saturation: shift by 3)"); | 
|  | TEST_VQSHRN_N(int, s, 16, 8, 8, 3); | 
|  | TEST_VQSHRN_N(int, s, 32, 16, 4, 3); | 
|  | TEST_VQSHRN_N(int, s, 64, 32, 2, 3); | 
|  | TEST_VQSHRN_N(uint, u, 16, 8, 8, 3); | 
|  | TEST_VQSHRN_N(uint, u, 32, 16, 4, 3); | 
|  | TEST_VQSHRN_N(uint, u, 64, 32, 2, 3); | 
|  |  | 
|  | /* FIXME: only a few result buffers are used, but we output all of them */ | 
|  | dump_results_hex2 (TEST_MSG, " (check saturation: shift by 3)"); | 
|  |  | 
|  |  | 
|  | /* shift by max to exercise saturation code in the lib  */ | 
|  | fprintf(ref_file, "\n%s overflow output:\n", | 
|  | TEST_MSG " (check saturation: shift by max)"); | 
|  | TEST_VQSHRN_N(int, s, 16, 8, 8, 8); | 
|  | TEST_VQSHRN_N(int, s, 32, 16, 4, 16); | 
|  | TEST_VQSHRN_N(int, s, 64, 32, 2, 32); | 
|  | TEST_VQSHRN_N(uint, u, 16, 8, 8, 8); | 
|  | TEST_VQSHRN_N(uint, u, 32, 16, 4, 16); | 
|  | TEST_VQSHRN_N(uint, u, 64, 32, 2, 32); | 
|  |  | 
|  | /* FIXME: only a few result buffers are used, but we output all of them */ | 
|  | dump_results_hex2 (TEST_MSG, " (check saturation: shift by max)"); | 
|  | } |