/*

Copyright (c) 2009, 2010, 2011, 2012 STMicroelectronics
Written by Christophe Lyon

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.

*/

Christophe Lyon1775be02014-07-10 13:46:54 +020026#if defined(__arm__) || defined(__aarch64__)
Christophe Lyon073831a2011-01-24 17:37:40 +010027#include <arm_neon.h>
28#else
Christophe Lyon0dab5f72011-07-19 17:14:09 +020029#include "stm-arm-neon.h"
Christophe Lyon073831a2011-01-24 17:37:40 +010030#endif
31
32#include "stm-arm-neon-ref.h"
33
/* Instruction under test.  It is pasted into the name of the test entry
   point below and into the intrinsic names built by TEST_VQDMULH_LANE.  */
#define INSN vqdmulh

/* Label written to the reference output for this test.  */
#define TEST_MSG "VQDMULH_LANE"

/* Two-level definition so that the argument (INSN) is macro-expanded
   before it is token-pasted: FNNAME (INSN) produces
     void exec_vqdmulh_lane (void)  */
#define FNNAME1(NAME) void exec_ ## NAME ## _lane (void)
#define FNNAME(NAME) FNNAME1(NAME)

39FNNAME (INSN)
40{
41 /* vector_res = vqdmulh_lane(vector,vector2,lane), then store the result. */
Christophe Lyon4a6e5cc2014-06-03 22:47:52 +020042#define TEST_VQDMULH_LANE2(INSN, Q, T1, T2, W, N, N2, L) \
Christophe Lyonc1cc7822015-01-20 16:04:24 +010043 Set_Neon_Cumulative_Sat(0, VECT_VAR(vector_res, T1, W, N)); \
Christophe Lyon4a6e5cc2014-06-03 22:47:52 +020044 VECT_VAR(vector_res, T1, W, N) = \
45 INSN##Q##_lane_##T2##W(VECT_VAR(vector, T1, W, N), \
46 VECT_VAR(vector2, T1, W, N2), \
47 L); \
48 vst1##Q##_##T2##W(VECT_VAR(result, T1, W, N), \
49 VECT_VAR(vector_res, T1, W, N)); \
50 dump_neon_cumulative_sat(TEST_MSG, xSTR(INSN##Q##_lane_##T2##W), \
51 xSTR(T1), W, N)
Christophe Lyon073831a2011-01-24 17:37:40 +010052
53 /* Two auxliary macros are necessary to expand INSN */
54#define TEST_VQDMULH_LANE1(INSN, Q, T1, T2, W, N, N2, L) \
55 TEST_VQDMULH_LANE2(INSN, Q, T1, T2, W, N, N2, L)
56
57#define TEST_VQDMULH_LANE(Q, T1, T2, W, N, N2, L) \
58 TEST_VQDMULH_LANE1(INSN, Q, T1, T2, W, N, N2, L)
59
60 /* With ARM RVCT, we need to declare variables before any executable
61 statement */
62 DECL_VARIABLE(vector, int, 16, 4);
63 DECL_VARIABLE(vector, int, 32, 2);
64 DECL_VARIABLE(vector, int, 16, 8);
65 DECL_VARIABLE(vector, int, 32, 4);
66
67 DECL_VARIABLE(vector_res, int, 16, 4);
68 DECL_VARIABLE(vector_res, int, 32, 2);
69 DECL_VARIABLE(vector_res, int, 16, 8);
70 DECL_VARIABLE(vector_res, int, 32, 4);
71
72 /* vector2: vqdmulh_lane and vqdmulhq_lane have a 2nd argument with
73 the same number of elements, so we need only one variable of each
74 type. */
75 DECL_VARIABLE(vector2, int, 16, 4);
76 DECL_VARIABLE(vector2, int, 32, 2);
77
78 clean_results ();
79
Christophe Lyonf2053672014-12-16 10:26:00 +010080 VLOAD(vector, buffer, , int, s, 16, 4);
81 VLOAD(vector, buffer, , int, s, 32, 2);
Christophe Lyon073831a2011-01-24 17:37:40 +010082
Christophe Lyonf2053672014-12-16 10:26:00 +010083 VLOAD(vector, buffer, q, int, s, 16, 8);
84 VLOAD(vector, buffer, q, int, s, 32, 4);
Christophe Lyon073831a2011-01-24 17:37:40 +010085
86 /* Initialize vector2 */
Christophe Lyonf2053672014-12-16 10:26:00 +010087 VDUP(vector2, , int, s, 16, 4, 0x55);
88 VDUP(vector2, , int, s, 32, 2, 0xBB);
Christophe Lyon073831a2011-01-24 17:37:40 +010089
90 /* Choose lane arbitrarily */
Christophe Lyon4a6e5cc2014-06-03 22:47:52 +020091 fprintf(ref_file, "\n%s cumulative saturation output:\n", TEST_MSG);
Christophe Lyon073831a2011-01-24 17:37:40 +010092 TEST_VQDMULH_LANE(, int, s, 16, 4, 4, 2);
93 TEST_VQDMULH_LANE(, int, s, 32, 2, 2, 1);
94 TEST_VQDMULH_LANE(q, int, s, 16, 8, 4, 3);
95 TEST_VQDMULH_LANE(q, int, s, 32, 4, 2, 0);
96
97 /* FIXME: only a subset of the result buffers are used, but we
98 output all of them */
99 dump_results_hex (TEST_MSG);
100
101
Christophe Lyonf2053672014-12-16 10:26:00 +0100102 VDUP(vector, , int, s, 16, 4, 0x8000);
103 VDUP(vector, , int, s, 32, 2, 0x80000000);
104 VDUP(vector, q, int, s, 16, 8, 0x8000);
105 VDUP(vector, q, int, s, 32, 4, 0x80000000);
106 VDUP(vector2, , int, s, 16, 4, 0x8000);
107 VDUP(vector2, , int, s, 32, 2, 0x80000000);
Christophe Lyon073831a2011-01-24 17:37:40 +0100108
Christophe Lyon4a6e5cc2014-06-03 22:47:52 +0200109 fprintf(ref_file, "\n%s cumulative saturation output:\n",
110 TEST_MSG " (check mul cumulative saturation)");
Christophe Lyon073831a2011-01-24 17:37:40 +0100111 TEST_VQDMULH_LANE(, int, s, 16, 4, 4, 3);
112 TEST_VQDMULH_LANE(, int, s, 32, 2, 2, 1);
113 TEST_VQDMULH_LANE(q, int, s, 16, 8, 4, 2);
114 TEST_VQDMULH_LANE(q, int, s, 32, 4, 2, 1);
Christophe Lyon4a6e5cc2014-06-03 22:47:52 +0200115 dump_results_hex2 (TEST_MSG, " (check mul cumulative saturation)");
Christophe Lyon073831a2011-01-24 17:37:40 +0100116}