forked from jratcliff63367/sse2neon
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathSSE2NEONTEST.h
159 lines (150 loc) · 9.79 KB
/
SSE2NEONTEST.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
#ifndef SSE2NEONTEST_H
#define SSE2NEONTEST_H
// SSE2NEONTEST performs a set of 'unit tests' making sure that each SSE call
// provides the output we expect. If this fires an assert, then something didn't match up.
namespace SSE2NEON
{
// Currently 39 SSE intrinsics have unit tests fully implemented and verified.
// There are an additional 56 intrinsics which do not yet have a unit
// test implementation and, therefore, should not be considered fully
// verified at this time. These will be implemented as soon as possible.
// Note: The way unit tests are implemented is that 10,000 random floating point
// and integer vec4 numbers are generated as sample data.
//
// A short C implementation of every intrinsic is implemented and compared to the
// actual expected results from the corresponding SSE intrinsic against all of the
// 10,000 randomized input vectors.
// When running on ARM, then the results are compared to the NEON approximate version.
enum InstructionTest
{
IT_MM_SETZERO_SI128, // Unit test implemented and verified as fully working
IT_MM_SETZERO_PS, // Unit test implemented and verified as fully working
IT_MM_SET1_PS, // Unit test implemented and verified as fully working
IT_MM_SET_PS1, // Unit test implemented and verified as fully working
IT_MM_SET_PS, // Unit test implemented and verified as fully working
IT_MM_SET1_EPI32, // Unit test implemented and verified as fully working
IT_MM_SET_EPI32, // Unit test implemented and verified as fully working
IT_MM_STORE_PS, // Unit test implemented and verified as fully working
IT_MM_SHUFFLE_PS, // Unit test implemented and verified as fully working
IT_MM_LOAD1_PS, // Unit test implemented and verified as fully working
IT_MM_ANDNOT_PS, // Unit test implemented and verified as fully working
IT_MM_ANDNOT_SI128, // Unit test implemented and verified as fully working
IT_MM_AND_SI128, // Unit test implemented and verified as fully working
IT_MM_AND_PS, // Unit test implemented and verified as fully working
IT_MM_OR_PS, // Unit test implemented and verified as fully working
IT_MM_OR_SI128, // Unit test implemented and verified as fully working
IT_MM_MOVEMASK_PS, // Unit test implemented and verified as fully working
IT_MM_MOVEMASK_EPI8, // Unit test implemented and verified as fully working
IT_MM_SUB_PS, // Unit test implemented and verified as fully working
IT_MM_SUB_EPI32, // Unit test implemented and verified as fully working
IT_MM_ADD_PS, // Unit test implemented and verified as fully working
IT_MM_ADD_EPI32, // Unit test implemented and verified as fully working
IT_MM_MULLO_EPI16, // Unit test implemented and verified as fully working
IT_MM_MUL_PS, // Unit test implemented and verified as fully working
IT_MM_RCP_PS, // Unit test implemented and verified as fully working
IT_MM_MAX_PS, // Unit test implemented and verified as fully working
IT_MM_MIN_PS, // Unit test implemented and verified as fully working
IT_MM_MIN_EPI16, // Unit test implemented and verified as fully working
IT_MM_MULHI_EPI16, // Unit test implemented and verified as fully working
IT_MM_CMPLT_PS, // Unit test implemented and verified as fully working
IT_MM_CMPGT_PS, // Unit test implemented and verified as fully working
IT_MM_CMPGE_PS, // Unit test implemented and verified as fully working
IT_MM_CMPLE_PS, // Unit test implemented and verified as fully working
IT_MM_CMPEQ_PS, // Unit test implemented and verified as fully working
IT_MM_CMPLT_EPI32, // Unit test implemented and verified as fully working
IT_MM_CMPGT_EPI32, // Unit test implemented and verified as fully working
IT_MM_CVTTPS_EPI32, // Unit test implemented and verified as fully working
IT_MM_CVTEPI32_PS, // Unit test implemented and verified as fully working
IT_MM_CVTPS_EPI32, // Unit test implemented and verified as fully working
IT_MM_CVTSS_F32, // Unit test *not yet implemented*
IT_MM_SETR_PS, // Unit test *not yet implemented*
IT_MM_STOREU_PS, // Unit test *not yet implemented*
IT_MM_STORE_SI128, // Unit test *not yet implemented*
IT_MM_STORE_SS, // Unit test *not yet implemented*
IT_MM_STOREL_EPI64, // Unit test *not yet implemented*
IT_MM_LOAD_PS, // Unit test *not yet implemented*
IT_MM_LOADU_PS, // Unit test *not yet implemented*
IT_MM_LOAD_SS, // Unit test *not yet implemented*
IT_MM_CMPNEQ_PS, // Unit test *not yet implemented*
IT_MM_XOR_PS, // Unit test *not yet implemented*
IT_MM_XOR_SI128, // Unit test *not yet implemented*
IT_MM_SHUFFLE_EPI32_DEFAULT, // Unit test *not yet implemented*
IT_MM_SHUFFLE_EPI32_FUNCTION, // Unit test *not yet implemented*
IT_MM_SHUFFLE_EPI32_SPLAT, // Unit test *not yet implemented*
IT_MM_SHUFFLE_EPI32_SINGLE, // Unit test *not yet implemented*
IT_MM_SHUFFLEHI_EPI16_FUNCTION, // Unit test *not yet implemented*
IT_MM_ADD_SS, // Unit test *not yet implemented*
IT_MM_ADD_EPI16, // Unit test *not yet implemented*
IT_MM_MULLO_EPI32, // Unit test *not yet implemented*
IT_MM_DIV_PS, // Unit test *not yet implemented*
IT_MM_DIV_SS, // Unit test *not yet implemented*
IT_MM_SQRT_PS, // Unit test *not yet implemented*
IT_MM_SQRT_SS, // Unit test *not yet implemented*
IT_MM_RSQRT_PS, // Unit test *not yet implemented*
IT_MM_MAX_SS, // Unit test *not yet implemented*
IT_MM_MIN_SS, // Unit test *not yet implemented*
IT_MM_MAX_EPI32, // Unit test *not yet implemented*
IT_MM_MIN_EPI32, // Unit test *not yet implemented*
IT_MM_HADD_PS, // Unit test *not yet implemented*
IT_MM_CMPORD_PS, // Unit test *not yet implemented*
IT_MM_COMILT_SS, // Unit test *not yet implemented*
IT_MM_COMIGT_SS, // Unit test *not yet implemented*
IT_MM_COMILE_SS, // Unit test *not yet implemented*
IT_MM_COMIGE_SS, // Unit test *not yet implemented*
IT_MM_COMIEQ_SS, // Unit test *not yet implemented*
IT_MM_COMINEQ_SS, // Unit test *not yet implemented*
IT_MM_CVTSI128_SI32, // Unit test *not yet implemented*
IT_MM_CVTSI32_SI128, // Unit test *not yet implemented*
IT_MM_CASTPS_SI128, // Unit test *not yet implemented*
IT_MM_CASTSI128_PS, // Unit test *not yet implemented*
IT_MM_LOAD_SI128, // Unit test *not yet implemented*
IT_MM_PACKS_EPI16, // Unit test *not yet implemented*
IT_MM_PACKUS_EPI16, // Unit test *not yet implemented*
IT_MM_PACKS_EPI32, // Unit test *not yet implemented*
IT_MM_UNPACKLO_EPI8, // Unit test *not yet implemented*
IT_MM_UNPACKLO_EPI16, // Unit test *not yet implemented*
IT_MM_UNPACKLO_EPI32, // Unit test *not yet implemented*
IT_MM_UNPACKLO_PS, // Unit test *not yet implemented*
IT_MM_UNPACKHI_PS, // Unit test *not yet implemented*
IT_MM_UNPACKHI_EPI8, // Unit test *not yet implemented*
IT_MM_UNPACKHI_EPI16, // Unit test *not yet implemented*
IT_MM_UNPACKHI_EPI32, // Unit test *not yet implemented*
IT_MM_SFENCE, // Unit test *not yet implemented*
IT_MM_STREAM_SI128, // Unit test *not yet implemented*
IT_MM_CLFLUSH, // Unit test *not yet implemented*
//added by hasindu
IT_MM_SET1_EPI16,
IT_MM_SET_EPI16,
IT_MM_SLLI_EPI16,
IT_MM_SRLI_EPI16,
IT_MM_CMPEQ_EPI16,
IT_MM_SET1_EPI8,
IT_MM_ADDS_EPU8,
IT_MM_SUBS_EPU8,
IT_MM_MAX_EPU8,
IT_MM_CMPEQ_EPI8,
IT_MM_ADDS_EPI16,
IT_MM_MAX_EPI16,
IT_MM_SUBS_EPU16,
IT_MM_CMPGT_EPI16,
IT_MM_LOADU_SI128,
IT_MM_STOREU_SI128,
IT_MM_ADD_EPI8,
IT_MM_CMPGT_EPI8,
IT_MM_CMPLT_EPI8,
IT_MM_SUB_EPI8,
IT_MM_SETR_EPI32,
IT_MM_MIN_EPU8,
IT_LAST
};
class SSE2NEONTest
{
public:
static SSE2NEONTest* create(void); // create the test.
static const char *getInstructionTestString(InstructionTest test);
// Run test of this instruction; return true if it passed, false if it failed
virtual bool runTest(InstructionTest test) = 0;
virtual void release(void) = 0;
};
}
#endif