forked from pytorch/QNNPACK
-
Notifications
You must be signed in to change notification settings - Fork 0
/
u8rmax.cc
88 lines (76 loc) · 1.95 KB
/
u8rmax.cc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
/*
* Copyright (c) Facebook, Inc. and its affiliates.
* All rights reserved.
*
* This source code is licensed under the BSD-style license found in the
* LICENSE file in the root directory of this source tree.
*/
#include <gtest/gtest.h>
#include <cpuinfo.h>
#include <qnnpack/isa-checks.h>
#include <qnnpack/u8rmax.h>
#include "rmax-microkernel-tester.h"
#if CPUINFO_ARCH_ARM || CPUINFO_ARCH_ARM64
TEST(U8RMAX__NEON, n_lt_16) {
TEST_REQUIRES_ARM_NEON;
for (size_t n = 1; n < 16; n++) {
RMaxMicrokernelTester()
.n(n)
.test(u8rmax_ukernel__neon);
}
}
TEST(U8RMAX__NEON, n_eq_16) {
TEST_REQUIRES_ARM_NEON;
RMaxMicrokernelTester()
.n(16)
.test(u8rmax_ukernel__neon);
}
TEST(U8RMAX__NEON, n_div_16) {
TEST_REQUIRES_ARM_NEON;
for (size_t n = 16; n < 128; n += 16) {
RMaxMicrokernelTester()
.n(n)
.test(u8rmax_ukernel__neon);
}
}
TEST(U8RMAX__NEON, n_gt_16) {
TEST_REQUIRES_ARM_NEON;
for (size_t n = 16; n < 32; n++) {
RMaxMicrokernelTester()
.n(n)
.test(u8rmax_ukernel__neon);
}
}
#endif /* CPUINFO_ARCH_ARM || CPUINFO_ARCH_ARM64 */
#if CPUINFO_ARCH_X86 || CPUINFO_ARCH_X86_64
TEST(U8RMAX__SSE2, n_lt_16) {
TEST_REQUIRES_X86_SSE2;
for (size_t n = 1; n < 16; n++) {
RMaxMicrokernelTester()
.n(n)
.test(u8rmax_ukernel__sse2);
}
}
TEST(U8RMAX__SSE2, n_eq_16) {
TEST_REQUIRES_X86_SSE2;
RMaxMicrokernelTester()
.n(16)
.test(u8rmax_ukernel__sse2);
}
TEST(U8RMAX__SSE2, n_div_16) {
TEST_REQUIRES_X86_SSE2;
for (size_t n = 16; n < 128; n += 16) {
RMaxMicrokernelTester()
.n(n)
.test(u8rmax_ukernel__sse2);
}
}
TEST(U8RMAX__SSE2, n_gt_16) {
TEST_REQUIRES_X86_SSE2;
for (size_t n = 17; n < 32; n++) {
RMaxMicrokernelTester()
.n(n)
.test(u8rmax_ukernel__sse2);
}
}
#endif /* CPUINFO_ARCH_X86 || CPUINFO_ARCH_X86_64 */