-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcmp.cpp
72 lines (60 loc) · 1.82 KB
/
cmp.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
#include <benchmark/benchmark.h>
#include <xmmintrin.h>
// Four-component single-precision vector.
//
// The members are declared in x, y, z, w order with nothing in between;
// cmp_simd() loads four consecutive floats starting at &x, so the
// declaration order must not be changed.
struct Vec4 {
  // Zero vector.
  Vec4() : x(0.0f), y(0.0f), z(0.0f), w(0.0f) {}

  // Component-wise construction; also enables `Vec4 v = {a, b, c, d};`.
  Vec4(float x_in, float y_in, float z_in, float w_in)
      : x(x_in), y(y_in), z(z_in), w(w_in) {}

  float x;
  float y;
  float z;
  float w;
};
// Scalar (one component at a time) exact equality test for two Vec4 values.
//
// Returns true only when all four components compare equal with `==`.
// Components are checked in x, y, z, w order and the function returns as
// soon as a mismatch is found.
bool cmp_sisd(Vec4 a, Vec4 b) {
  if (a.x != b.x) return false;
  if (a.y != b.y) return false;
  if (a.z != b.z) return false;
  return a.w == b.w;
}
// SSE exact equality test for two Vec4 values.
//
// Loads the four floats of each argument into an XMM register, compares all
// lanes at once, and returns true only when every lane compared equal.
bool cmp_simd(Vec4 a, Vec4 b) {
  // Vec4 contains only floats, so it is only guaranteed float alignment.
  // _mm_load_ps requires a 16-byte-aligned address and may fault otherwise,
  // so the unaligned load is used here.
  const __m128 xmm_a = _mm_loadu_ps(&a.x);
  const __m128 xmm_b = _mm_loadu_ps(&b.x);

  // Each lane becomes all-ones where the components are equal, else zero.
  const __m128 eq = _mm_cmpeq_ps(xmm_a, xmm_b);

  // movemask packs the four lane sign bits into bits 0..3 of the result;
  // all four set means every component matched.
  return _mm_movemask_ps(eq) == 0xF;
}
// Benchmarks cmp_sisd() on two vectors whose components are all equal.
static void cmp_sisd_eq_bench(benchmark::State& state) {
  for (auto _ : state) {
    Vec4 lhs{1.0f, 1.0f, 1.0f, 1.0f};
    Vec4 rhs{1.0f, 1.0f, 1.0f, 1.0f};
    // Hide the inputs from the optimizer so the comparison is not folded
    // away at compile time.
    benchmark::DoNotOptimize(lhs);
    benchmark::DoNotOptimize(rhs);

    bool equal = cmp_sisd(lhs, rhs);
    // Keep the result alive so the call is not eliminated as dead code.
    benchmark::DoNotOptimize(equal);
  }
}
BENCHMARK(cmp_sisd_eq_bench);
// Benchmarks cmp_simd() on two vectors whose components are all equal.
static void cmp_simd_eq_bench(benchmark::State& state) {
  for (auto _ : state) {
    Vec4 lhs{1.0f, 1.0f, 1.0f, 1.0f};
    Vec4 rhs{1.0f, 1.0f, 1.0f, 1.0f};
    // Hide the inputs from the optimizer so the comparison is not folded
    // away at compile time.
    benchmark::DoNotOptimize(lhs);
    benchmark::DoNotOptimize(rhs);

    bool equal = cmp_simd(lhs, rhs);
    // Keep the result alive so the call is not eliminated as dead code.
    benchmark::DoNotOptimize(equal);
  }
}
BENCHMARK(cmp_simd_eq_bench);
// Benchmarks cmp_sisd() on two vectors that differ in the y component, so
// the scalar comparison can stop after the second component.
static void cmp_sisd_neq_bench(benchmark::State& state) {
  for (auto _ : state) {
    Vec4 a = {1.0f, 5.0f, 1.0f, 1.0f};
    Vec4 b = {1.0f, 1.0f, 1.0f, 1.0f};
    // Hide the inputs from the optimizer so the comparison is not folded
    // away at compile time.
    benchmark::DoNotOptimize(a);
    benchmark::DoNotOptimize(b);
    bool res = cmp_sisd(a, b);
    // Keep the result alive so the call is not eliminated as dead code.
    benchmark::DoNotOptimize(res);
  }
}
// Register the not-equal benchmark itself (the eq variant was previously
// registered here a second time, leaving this function unused).
BENCHMARK(cmp_sisd_neq_bench);
// Benchmarks cmp_simd() on two vectors that differ in the y component.
static void cmp_simd_neq_bench(benchmark::State& state) {
  for (auto _ : state) {
    Vec4 a = {1.0f, 5.0f, 1.0f, 1.0f};
    Vec4 b = {1.0f, 1.0f, 1.0f, 1.0f};
    // Hide the inputs from the optimizer so the comparison is not folded
    // away at compile time.
    benchmark::DoNotOptimize(a);
    benchmark::DoNotOptimize(b);
    bool res = cmp_simd(a, b);
    // Keep the result alive so the call is not eliminated as dead code.
    benchmark::DoNotOptimize(res);
  }
}
// Register the not-equal benchmark itself (the eq variant was previously
// registered here a second time, leaving this function unused).
BENCHMARK(cmp_simd_neq_bench);