forked from GameTechDev/OcclusionCulling
-
Notifications
You must be signed in to change notification settings - Fork 1
/
HelperSSE.h
84 lines (72 loc) · 2.05 KB
/
HelperSSE.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
////////////////////////////////////////////////////////////////////////////////
// Copyright 2017 Intel Corporation
//
// Licensed under the Apache License, Version 2.0 (the "License"); you may not
// use this file except in compliance with the License. You may obtain a copy
// of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
// WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
// License for the specific language governing permissions and limitations
// under the License.
////////////////////////////////////////////////////////////////////////////////
#include "immintrin.h"
#include <intrin.h>
#ifndef HELPERSSE_H
#define HELPERSSE_H
// Find the index of the least-significant set bit in *mask and clear that bit.
//
// mask   - in/out: bit set to scan; on return its lowest set bit has been cleared.
// return - zero-based index (0..31) of the bit that was cleared, or -1 when *mask
//          was already zero (in which case *mask is left unchanged).
//
// The zero check exists because neither _BitScanForward nor __builtin_ctz
// produces a defined index for an input of 0; without it the function would
// return an indeterminate value.
static int FindClearLSB(unsigned int *mask)
{
    const unsigned int bits = *mask;
    if (bits == 0)
    {
        return -1;
    }

#if defined(_MSC_VER)
    unsigned long idx;
    _BitScanForward(&idx, bits);
#else
    // Compilers that do not define _MSC_VER: use the GCC/Clang builtin instead.
    const int idx = __builtin_ctz(bits);
#endif

    // x & (x - 1) clears exactly the lowest set bit of x.
    *mask = bits & (bits - 1);
    return (int)idx;
}
// Base class collecting small SSE building blocks. Everything except the
// constructor and destructor is protected, so the helpers are reachable only
// from derived types. The constructor, destructor, TransformCoords and
// MatrixMultiply are declared here and defined outside this header.
class HelperSSE
{
public:
    HelperSSE();
    ~HelperSSE();

protected:
    // Four packed-float registers addressed as X, Y, Z and W.
    // NOTE(review): presumably a structure-of-arrays bundle (one component of
    // four items per register) - confirm against the code that fills it.
    struct vFloat4
    {
        __m128 X, Y, Z, W;
    };

    // Integer counterpart of vFloat4: four packed-integer registers X, Y, Z, W.
    // NOTE(review): the name suggests fixed-point values - confirm with users.
    struct vFxPt4
    {
        __m128i X, Y, Z, W;
    };

    // Declared only. NOTE(review): presumably transforms the vector at v by
    // the matrix at m and returns the result - confirm in the definition.
    __m128 TransformCoords(const __m128 *v, __m128 *m);

    // Declared only. NOTE(review): presumably writes the product of m1 and m2
    // to result - confirm operand order and aliasing rules in the definition.
    void MatrixMultiply(const __m128 *m1, const __m128 *m2, __m128 *result);

    // Lane-wise minimum of v0 and v1, each treated as four signed 32-bit
    // integers (_mm_min_epi32).
    __forceinline __m128i Min(const __m128i &v0, const __m128i &v1)
    {
        return _mm_min_epi32(v0, v1);
    }

    // Lane-wise maximum of v0 and v1, each treated as four signed 32-bit
    // integers (_mm_max_epi32).
    __forceinline __m128i Max(const __m128i &v0, const __m128i &v1)
    {
        return _mm_max_epi32(v0, v1);
    }
};
// Forward declarations: this header uses CPUTCamera only through a pointer and
// float4x4 only through a reference, so their full definitions are not needed here.
class CPUTCamera;
struct float4x4;
// Setup data for the SSE box test; derives from HelperSSE to reach its
// protected helpers. Init is declared here and defined outside this header.
struct BoxTestSetupSSE : public HelperSSE
{
// Four SSE registers holding a 4x4 float matrix.
// NOTE(review): by its name, presumably the combined view * projection * viewport
// transform - confirm composition order and row/column layout in Init.
__m128 mViewProjViewport[4];
// Camera pointer. NOTE(review): presumably not owned by this struct - confirm.
CPUTCamera *mpCamera;
// NOTE(review): presumably set from Init's sizeThreshold - confirm meaning and units.
float radiusThreshold;
// Initialises the setup from view, projection and viewport matrices, a camera and a
// size threshold. The [4] on the array parameters documents the expected element
// count; the compiler does not enforce it because array parameters decay to pointers.
// NOTE(review): `viewportMatix` looks like a typo for `viewportMatrix`.
void Init(const __m128 viewMatrix[4], const __m128 projMatrix[4], const float4x4 &viewportMatix, CPUTCamera *pCamera, float sizeThreshold);
};
#endif