godot/thirdparty/embree/kernels/geometry/pointi.h
jfons 767e374dce Upgrade Embree to the latest official release.
Since Embree v3.13.0 supports AARCH64, switch back to the
official repo instead of using Embree-aarch64.

`thirdparty/embree/patches/godot-changes.patch` should now contain
an accurate diff of the changes done to the library.
2021-05-21 17:00:24 +02:00

413 lines
16 KiB
C++

// Copyright 2009-2021 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
#pragma once
#include "primitive.h"
namespace embree
{
/*
 * Block of up to M point primitives, stored by index.
 *
 * The block keeps one geometry ID shared by all lanes plus one primitive ID
 * per lane; vertex data is looked up through the Points geometry on demand
 * (see the gather/gatheri members). Only the first numPrimitives lanes are
 * valid; fill() pads the remaining lanes with a copy of the preceding lane.
 */
template<int M>
struct PointMi
{
  /* Virtual interface to query information about the point primitive type */
  struct Type : public PrimitiveType
  {
    const char* name() const;
    size_t sizeActive(const char* This) const;
    size_t sizeTotal(const char* This) const;
    size_t getBytes(const char* This) const;
  };
  static Type type;

 public:
  /* primitive supports multiple time segments */
  static const bool singleTimeSegment = false;

  /* Returns maximum number of points stored in one block */
  static __forceinline size_t max_size()
  {
    return M;
  }

  /* Returns required number of primitive blocks for N points (rounded up) */
  static __forceinline size_t blocks(size_t N)
  {
    return (N + max_size() - 1) / max_size();
  }

  /* Returns required number of bytes for N points */
  static __forceinline size_t bytes(size_t N)
  {
    return blocks(N) * sizeof(PointMi);
  }

 public:
  /* Default constructor, leaves all members uninitialized */
  __forceinline PointMi() {}

  /* Construction from geometry IDs, primitive IDs, geometry type and the
   * number of valid lanes. Every lane of geomIDs has to carry the same ID
   * (only lane 0 is stored), and numPrimitives must not exceed M. */
  __forceinline PointMi(const vuint<M>& geomIDs, const vuint<M>& primIDs, Geometry::GType gtype, uint32_t numPrimitives)
    : gtype((unsigned char)gtype),
      numPrimitives((unsigned char)numPrimitives),
      sharedGeomID(geomIDs[0]),
      primIDs(primIDs)
  {
    /* the count is stored in a single byte and indexes at most M lanes */
    assert(numPrimitives <= (uint32_t)M);
    assert(all(vuint<M>(geomID()) == geomIDs));
  }

  /* Returns a mask that tells which points are valid */
  __forceinline vbool<M> valid() const {
    return vint<M>(step) < vint<M>(numPrimitives);
  }

  /* Returns if the specified point is valid */
  __forceinline bool valid(const size_t i) const
  {
    assert(i < M);
    return i < numPrimitives;
  }

  /* Returns the number of stored points */
  __forceinline size_t size() const {
    return numPrimitives;
  }

  /* Returns the geometry ID; the lane index is ignored because all lanes
   * share one geometry */
  __forceinline unsigned int geomID(unsigned int i = 0) const {
    return sharedGeomID;
  }

  /* Access to the primitive IDs of all lanes */
  __forceinline vuint<M>& primID() {
    return primIDs;
  }

  __forceinline const vuint<M>& primID() const {
    return primIDs;
  }

  /* Returns the primitive ID stored in lane i */
  __forceinline unsigned int primID(const size_t i) const {
    assert(i < M);
    return primIDs[i];
  }

  /* gather the points (specialized per block width outside the class) */
  __forceinline void gather(Vec4vf<M>& p0, const Points* geom) const;
  __forceinline void gather(Vec4vf<M>& p0, Vec3vf<M>& n0, const Points* geom) const;
  __forceinline void gatheri(Vec4vf<M>& p0, const Points* geom, const int itime) const;
  __forceinline void gatheri(Vec4vf<M>& p0, Vec3vf<M>& n0, const Points* geom, const int itime) const;
  __forceinline void gather(Vec4vf<M>& p0, const Points* geom, float time) const;
  __forceinline void gather(Vec4vf<M>& p0, Vec3vf<M>& n0, const Points* geom, float time) const;

  /* Calculate the bounds of the valid points at time step itime */
  __forceinline const BBox3fa bounds(const Scene* scene, size_t itime = 0) const
  {
    BBox3fa bounds = empty;
    for (size_t i = 0; i < M && valid(i); i++) {
      const Points* geom = scene->get<Points>(geomID((unsigned int)i));
      bounds.extend(geom->bounds(primID(i), itime));
    }
    return bounds;
  }

  /* Calculate the linear bounds of the primitive between time steps
   * itime and itime + 1 */
  __forceinline LBBox3fa linearBounds(const Scene* scene, size_t itime) const {
    return LBBox3fa(bounds(scene, itime + 0), bounds(scene, itime + 1));
  }

  /* Linear bounds merged over all valid points, forwarding itime and
   * numTimeSteps to the geometry */
  __forceinline LBBox3fa linearBounds(const Scene* const scene, size_t itime, size_t numTimeSteps) const
  {
    LBBox3fa allBounds = empty;
    for (size_t i = 0; i < M && valid(i); i++) {
      const Points* geom = scene->get<Points>(geomID((unsigned int)i));
      allBounds.extend(geom->linearBounds(primID(i), itime, numTimeSteps));
    }
    return allBounds;
  }

  /* Linear bounds merged over all valid points for the given time range */
  __forceinline LBBox3fa linearBounds(const Scene* const scene, const BBox1f time_range) const
  {
    LBBox3fa allBounds = empty;
    for (size_t i = 0; i < M && valid(i); i++) {
      const Points* geom = scene->get<Points>(geomID((unsigned int)i));
      allBounds.extend(geom->linearBounds(primID(i), time_range));
    }
    return allBounds;
  }

  /* Fill this block from the primitive reference list.
   * Consumes up to M references starting at prims[begin] and advances begin
   * past them. Requires begin < end on entry. Lanes for which no reference
   * is left replicate the IDs of the preceding lane. */
  template<typename PrimRefT>
  __forceinline void fill(const PrimRefT* prims, size_t& begin, size_t end, Scene* scene)
  {
    assert(begin < end);
    Geometry::GType gty = scene->get(prims[begin].geomID())->getType();
    vuint<M> gids, pids;
    uint32_t count = 0;
    for (size_t i = 0; i < M; i++) {
      if (begin < end) {
        const PrimRefT& prim = prims[begin];
        gids[i] = prim.geomID();
        pids[i] = prim.primID();
        begin++;
        count++;
      } else {
        assert(i);
        if (i > 0) {
          /* pad the unused lane with the previous lane's IDs */
          gids[i] = gids[i - 1];
          pids[i] = pids[i - 1];
        }
      }
    }
    new (this) PointMi(gids, pids, gty, count);  // FIXME: use non temporal store
  }

  /* Allocate and fill the blocks needed for the primitive range `set`
   * and return the leaf reference produced by bvh->encodeLeaf */
  template<typename BVH, typename Allocator>
  __forceinline static typename BVH::NodeRef createLeaf(BVH* bvh,
                                                        const PrimRef* prims,
                                                        const range<size_t>& set,
                                                        const Allocator& alloc)
  {
    size_t start = set.begin();
    size_t items = PointMi::blocks(set.size());
    size_t numbytes = PointMi::bytes(set.size());
    PointMi* accel = (PointMi*)alloc.malloc1(numbytes, M * sizeof(float));
    for (size_t i = 0; i < items; i++) {
      accel[i].fill(prims, start, set.end(), bvh->scene);
    }
    return bvh->encodeLeaf((char*)accel, items);
  }

  /* Fill the block and return its linear bounds for time step itime */
  __forceinline LBBox3fa fillMB(const PrimRef* prims, size_t& begin, size_t end, Scene* scene, size_t itime)
  {
    fill(prims, begin, end, scene);
    return linearBounds(scene, itime);
  }

  /* Fill the block and return its linear bounds over time_range */
  __forceinline LBBox3fa fillMB(
      const PrimRefMB* prims, size_t& begin, size_t end, Scene* scene, const BBox1f time_range)
  {
    fill(prims, begin, end, scene);
    return linearBounds(scene, time_range);
  }

  /* Motion-blur variant of createLeaf: fills all blocks for the object
   * range of `prims` and returns a node record carrying the merged linear
   * bounds and the time range */
  template<typename BVH, typename SetMB, typename Allocator>
  __forceinline static typename BVH::NodeRecordMB4D createLeafMB(BVH* bvh, const SetMB& prims, const Allocator& alloc)
  {
    size_t start = prims.object_range.begin();
    size_t end = prims.object_range.end();
    size_t items = PointMi::blocks(prims.object_range.size());
    size_t numbytes = PointMi::bytes(prims.object_range.size());
    PointMi* accel = (PointMi*)alloc.malloc1(numbytes, M * sizeof(float));
    const typename BVH::NodeRef node = bvh->encodeLeaf((char*)accel, items);
    LBBox3fa bounds = empty;
    for (size_t i = 0; i < items; i++)
      bounds.extend(accel[i].fillMB(prims.prims->data(), start, end, bvh->scene, prims.time_range));
    return typename BVH::NodeRecordMB4D(node, bounds, prims.time_range);
  }

  /*! output operator; prints the shared geometry ID and the primitive IDs
   *  (the block stores no vertex data of its own) */
  friend __forceinline embree_ostream operator<<(embree_ostream cout, const PointMi& point)
  {
    return cout << "Point" << M << "i {" << point.geomID() << ", " << point.primID() << "}";
  }

 public:
  unsigned char gtype;          // geometry type, narrowed to one byte
  unsigned char numPrimitives;  // number of valid lanes
  unsigned int sharedGeomID;    // geometry ID shared by all lanes

 private:
  vuint<M> primIDs;  // primitive ID
};
/* 4-wide gather: load the vertex of every lane and transpose into p0 */
template<>
__forceinline void PointMi<4>::gather(Vec4vf4& p0, const Points* geom) const
{
  /* one unaligned 4-float load per stored primitive ID */
  const vfloat4 row0 = vfloat4::loadu(geom->vertexPtr(primID(0)));
  const vfloat4 row1 = vfloat4::loadu(geom->vertexPtr(primID(1)));
  const vfloat4 row2 = vfloat4::loadu(geom->vertexPtr(primID(2)));
  const vfloat4 row3 = vfloat4::loadu(geom->vertexPtr(primID(3)));

  /* per-point rows -> per-component lanes */
  transpose(row0, row1, row2, row3, p0.x, p0.y, p0.z, p0.w);
}
/* 4-wide gather of vertices and normals */
template<>
__forceinline void PointMi<4>::gather(Vec4vf4& p0, Vec3vf4& n0, const Points* geom) const
{
  /* vertices: one 4-float load per lane, then transpose into p0 */
  const vfloat4 vtx0 = vfloat4::loadu(geom->vertexPtr(primID(0)));
  const vfloat4 vtx1 = vfloat4::loadu(geom->vertexPtr(primID(1)));
  const vfloat4 vtx2 = vfloat4::loadu(geom->vertexPtr(primID(2)));
  const vfloat4 vtx3 = vfloat4::loadu(geom->vertexPtr(primID(3)));
  transpose(vtx0, vtx1, vtx2, vtx3, p0.x, p0.y, p0.z, p0.w);

  /* normals: fetched through geom->normal, only x/y/z are written to n0 */
  const vfloat4 nrm0 = vfloat4(geom->normal(primID(0)));
  const vfloat4 nrm1 = vfloat4(geom->normal(primID(1)));
  const vfloat4 nrm2 = vfloat4(geom->normal(primID(2)));
  const vfloat4 nrm3 = vfloat4(geom->normal(primID(3)));
  transpose(nrm0, nrm1, nrm2, nrm3, n0.x, n0.y, n0.z);
}
/* 4-wide gather of the vertices stored for time step itime */
template<>
__forceinline void PointMi<4>::gatheri(Vec4vf4& p0, const Points* geom, const int itime) const
{
  /* one unaligned 4-float load per stored primitive ID at the given time step */
  const vfloat4 row0 = vfloat4::loadu(geom->vertexPtr(primID(0), itime));
  const vfloat4 row1 = vfloat4::loadu(geom->vertexPtr(primID(1), itime));
  const vfloat4 row2 = vfloat4::loadu(geom->vertexPtr(primID(2), itime));
  const vfloat4 row3 = vfloat4::loadu(geom->vertexPtr(primID(3), itime));

  /* per-point rows -> per-component lanes */
  transpose(row0, row1, row2, row3, p0.x, p0.y, p0.z, p0.w);
}
/* 4-wide gather of vertices and normals stored for time step itime */
template<>
__forceinline void PointMi<4>::gatheri(Vec4vf4& p0, Vec3vf4& n0, const Points* geom, const int itime) const
{
  /* vertices at the given time step, transposed into p0 */
  const vfloat4 vtx0 = vfloat4::loadu(geom->vertexPtr(primID(0), itime));
  const vfloat4 vtx1 = vfloat4::loadu(geom->vertexPtr(primID(1), itime));
  const vfloat4 vtx2 = vfloat4::loadu(geom->vertexPtr(primID(2), itime));
  const vfloat4 vtx3 = vfloat4::loadu(geom->vertexPtr(primID(3), itime));
  transpose(vtx0, vtx1, vtx2, vtx3, p0.x, p0.y, p0.z, p0.w);

  /* normals at the given time step, only x/y/z are written to n0 */
  const vfloat4 nrm0 = vfloat4(geom->normal(primID(0), itime));
  const vfloat4 nrm1 = vfloat4(geom->normal(primID(1), itime));
  const vfloat4 nrm2 = vfloat4(geom->normal(primID(2), itime));
  const vfloat4 nrm3 = vfloat4(geom->normal(primID(3), itime));
  transpose(nrm0, nrm1, nrm2, nrm3, n0.x, n0.y, n0.z);
}
/* 4-wide gather at an arbitrary time: blends two adjacent time steps */
template<>
__forceinline void PointMi<4>::gather(Vec4vf4& p0, const Points* geom, float time) const
{
  /* timeSegment yields the segment index and fills in the blend weight */
  float weight;
  const int segment = geom->timeSegment(time, weight);

  /* vertices at both ends of the segment */
  Vec4vf4 lower;
  gatheri(lower, geom, segment);
  Vec4vf4 upper;
  gatheri(upper, geom, segment + 1);

  p0 = lerp(lower, upper, vfloat4(weight));
}
/* 4-wide gather of vertices and normals at an arbitrary time:
 * blends the data of two adjacent time steps */
template<>
__forceinline void PointMi<4>::gather(Vec4vf4& p0, Vec3vf4& n0, const Points* geom, float time) const
{
  /* timeSegment yields the segment index and fills in the blend weight */
  float weight;
  const int segment = geom->timeSegment(time, weight);

  /* vertices and normals at both ends of the segment */
  Vec4vf4 posLower, posUpper;
  Vec3vf4 nrmLower, nrmUpper;
  gatheri(posLower, nrmLower, geom, segment);
  gatheri(posUpper, nrmUpper, geom, segment + 1);

  const vfloat4 t(weight);
  p0 = lerp(posLower, posUpper, t);
  n0 = lerp(nrmLower, nrmUpper, t);
}
#if defined(__AVX__)
/* 8-wide gather: load the vertex of every lane and transpose into p0 */
template<>
__forceinline void PointMi<8>::gather(Vec4vf8& p0, const Points* geom) const
{
  /* one unaligned 4-float load per stored primitive ID */
  const vfloat4 row0 = vfloat4::loadu(geom->vertexPtr(primID(0)));
  const vfloat4 row1 = vfloat4::loadu(geom->vertexPtr(primID(1)));
  const vfloat4 row2 = vfloat4::loadu(geom->vertexPtr(primID(2)));
  const vfloat4 row3 = vfloat4::loadu(geom->vertexPtr(primID(3)));
  const vfloat4 row4 = vfloat4::loadu(geom->vertexPtr(primID(4)));
  const vfloat4 row5 = vfloat4::loadu(geom->vertexPtr(primID(5)));
  const vfloat4 row6 = vfloat4::loadu(geom->vertexPtr(primID(6)));
  const vfloat4 row7 = vfloat4::loadu(geom->vertexPtr(primID(7)));

  /* eight per-point rows -> four 8-wide component lanes */
  transpose(row0, row1, row2, row3, row4, row5, row6, row7, p0.x, p0.y, p0.z, p0.w);
}
/* 8-wide gather of vertices and normals */
template<>
__forceinline void PointMi<8>::gather(Vec4vf8& p0, Vec3vf8& n0, const Points* geom) const
{
  /* vertices: one 4-float load per lane, then transpose into p0 */
  const vfloat4 vtx0 = vfloat4::loadu(geom->vertexPtr(primID(0)));
  const vfloat4 vtx1 = vfloat4::loadu(geom->vertexPtr(primID(1)));
  const vfloat4 vtx2 = vfloat4::loadu(geom->vertexPtr(primID(2)));
  const vfloat4 vtx3 = vfloat4::loadu(geom->vertexPtr(primID(3)));
  const vfloat4 vtx4 = vfloat4::loadu(geom->vertexPtr(primID(4)));
  const vfloat4 vtx5 = vfloat4::loadu(geom->vertexPtr(primID(5)));
  const vfloat4 vtx6 = vfloat4::loadu(geom->vertexPtr(primID(6)));
  const vfloat4 vtx7 = vfloat4::loadu(geom->vertexPtr(primID(7)));
  transpose(vtx0, vtx1, vtx2, vtx3, vtx4, vtx5, vtx6, vtx7, p0.x, p0.y, p0.z, p0.w);

  /* normals: fetched through geom->normal, only x/y/z are written to n0 */
  const vfloat4 nrm0 = vfloat4(geom->normal(primID(0)));
  const vfloat4 nrm1 = vfloat4(geom->normal(primID(1)));
  const vfloat4 nrm2 = vfloat4(geom->normal(primID(2)));
  const vfloat4 nrm3 = vfloat4(geom->normal(primID(3)));
  const vfloat4 nrm4 = vfloat4(geom->normal(primID(4)));
  const vfloat4 nrm5 = vfloat4(geom->normal(primID(5)));
  const vfloat4 nrm6 = vfloat4(geom->normal(primID(6)));
  const vfloat4 nrm7 = vfloat4(geom->normal(primID(7)));
  transpose(nrm0, nrm1, nrm2, nrm3, nrm4, nrm5, nrm6, nrm7, n0.x, n0.y, n0.z);
}
/* 8-wide gather of the vertices stored for time step itime */
template<>
__forceinline void PointMi<8>::gatheri(Vec4vf8& p0, const Points* geom, const int itime) const
{
  /* one unaligned 4-float load per stored primitive ID at the given time step */
  const vfloat4 row0 = vfloat4::loadu(geom->vertexPtr(primID(0), itime));
  const vfloat4 row1 = vfloat4::loadu(geom->vertexPtr(primID(1), itime));
  const vfloat4 row2 = vfloat4::loadu(geom->vertexPtr(primID(2), itime));
  const vfloat4 row3 = vfloat4::loadu(geom->vertexPtr(primID(3), itime));
  const vfloat4 row4 = vfloat4::loadu(geom->vertexPtr(primID(4), itime));
  const vfloat4 row5 = vfloat4::loadu(geom->vertexPtr(primID(5), itime));
  const vfloat4 row6 = vfloat4::loadu(geom->vertexPtr(primID(6), itime));
  const vfloat4 row7 = vfloat4::loadu(geom->vertexPtr(primID(7), itime));

  /* eight per-point rows -> four 8-wide component lanes */
  transpose(row0, row1, row2, row3, row4, row5, row6, row7, p0.x, p0.y, p0.z, p0.w);
}
/* 8-wide gather of vertices and normals stored for time step itime */
template<>
__forceinline void PointMi<8>::gatheri(Vec4vf8& p0, Vec3vf8& n0, const Points* geom, const int itime) const
{
  /* vertices at the given time step, transposed into p0 */
  const vfloat4 vtx0 = vfloat4::loadu(geom->vertexPtr(primID(0), itime));
  const vfloat4 vtx1 = vfloat4::loadu(geom->vertexPtr(primID(1), itime));
  const vfloat4 vtx2 = vfloat4::loadu(geom->vertexPtr(primID(2), itime));
  const vfloat4 vtx3 = vfloat4::loadu(geom->vertexPtr(primID(3), itime));
  const vfloat4 vtx4 = vfloat4::loadu(geom->vertexPtr(primID(4), itime));
  const vfloat4 vtx5 = vfloat4::loadu(geom->vertexPtr(primID(5), itime));
  const vfloat4 vtx6 = vfloat4::loadu(geom->vertexPtr(primID(6), itime));
  const vfloat4 vtx7 = vfloat4::loadu(geom->vertexPtr(primID(7), itime));
  transpose(vtx0, vtx1, vtx2, vtx3, vtx4, vtx5, vtx6, vtx7, p0.x, p0.y, p0.z, p0.w);

  /* normals at the given time step, only x/y/z are written to n0 */
  const vfloat4 nrm0 = vfloat4(geom->normal(primID(0), itime));
  const vfloat4 nrm1 = vfloat4(geom->normal(primID(1), itime));
  const vfloat4 nrm2 = vfloat4(geom->normal(primID(2), itime));
  const vfloat4 nrm3 = vfloat4(geom->normal(primID(3), itime));
  const vfloat4 nrm4 = vfloat4(geom->normal(primID(4), itime));
  const vfloat4 nrm5 = vfloat4(geom->normal(primID(5), itime));
  const vfloat4 nrm6 = vfloat4(geom->normal(primID(6), itime));
  const vfloat4 nrm7 = vfloat4(geom->normal(primID(7), itime));
  transpose(nrm0, nrm1, nrm2, nrm3, nrm4, nrm5, nrm6, nrm7, n0.x, n0.y, n0.z);
}
/* 8-wide gather at an arbitrary time: blends two adjacent time steps */
template<>
__forceinline void PointMi<8>::gather(Vec4vf8& p0, const Points* geom, float time) const
{
  /* timeSegment yields the segment index and fills in the blend weight */
  float weight;
  const int segment = geom->timeSegment(time, weight);

  /* vertices at both ends of the segment */
  Vec4vf8 lower;
  gatheri(lower, geom, segment);
  Vec4vf8 upper;
  gatheri(upper, geom, segment + 1);

  p0 = lerp(lower, upper, vfloat8(weight));
}
/* 8-wide gather of vertices and normals at an arbitrary time:
 * blends the data of two adjacent time steps */
template<>
__forceinline void PointMi<8>::gather(Vec4vf8& p0, Vec3vf8& n0, const Points* geom, float time) const
{
  /* timeSegment yields the segment index and fills in the blend weight */
  float weight;
  const int segment = geom->timeSegment(time, weight);

  /* vertices and normals at both ends of the segment */
  Vec4vf8 posLower, posUpper;
  Vec3vf8 nrmLower, nrmUpper;
  gatheri(posLower, nrmLower, geom, segment);
  gatheri(posUpper, nrmUpper, geom, segment + 1);

  const vfloat8 t(weight);
  p0 = lerp(posLower, posUpper, t);
  n0 = lerp(nrmLower, nrmUpper, t);
}
#endif
/* Out-of-class definition of the static type descriptor, one per block width */
template<int M>
typename PointMi<M>::Type PointMi<M>::type;

/* Short names for the 4-wide and 8-wide point blocks */
using Point4i = PointMi<4>;
using Point8i = PointMi<8>;
} // namespace embree