godot/thirdparty/embree/kernels/geometry/subgrid.h
jfons 767e374dce Upgrade Embree to the latest official release.
Since Embree v3.13.0 supports AARCH64, switch back to the
official repo instead of using Embree-aarch64.

`thirdparty/embree/patches/godot-changes.patch` should now contain
an accurate diff of the changes done to the library.
2021-05-21 17:00:24 +02:00

518 lines
21 KiB
C++

// Copyright 2009-2021 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
#pragma once
#include "../common/ray.h"
#include "../common/scene_grid_mesh.h"
#include "../bvh/bvh.h"
namespace embree
{
/* References one 3x3 vertex block (2x2 quads) inside a grid primitive of a GridMesh.
   Only the block position and the geometry/primitive IDs are stored; vertex data is
   fetched from the mesh on demand by the gather functions. */
struct SubGrid
{
  /* Virtual interface to query information about the primitive type */
  struct Type : public PrimitiveType
  {
    const char* name() const;
    size_t sizeActive(const char* This) const;
    size_t sizeTotal(const char* This) const;
    size_t getBytes(const char* This) const;
  };
  static Type type;

public:

  /* primitive supports multiple time segments */
  static const bool singleTimeSegment = false;

  /* Returns maximum number of primitives stored per block */
  static __forceinline size_t max_size() { return 1; }

  /* Returns required number of primitive blocks for N primitives */
  static __forceinline size_t blocks(size_t N) { return (N+max_size()-1)/max_size(); }

public:

  /* Default constructor, leaves all members uninitialized */
  __forceinline SubGrid() { }

  /* Construction from block position and IDs.
     x and y are stored in 16 bits each: the low 15 bits hold the coordinate
     (see x()/y()), bit 15 is the "invalid 3x3" flag (see invalid3x3X()/invalid3x3Y()). */
  __forceinline SubGrid(const unsigned int x,
                        const unsigned int y,
                        const unsigned int geomID,
                        const unsigned int primID)
    : _x(x), _y(y), _geomID(geomID), _primID(primID)
  {
  }

  /* True if bit 15 of the stored x is set; the gather functions then reuse the second vertex column as the third */
  __forceinline bool invalid3x3X() const { return (unsigned int)_x & (1<<15); }

  /* True if bit 15 of the stored y is set; the gather functions then reuse the second vertex row as the third */
  __forceinline bool invalid3x3Y() const { return (unsigned int)_y & (1<<15); }

private:

  /* Vertex indices of the 3x3 block; vRC is the vertex in row R and column C */
  struct VertexIDs
  {
    size_t v00, v01, v02;
    size_t v10, v11, v12;
    size_t v20, v21, v22;
  };

  /* Computes the nine vertex indices this subgrid addresses inside grid g.
     Shared by all gather variants so that the addressing rule exists only once. */
  __forceinline VertexIDs vertexIDs(const GridMesh::Grid& g) const
  {
    /* a set invalid flag turns the step to the third column/row into 0, so the
       third column/row aliases the second one and no further vertex is addressed */
    const size_t deltaX = invalid3x3X() ? 0 : 1;
    const size_t deltaY = invalid3x3Y() ? 0 : g.lineVtxOffset;

    VertexIDs ids;

    /* first quad always valid */
    ids.v00 = g.startVtxID + x() + y() * g.lineVtxOffset;
    ids.v01 = ids.v00 + 1;
    ids.v10 = ids.v00 + g.lineVtxOffset;
    ids.v11 = ids.v01 + g.lineVtxOffset;

    /* deltaX => v02, v12 */
    ids.v02 = ids.v01 + deltaX;
    ids.v12 = ids.v11 + deltaX;

    /* deltaY => v20, v21 */
    ids.v20 = ids.v10 + deltaY;
    ids.v21 = ids.v11 + deltaY;

    /* deltaX/deltaY => v22 */
    ids.v22 = ids.v11 + deltaX + deltaY;
    return ids;
  }

public:

  /* Gathers the four quads of the block from an explicitly given mesh and grid.
     p0..p3 receive the four corners of the quads; the vertices passed to each
     transpose are, in order, that corner of the quads
     (v00,v01,v11,v10), (v01,v02,v12,v11), (v11,v12,v22,v21), (v10,v11,v21,v20). */
  __forceinline void gather(Vec3vf4& p0,
                            Vec3vf4& p1,
                            Vec3vf4& p2,
                            Vec3vf4& p3,
                            const GridMesh* const mesh,
                            const GridMesh::Grid &g) const
  {
    const VertexIDs id = vertexIDs(g);

    const vfloat4 vtx00 = vfloat4::loadu(mesh->vertexPtr(id.v00));
    const vfloat4 vtx01 = vfloat4::loadu(mesh->vertexPtr(id.v01));
    const vfloat4 vtx10 = vfloat4::loadu(mesh->vertexPtr(id.v10));
    const vfloat4 vtx11 = vfloat4::loadu(mesh->vertexPtr(id.v11));
    const vfloat4 vtx02 = vfloat4::loadu(mesh->vertexPtr(id.v02));
    const vfloat4 vtx12 = vfloat4::loadu(mesh->vertexPtr(id.v12));
    const vfloat4 vtx20 = vfloat4::loadu(mesh->vertexPtr(id.v20));
    const vfloat4 vtx21 = vfloat4::loadu(mesh->vertexPtr(id.v21));
    const vfloat4 vtx22 = vfloat4::loadu(mesh->vertexPtr(id.v22));

    transpose(vtx00,vtx01,vtx11,vtx10,p0.x,p0.y,p0.z);
    transpose(vtx01,vtx02,vtx12,vtx11,p1.x,p1.y,p1.z);
    transpose(vtx11,vtx12,vtx22,vtx21,p2.x,p2.y,p2.z);
    transpose(vtx10,vtx11,vtx21,vtx20,p3.x,p3.y,p3.z);
  }

  /* Loads the vertex at index offset for time steps itime and itime+1 as type T
     and returns their linear interpolation at ftime */
  template<typename T>
  __forceinline vfloat4 getVertexMB(const GridMesh* const mesh, const size_t offset, const size_t itime, const float ftime) const
  {
    const T v0 = T::loadu(mesh->vertexPtr(offset,itime+0));
    const T v1 = T::loadu(mesh->vertexPtr(offset,itime+1));
    return lerp(v0,v1,ftime);
  }

  /* Motion blur variant of gather for an explicitly given mesh and grid:
     every vertex is interpolated between time steps itime and itime+1 at ftime */
  __forceinline void gatherMB(Vec3vf4& p0,
                              Vec3vf4& p1,
                              Vec3vf4& p2,
                              Vec3vf4& p3,
                              const GridMesh* const mesh,
                              const GridMesh::Grid &g,
                              const size_t itime,
                              const float ftime) const
  {
    const VertexIDs id = vertexIDs(g);

    const vfloat4 vtx00 = getVertexMB<vfloat4>(mesh,id.v00,itime,ftime);
    const vfloat4 vtx01 = getVertexMB<vfloat4>(mesh,id.v01,itime,ftime);
    const vfloat4 vtx10 = getVertexMB<vfloat4>(mesh,id.v10,itime,ftime);
    const vfloat4 vtx11 = getVertexMB<vfloat4>(mesh,id.v11,itime,ftime);
    const vfloat4 vtx02 = getVertexMB<vfloat4>(mesh,id.v02,itime,ftime);
    const vfloat4 vtx12 = getVertexMB<vfloat4>(mesh,id.v12,itime,ftime);
    const vfloat4 vtx20 = getVertexMB<vfloat4>(mesh,id.v20,itime,ftime);
    const vfloat4 vtx21 = getVertexMB<vfloat4>(mesh,id.v21,itime,ftime);
    const vfloat4 vtx22 = getVertexMB<vfloat4>(mesh,id.v22,itime,ftime);

    transpose(vtx00,vtx01,vtx11,vtx10,p0.x,p0.y,p0.z);
    transpose(vtx01,vtx02,vtx12,vtx11,p1.x,p1.y,p1.z);
    transpose(vtx11,vtx12,vtx22,vtx21,p2.x,p2.y,p2.z);
    transpose(vtx10,vtx11,vtx21,vtx20,p3.x,p3.y,p3.z);
  }

  /* Gathers the quads, looking up mesh and grid in the scene via geomID()/primID() */
  __forceinline void gather(Vec3vf4& p0,
                            Vec3vf4& p1,
                            Vec3vf4& p2,
                            Vec3vf4& p3,
                            const Scene *const scene) const
  {
    const GridMesh* const mesh = scene->get<GridMesh>(geomID());
    const GridMesh::Grid &g    = mesh->grid(primID());
    gather(p0,p1,p2,p3,mesh,g);
  }

  /* Gathers the quads in the motion blur case, looking up mesh and grid in the scene */
  __forceinline void gatherMB(Vec3vf4& p0,
                              Vec3vf4& p1,
                              Vec3vf4& p2,
                              Vec3vf4& p3,
                              const Scene *const scene,
                              const size_t itime,
                              const float ftime) const
  {
    const GridMesh* const mesh = scene->get<GridMesh>(geomID());
    const GridMesh::Grid &g    = mesh->grid(primID());
    gatherMB(p0,p1,p2,p3,mesh,g,itime,ftime);
  }

  /* Gathers the quads as 16 individual vertices: vtx[4*q+0..3] are the corners of quad q.
     NOTE: quads 2 and 3 are written here as (v10,v11,v21,v20) then (v11,v12,v22,v21),
     i.e. swapped relative to the argument order used by the Vec3vf4 variants. */
  __forceinline void gather(Vec3fa vtx[16], const Scene *const scene) const
  {
    const GridMesh* mesh     = scene->get<GridMesh>(geomID());
    const GridMesh::Grid &g  = mesh->grid(primID());
    const VertexIDs id       = vertexIDs(g);

    const Vec3fa vtx00 = Vec3fa::loadu(mesh->vertexPtr(id.v00));
    const Vec3fa vtx01 = Vec3fa::loadu(mesh->vertexPtr(id.v01));
    const Vec3fa vtx10 = Vec3fa::loadu(mesh->vertexPtr(id.v10));
    const Vec3fa vtx11 = Vec3fa::loadu(mesh->vertexPtr(id.v11));
    const Vec3fa vtx02 = Vec3fa::loadu(mesh->vertexPtr(id.v02));
    const Vec3fa vtx12 = Vec3fa::loadu(mesh->vertexPtr(id.v12));
    const Vec3fa vtx20 = Vec3fa::loadu(mesh->vertexPtr(id.v20));
    const Vec3fa vtx21 = Vec3fa::loadu(mesh->vertexPtr(id.v21));
    const Vec3fa vtx22 = Vec3fa::loadu(mesh->vertexPtr(id.v22));

    vtx[ 0] = vtx00; vtx[ 1] = vtx01; vtx[ 2] = vtx11; vtx[ 3] = vtx10;
    vtx[ 4] = vtx01; vtx[ 5] = vtx02; vtx[ 6] = vtx12; vtx[ 7] = vtx11;
    vtx[ 8] = vtx10; vtx[ 9] = vtx11; vtx[10] = vtx21; vtx[11] = vtx20;
    vtx[12] = vtx11; vtx[13] = vtx12; vtx[14] = vtx22; vtx[15] = vtx21;
  }

  /* Motion blur variant of the 16-vertex gather; same output order, every vertex
     interpolated between time steps itime and itime+1 at ftime */
  __forceinline void gatherMB(vfloat4 vtx[16], const Scene *const scene, const size_t itime, const float ftime) const
  {
    const GridMesh* mesh     = scene->get<GridMesh>(geomID());
    const GridMesh::Grid &g  = mesh->grid(primID());
    const VertexIDs id       = vertexIDs(g);

    const vfloat4 vtx00 = getVertexMB<vfloat4>(mesh,id.v00,itime,ftime);
    const vfloat4 vtx01 = getVertexMB<vfloat4>(mesh,id.v01,itime,ftime);
    const vfloat4 vtx10 = getVertexMB<vfloat4>(mesh,id.v10,itime,ftime);
    const vfloat4 vtx11 = getVertexMB<vfloat4>(mesh,id.v11,itime,ftime);
    const vfloat4 vtx02 = getVertexMB<vfloat4>(mesh,id.v02,itime,ftime);
    const vfloat4 vtx12 = getVertexMB<vfloat4>(mesh,id.v12,itime,ftime);
    const vfloat4 vtx20 = getVertexMB<vfloat4>(mesh,id.v20,itime,ftime);
    const vfloat4 vtx21 = getVertexMB<vfloat4>(mesh,id.v21,itime,ftime);
    const vfloat4 vtx22 = getVertexMB<vfloat4>(mesh,id.v22,itime,ftime);

    vtx[ 0] = vtx00; vtx[ 1] = vtx01; vtx[ 2] = vtx11; vtx[ 3] = vtx10;
    vtx[ 4] = vtx01; vtx[ 5] = vtx02; vtx[ 6] = vtx12; vtx[ 7] = vtx11;
    vtx[ 8] = vtx10; vtx[ 9] = vtx11; vtx[10] = vtx21; vtx[11] = vtx20;
    vtx[12] = vtx11; vtx[13] = vtx12; vtx[14] = vtx22; vtx[15] = vtx21;
  }

  /* Calculate the bounds of the subgrid. Not implemented: reports via FATAL. */
  __forceinline const BBox3fa bounds(const Scene *const scene, const size_t itime=0) const
  {
    BBox3fa bounds = empty;
    FATAL("not implemented yet");
    return bounds;
  }

  /* Calculate the linear bounds of the primitive from bounds() at itime and itime+1
     (bounds() is not implemented, so this reports via FATAL as well) */
  __forceinline LBBox3fa linearBounds(const Scene* const scene, const size_t itime)
  {
    return LBBox3fa(bounds(scene,itime+0),bounds(scene,itime+1));
  }

  /* Linear bounds over numTimeSteps time steps. Not implemented: reports via FATAL. */
  __forceinline LBBox3fa linearBounds(const Scene *const scene, size_t itime, size_t numTimeSteps)
  {
    LBBox3fa allBounds = empty;
    FATAL("not implemented yet");
    return allBounds;
  }

  /* Linear bounds over a time range. Not implemented: reports via FATAL. */
  __forceinline LBBox3fa linearBounds(const Scene *const scene, const BBox1f time_range)
  {
    LBBox3fa allBounds = empty;
    FATAL("not implemented yet");
    return allBounds;
  }

  /* Debug output; every field is printed as "name = value" */
  friend embree_ostream operator<<(embree_ostream cout, const SubGrid& sg) {
    return cout << "SubGrid " << " ( x = " << sg.x() << ", y = " << sg.y() << ", geomID = " << sg.geomID() << ", primID = " << sg.primID() << " )";
  }

  /* Geometry ID of the mesh */
  __forceinline unsigned int geomID() const { return _geomID; }

  /* Primitive ID of the grid inside the mesh */
  __forceinline unsigned int primID() const { return _primID; }

  /* Block position with the flag bit (bit 15) masked off */
  __forceinline unsigned int x() const { return (unsigned int)_x & 0x7fff; }
  __forceinline unsigned int y() const { return (unsigned int)_y & 0x7fff; }

private:
  unsigned short _x;      // bits 0-14: x position, bit 15: invalid 3x3 flag in x
  unsigned short _y;      // bits 0-14: y position, bit 15: invalid 3x3 flag in y
  unsigned int _geomID;   // geometry ID of mesh
  unsigned int _primID;   // primitive ID of primitive inside mesh
};
/* Compact per-slot record: 16-bit block position plus the primitive ID of the grid */
struct SubGridID
{
  unsigned short x;
  unsigned short y;
  unsigned int primID;

  /* Default constructor, leaves all members uninitialized */
  __forceinline SubGridID() {}

  /* x and y are narrowed to 16 bits on storage; primID is stored unchanged */
  __forceinline SubGridID(const unsigned int x, const unsigned int y, const unsigned int primID)
    : x((unsigned short)x),
      y((unsigned short)y),
      primID(primID)
  {
  }
};
/* QuantizedBaseNode as large subgrid leaf: holds up to N subgrid references of one
   geometry plus a quantized node initialized from their bounds. Unused slots carry
   the primID marker (unsigned int)-1. */
template<int N>
struct SubGridQBVHN
{
  /* Virtual interface to query information about the primitive type */
  struct Type : public PrimitiveType
  {
    const char* name() const;
    size_t sizeActive(const char* This) const;
    size_t sizeTotal(const char* This) const;
    size_t getBytes(const char* This) const;
  };
  static Type type;

public:

  /* Returns the number of used slots: the index of the first slot whose primID is
     the unused marker, or N if there is none */
  __forceinline size_t size() const
  {
    for (size_t i=0;i<N;i++)
      if (primID(i) == (unsigned int)-1) return i;
    return N;
  }

  /* Marks every slot as unused and clears the quantized node */
  __forceinline void clear() {
    for (size_t i=0;i<N;i++)
      subgridIDs[i] = SubGridID(0,0,(unsigned int)-1);
    qnode.clear();
  }

  /* Default constructor, leaves all members uninitialized */
  __forceinline SubGridQBVHN() { }

  /* Construction from block positions, IDs and bounds.
     The first `items` entries of x, y, primID and subGridBounds are used;
     items must not exceed N. Remaining slots stay marked as unused. */
  __forceinline SubGridQBVHN(const unsigned int x[N],
                             const unsigned int y[N],
                             const unsigned int primID[N],
                             const BBox3fa * const subGridBounds,
                             const unsigned int geomID,
                             const unsigned int items)
  {
    /* more than N items would write past subgridIDs[] and the node bounds */
    assert(items <= (unsigned int)N);

    clear();
    _geomID = geomID;

    __aligned(64) typename BVHN<N>::AABBNode node;
    node.clear();
    for (size_t i=0;i<items;i++)
    {
      subgridIDs[i] = SubGridID(x[i],y[i],primID[i]);
      node.setBounds(i,subGridBounds[i]);
    }
    /* the quantized node is derived from the full-precision temporary node */
    qnode.init_dim(node);
  }

  /* Geometry ID shared by all slots */
  __forceinline unsigned int geomID() const { return _geomID; }

  /* Per-slot accessors, i must be smaller than N */
  __forceinline unsigned int primID(const size_t i) const { assert(i < N); return subgridIDs[i].primID; }
  __forceinline unsigned int x(const size_t i) const { assert(i < N); return subgridIDs[i].x; }
  __forceinline unsigned int y(const size_t i) const { assert(i < N); return subgridIDs[i].y; }

  /* Builds the SubGrid referenced by slot i; the slot must be in use */
  __forceinline SubGrid subgrid(const size_t i) const {
    assert(i < N);
    assert(primID(i) != (unsigned int)-1);
    return SubGrid(x(i),y(i),geomID(),primID(i));
  }

public:
  SubGridID subgridIDs[N];                      // per-slot block position and primitive ID

  typename BVHN<N>::QuantizedBaseNode qnode;    // quantized bounds of the slots

  unsigned int _geomID;    // geometry ID of mesh

  /* Debug output: all N slots (used or not), the geometry ID and the dequantized bounds */
  friend embree_ostream operator<<(embree_ostream cout, const SubGridQBVHN& sg) {
    cout << "SubGridQBVHN " << embree_endl;
    for (size_t i=0;i<N;i++)
      cout << i << " ( x = " << sg.subgridIDs[i].x << ", y = " << sg.subgridIDs[i].y << ", primID = " << sg.subgridIDs[i].primID << " )" << embree_endl;
    cout << "geomID " << sg._geomID << embree_endl;
    cout << "lowerX " << sg.qnode.dequantizeLowerX() << embree_endl;
    cout << "upperX " << sg.qnode.dequantizeUpperX() << embree_endl;
    cout << "lowerY " << sg.qnode.dequantizeLowerY() << embree_endl;
    cout << "upperY " << sg.qnode.dequantizeUpperY() << embree_endl;
    cout << "lowerZ " << sg.qnode.dequantizeLowerZ() << embree_endl;
    cout << "upperZ " << sg.qnode.dequantizeUpperZ() << embree_endl;
    return cout;
  }

};
/* Out-of-class definition of the static primitive type object of SubGridQBVHN<N> */
template<int N> typename SubGridQBVHN<N>::Type SubGridQBVHN<N>::type;

/* Short names for the N = 4 and N = 8 instantiations */
using SubGridQBVH4 = SubGridQBVHN<4>;
using SubGridQBVH8 = SubGridQBVHN<8>;
/* Motion blur variant of the large subgrid leaf: holds up to N subgrid references of
   one geometry, a quantized node pair (node0/node1) initialized from two sets of
   bounds, and the offset/scale used by adjustTime(). Unused slots carry the primID
   marker (unsigned int)-1. */
template<int N>
struct SubGridMBQBVHN
{
  /* Virtual interface to query information about the primitive type */
  struct Type : public PrimitiveType
  {
    const char* name() const;
    size_t sizeActive(const char* This) const;
    size_t sizeTotal(const char* This) const;
    size_t getBytes(const char* This) const;
  };
  static Type type;

public:

  /* Returns the number of used slots: the index of the first slot whose primID is
     the unused marker, or N if there is none */
  __forceinline size_t size() const
  {
    for (size_t i=0;i<N;i++)
      if (primID(i) == (unsigned int)-1) return i;
    return N;
  }

  /* Marks every slot as unused and clears the quantized node */
  __forceinline void clear() {
    for (size_t i=0;i<N;i++)
      subgridIDs[i] = SubGridID(0,0,(unsigned int)-1);
    qnode.clear();
  }

  /* Default constructor, leaves all members uninitialized */
  __forceinline SubGridMBQBVHN() { }

  /* Construction from block positions, IDs and two sets of bounds.
     The first `items` entries of x, y, primID, subGridBounds0 and subGridBounds1 are
     used; items must not exceed N. subGridBounds0 initializes qnode.node0 and
     subGridBounds1 initializes qnode.node1. toffset and tscale are stored for adjustTime(). */
  __forceinline SubGridMBQBVHN(const unsigned int x[N],
                               const unsigned int y[N],
                               const unsigned int primID[N],
                               const BBox3fa * const subGridBounds0,
                               const BBox3fa * const subGridBounds1,
                               const unsigned int geomID,
                               const float toffset,
                               const float tscale,
                               const unsigned int items)
  {
    /* more than N items would write past subgridIDs[] and the node bounds */
    assert(items <= (unsigned int)N);

    clear();
    _geomID = geomID;
    time_offset = toffset;
    time_scale  = tscale;

    __aligned(64) typename BVHN<N>::AABBNode node0,node1;
    node0.clear();
    node1.clear();
    for (size_t i=0;i<items;i++)
    {
      subgridIDs[i] = SubGridID(x[i],y[i],primID[i]);
      node0.setBounds(i,subGridBounds0[i]);
      node1.setBounds(i,subGridBounds1[i]);
    }
    /* both quantized nodes are derived from the full-precision temporary nodes */
    qnode.node0.init_dim(node0);
    qnode.node1.init_dim(node1);
  }

  /* Geometry ID shared by all slots */
  __forceinline unsigned int geomID() const { return _geomID; }

  /* Per-slot accessors, i must be smaller than N */
  __forceinline unsigned int primID(const size_t i) const { assert(i < N); return subgridIDs[i].primID; }
  __forceinline unsigned int x(const size_t i) const { assert(i < N); return subgridIDs[i].x; }
  __forceinline unsigned int y(const size_t i) const { assert(i < N); return subgridIDs[i].y; }

  /* Builds the SubGrid referenced by slot i; the slot must be in use */
  __forceinline SubGrid subgrid(const size_t i) const {
    assert(i < N);
    assert(primID(i) != (unsigned int)-1);
    return SubGrid(x(i),y(i),geomID(),primID(i));
  }

  /* Maps a time t to time_scale * (t - time_offset) */
  __forceinline float adjustTime(const float t) const { return time_scale * (t-time_offset); }

  /* Same mapping applied to a K-wide vector of times */
  template<int K>
  __forceinline vfloat<K> adjustTime(const vfloat<K> &t) const { return time_scale * (t-time_offset); }

public:
  SubGridID subgridIDs[N];                        // per-slot block position and primitive ID

  typename BVHN<N>::QuantizedBaseNodeMB qnode;    // quantized bounds, node0 and node1

  float time_offset;       // subtracted from t in adjustTime()
  float time_scale;        // multiplied onto (t - time_offset) in adjustTime()
  unsigned int _geomID;    // geometry ID of mesh

  /* Debug output: all N slots (used or not), geometry ID, time mapping and the
     dequantized bounds of node0 followed by those of node1 */
  friend embree_ostream operator<<(embree_ostream cout, const SubGridMBQBVHN& sg) {
    cout << "SubGridMBQBVHN " << embree_endl;
    for (size_t i=0;i<N;i++)
      cout << i << " ( x = " << sg.subgridIDs[i].x << ", y = " << sg.subgridIDs[i].y << ", primID = " << sg.subgridIDs[i].primID << " )" << embree_endl;
    cout << "geomID      " << sg._geomID << embree_endl;
    cout << "time_offset " << sg.time_offset << embree_endl;
    cout << "time_scale  " << sg.time_scale << embree_endl;
    cout << "lowerX " << sg.qnode.node0.dequantizeLowerX() << embree_endl;
    cout << "upperX " << sg.qnode.node0.dequantizeUpperX() << embree_endl;
    cout << "lowerY " << sg.qnode.node0.dequantizeLowerY() << embree_endl;
    cout << "upperY " << sg.qnode.node0.dequantizeUpperY() << embree_endl;
    cout << "lowerZ " << sg.qnode.node0.dequantizeLowerZ() << embree_endl;
    cout << "upperZ " << sg.qnode.node0.dequantizeUpperZ() << embree_endl;
    cout << "lowerX " << sg.qnode.node1.dequantizeLowerX() << embree_endl;
    cout << "upperX " << sg.qnode.node1.dequantizeUpperX() << embree_endl;
    cout << "lowerY " << sg.qnode.node1.dequantizeLowerY() << embree_endl;
    cout << "upperY " << sg.qnode.node1.dequantizeUpperY() << embree_endl;
    cout << "lowerZ " << sg.qnode.node1.dequantizeLowerZ() << embree_endl;
    cout << "upperZ " << sg.qnode.node1.dequantizeUpperZ() << embree_endl;
    return cout;
  }

};
}