scene_grid_mesh.h 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468
  1. // Copyright 2009-2021 Intel Corporation
  2. // SPDX-License-Identifier: Apache-2.0
  3. #pragma once
  4. #include "geometry.h"
  5. #include "buffer.h"
  6. namespace embree
  7. {
  8. /*! Grid Mesh */
  9. struct GridMesh : public Geometry
  10. {
  11. /*! type of this geometry */
  12. static const Geometry::GTypeMask geom_type = Geometry::MTY_GRID_MESH;
  13. /*! grid */
  14. struct Grid
  15. {
  16. unsigned int startVtxID;
  17. unsigned int lineVtxOffset;
  18. unsigned short resX,resY;
  19. /* border flags due to 3x3 vertex pattern */
  20. __forceinline unsigned int get3x3FlagsX(const unsigned int x) const
  21. {
  22. return (x + 2 >= (unsigned int)resX) ? (1<<15) : 0;
  23. }
  24. /* border flags due to 3x3 vertex pattern */
  25. __forceinline unsigned int get3x3FlagsY(const unsigned int y) const
  26. {
  27. return (y + 2 >= (unsigned int)resY) ? (1<<15) : 0;
  28. }
  29. /*! outputs grid structure */
  30. __forceinline friend embree_ostream operator<<(embree_ostream cout, const Grid& t) {
  31. return cout << "Grid { startVtxID " << t.startVtxID << ", lineVtxOffset " << t.lineVtxOffset << ", resX " << t.resX << ", resY " << t.resY << " }";
  32. }
  33. };
  34. public:
  35. /*! grid mesh construction */
  36. GridMesh (Device* device);
  37. /* geometry interface */
  38. public:
  39. void setMask(unsigned mask);
  40. void setNumTimeSteps (unsigned int numTimeSteps);
  41. void setVertexAttributeCount (unsigned int N);
  42. void setBuffer(RTCBufferType type, unsigned int slot, RTCFormat format, const Ref<Buffer>& buffer, size_t offset, size_t stride, unsigned int num);
  43. void* getBuffer(RTCBufferType type, unsigned int slot);
  44. void updateBuffer(RTCBufferType type, unsigned int slot);
  45. void commit();
  46. bool verify();
  47. void interpolate(const RTCInterpolateArguments* const args);
  48. template<int N>
  49. void interpolate_impl(const RTCInterpolateArguments* const args)
  50. {
  51. unsigned int primID = args->primID;
  52. float U = args->u;
  53. float V = args->v;
  54. /* clamp input u,v to [0;1] range */
  55. U = max(min(U,1.0f),0.0f);
  56. V = max(min(V,1.0f),0.0f);
  57. RTCBufferType bufferType = args->bufferType;
  58. unsigned int bufferSlot = args->bufferSlot;
  59. float* P = args->P;
  60. float* dPdu = args->dPdu;
  61. float* dPdv = args->dPdv;
  62. float* ddPdudu = args->ddPdudu;
  63. float* ddPdvdv = args->ddPdvdv;
  64. float* ddPdudv = args->ddPdudv;
  65. unsigned int valueCount = args->valueCount;
  66. /* calculate base pointer and stride */
  67. assert((bufferType == RTC_BUFFER_TYPE_VERTEX && bufferSlot < numTimeSteps) ||
  68. (bufferType == RTC_BUFFER_TYPE_VERTEX_ATTRIBUTE && bufferSlot <= vertexAttribs.size()));
  69. const char* src = nullptr;
  70. size_t stride = 0;
  71. if (bufferType == RTC_BUFFER_TYPE_VERTEX_ATTRIBUTE) {
  72. src = vertexAttribs[bufferSlot].getPtr();
  73. stride = vertexAttribs[bufferSlot].getStride();
  74. } else {
  75. src = vertices[bufferSlot].getPtr();
  76. stride = vertices[bufferSlot].getStride();
  77. }
  78. const Grid& grid = grids[primID];
  79. const int grid_width = grid.resX-1;
  80. const int grid_height = grid.resY-1;
  81. const float rcp_grid_width = rcp(float(grid_width));
  82. const float rcp_grid_height = rcp(float(grid_height));
  83. const int iu = min((int)floor(U*grid_width ),grid_width);
  84. const int iv = min((int)floor(V*grid_height),grid_height);
  85. const float u = U*grid_width-float(iu);
  86. const float v = V*grid_height-float(iv);
  87. for (unsigned int i=0; i<valueCount; i+=N)
  88. {
  89. const size_t ofs = i*sizeof(float);
  90. const unsigned int idx0 = grid.startVtxID + (iv+0)*grid.lineVtxOffset + iu;
  91. const unsigned int idx1 = grid.startVtxID + (iv+1)*grid.lineVtxOffset + iu;
  92. const vbool<N> valid = vint<N>((int)i)+vint<N>(step) < vint<N>(int(valueCount));
  93. const vfloat<N> p0 = mem<vfloat<N>>::loadu(valid,(float*)&src[(idx0+0)*stride+ofs]);
  94. const vfloat<N> p1 = mem<vfloat<N>>::loadu(valid,(float*)&src[(idx0+1)*stride+ofs]);
  95. const vfloat<N> p2 = mem<vfloat<N>>::loadu(valid,(float*)&src[(idx1+1)*stride+ofs]);
  96. const vfloat<N> p3 = mem<vfloat<N>>::loadu(valid,(float*)&src[(idx1+0)*stride+ofs]);
  97. const vbool<N> left = u+v <= 1.0f;
  98. const vfloat<N> Q0 = select(left,p0,p2);
  99. const vfloat<N> Q1 = select(left,p1,p3);
  100. const vfloat<N> Q2 = select(left,p3,p1);
  101. const vfloat<N> U = select(left,u,vfloat<N>(1.0f)-u);
  102. const vfloat<N> V = select(left,v,vfloat<N>(1.0f)-v);
  103. const vfloat<N> W = 1.0f-U-V;
  104. if (P) {
  105. mem<vfloat<N>>::storeu(valid,P+i,madd(W,Q0,madd(U,Q1,V*Q2)));
  106. }
  107. if (dPdu) {
  108. assert(dPdu); mem<vfloat<N>>::storeu(valid,dPdu+i,select(left,Q1-Q0,Q0-Q1)*rcp_grid_width);
  109. assert(dPdv); mem<vfloat<N>>::storeu(valid,dPdv+i,select(left,Q2-Q0,Q0-Q2)*rcp_grid_height);
  110. }
  111. if (ddPdudu) {
  112. assert(ddPdudu); mem<vfloat<N>>::storeu(valid,ddPdudu+i,vfloat<N>(zero));
  113. assert(ddPdvdv); mem<vfloat<N>>::storeu(valid,ddPdvdv+i,vfloat<N>(zero));
  114. assert(ddPdudv); mem<vfloat<N>>::storeu(valid,ddPdudv+i,vfloat<N>(zero));
  115. }
  116. }
  117. }
  118. void addElementsToCount (GeometryCounts & counts) const;
  119. __forceinline unsigned int getNumTotalQuads() const
  120. {
  121. size_t quads = 0;
  122. for (size_t primID=0; primID<numPrimitives; primID++)
  123. quads += getNumQuads(primID);
  124. return quads;
  125. }
  126. __forceinline unsigned int getNumQuads(const size_t gridID) const
  127. {
  128. const Grid& g = grid(gridID);
  129. return (unsigned int) max((int)1,((int)g.resX-1) * ((int)g.resY-1));
  130. }
  131. __forceinline unsigned int getNumSubGrids(const size_t gridID) const
  132. {
  133. const Grid& g = grid(gridID);
  134. return max((unsigned int)1,((unsigned int)g.resX >> 1) * ((unsigned int)g.resY >> 1));
  135. }
  136. /*! get fast access to first vertex buffer */
  137. __forceinline float * getCompactVertexArray () const {
  138. return (float*) vertices0.getPtr();
  139. }
  140. public:
  141. /*! returns number of vertices */
  142. __forceinline size_t numVertices() const {
  143. return vertices[0].size();
  144. }
  145. /*! returns i'th grid*/
  146. __forceinline const Grid& grid(size_t i) const {
  147. return grids[i];
  148. }
  149. /*! returns i'th vertex of the first time step */
  150. __forceinline const Vec3fa vertex(size_t i) const { // FIXME: check if this does a unaligned load
  151. return vertices0[i];
  152. }
  153. /*! returns i'th vertex of the first time step */
  154. __forceinline const char* vertexPtr(size_t i) const {
  155. return vertices0.getPtr(i);
  156. }
  157. /*! returns i'th vertex of itime'th timestep */
  158. __forceinline const Vec3fa vertex(size_t i, size_t itime) const {
  159. return vertices[itime][i];
  160. }
  161. /*! returns i'th vertex of for specified time */
  162. __forceinline const Vec3fa vertex(size_t i, float time) const
  163. {
  164. float ftime;
  165. const size_t itime = timeSegment(time, ftime);
  166. const float t0 = 1.0f - ftime;
  167. const float t1 = ftime;
  168. Vec3fa v0 = vertex(i, itime+0);
  169. Vec3fa v1 = vertex(i, itime+1);
  170. return madd(Vec3fa(t0),v0,t1*v1);
  171. }
  172. /*! returns i'th vertex of itime'th timestep */
  173. __forceinline const char* vertexPtr(size_t i, size_t itime) const {
  174. return vertices[itime].getPtr(i);
  175. }
  176. /*! returns i'th vertex of the first timestep */
  177. __forceinline size_t grid_vertex_index(const Grid& g, size_t x, size_t y) const {
  178. assert(x < (size_t)g.resX);
  179. assert(y < (size_t)g.resY);
  180. return g.startVtxID + x + y * g.lineVtxOffset;
  181. }
  182. /*! returns i'th vertex of the first timestep */
  183. __forceinline const Vec3fa grid_vertex(const Grid& g, size_t x, size_t y) const {
  184. const size_t index = grid_vertex_index(g,x,y);
  185. return vertex(index);
  186. }
  187. /*! returns i'th vertex of the itime'th timestep */
  188. __forceinline const Vec3fa grid_vertex(const Grid& g, size_t x, size_t y, size_t itime) const {
  189. const size_t index = grid_vertex_index(g,x,y);
  190. return vertex(index,itime);
  191. }
  192. /*! returns i'th vertex of the itime'th timestep */
  193. __forceinline const Vec3fa grid_vertex(const Grid& g, size_t x, size_t y, float time) const {
  194. const size_t index = grid_vertex_index(g,x,y);
  195. return vertex(index,time);
  196. }
  197. /*! gathers quad vertices */
  198. __forceinline void gather_quad_vertices(Vec3fa& v0, Vec3fa& v1, Vec3fa& v2, Vec3fa& v3, const Grid& g, size_t x, size_t y) const
  199. {
  200. v0 = grid_vertex(g,x+0,y+0);
  201. v1 = grid_vertex(g,x+1,y+0);
  202. v2 = grid_vertex(g,x+1,y+1);
  203. v3 = grid_vertex(g,x+0,y+1);
  204. }
  205. /*! gathers quad vertices for specified time */
  206. __forceinline void gather_quad_vertices(Vec3fa& v0, Vec3fa& v1, Vec3fa& v2, Vec3fa& v3, const Grid& g, size_t x, size_t y, float time) const
  207. {
  208. v0 = grid_vertex(g,x+0,y+0,time);
  209. v1 = grid_vertex(g,x+1,y+0,time);
  210. v2 = grid_vertex(g,x+1,y+1,time);
  211. v3 = grid_vertex(g,x+0,y+1,time);
  212. }
  213. /*! gathers quad vertices for mblur and non-mblur meshes */
  214. __forceinline void gather_quad_vertices_safe(Vec3fa& v0, Vec3fa& v1, Vec3fa& v2, Vec3fa& v3, const Grid& g, size_t x, size_t y, float time) const
  215. {
  216. if (hasMotionBlur()) gather_quad_vertices(v0,v1,v2,v3,g,x,y,time);
  217. else gather_quad_vertices(v0,v1,v2,v3,g,x,y);
  218. }
  219. /*! calculates the build bounds of the i'th quad, if it's valid */
  220. __forceinline bool buildBoundsQuad(const Grid& g, size_t sx, size_t sy, BBox3fa& bbox) const
  221. {
  222. BBox3fa b(empty);
  223. for (size_t t=0; t<numTimeSteps; t++)
  224. {
  225. for (size_t y=sy;y<sy+2;y++)
  226. for (size_t x=sx;x<sx+2;x++)
  227. {
  228. const Vec3fa v = grid_vertex(g,x,y,t);
  229. if (unlikely(!isvalid(v))) return false;
  230. b.extend(v);
  231. }
  232. }
  233. bbox = b;
  234. return true;
  235. }
  236. /*! calculates the build bounds of the i'th primitive, if it's valid */
  237. __forceinline bool buildBounds(const Grid& g, size_t sx, size_t sy, BBox3fa& bbox) const
  238. {
  239. BBox3fa b(empty);
  240. for (size_t t=0; t<numTimeSteps; t++)
  241. {
  242. for (size_t y=sy;y<min(sy+3,(size_t)g.resY);y++)
  243. for (size_t x=sx;x<min(sx+3,(size_t)g.resX);x++)
  244. {
  245. const Vec3fa v = grid_vertex(g,x,y,t);
  246. if (unlikely(!isvalid(v))) return false;
  247. b.extend(v);
  248. }
  249. }
  250. bbox = b;
  251. return true;
  252. }
  253. /*! calculates the build bounds of the i'th primitive at the itime'th time segment, if it's valid */
  254. __forceinline bool buildBounds(const Grid& g, size_t sx, size_t sy, size_t itime, BBox3fa& bbox) const
  255. {
  256. assert(itime < numTimeSteps);
  257. BBox3fa b0(empty);
  258. for (size_t y=sy;y<min(sy+3,(size_t)g.resY);y++)
  259. for (size_t x=sx;x<min(sx+3,(size_t)g.resX);x++)
  260. {
  261. const Vec3fa v = grid_vertex(g,x,y,itime);
  262. if (unlikely(!isvalid(v))) return false;
  263. b0.extend(v);
  264. }
  265. /* use bounds of first time step in builder */
  266. bbox = b0;
  267. return true;
  268. }
  269. __forceinline bool valid(size_t gridID, size_t itime=0) const {
  270. return valid(gridID, make_range(itime, itime));
  271. }
  272. /*! check if the i'th primitive is valid between the specified time range */
  273. __forceinline bool valid(size_t gridID, const range<size_t>& itime_range) const
  274. {
  275. if (unlikely(gridID >= grids.size())) return false;
  276. const Grid &g = grid(gridID);
  277. if (unlikely(g.startVtxID + 0 >= vertices0.size())) return false;
  278. if (unlikely(g.startVtxID + (g.resY-1)*g.lineVtxOffset + g.resX-1 >= vertices0.size())) return false;
  279. for (size_t y=0;y<g.resY;y++)
  280. for (size_t x=0;x<g.resX;x++)
  281. for (size_t itime = itime_range.begin(); itime <= itime_range.end(); itime++)
  282. if (!isvalid(grid_vertex(g,x,y,itime))) return false;
  283. return true;
  284. }
  285. __forceinline BBox3fa bounds(const Grid& g, size_t sx, size_t sy, size_t itime) const
  286. {
  287. BBox3fa box(empty);
  288. buildBounds(g,sx,sy,itime,box);
  289. return box;
  290. }
  291. __forceinline LBBox3fa linearBounds(const Grid& g, size_t sx, size_t sy, size_t itime) const {
  292. BBox3fa bounds0, bounds1;
  293. buildBounds(g,sx,sy,itime+0,bounds0);
  294. buildBounds(g,sx,sy,itime+1,bounds1);
  295. return LBBox3fa(bounds0,bounds1);
  296. }
  297. /*! calculates the linear bounds of the i'th primitive for the specified time range */
  298. __forceinline LBBox3fa linearBounds(const Grid& g, size_t sx, size_t sy, const BBox1f& dt) const {
  299. return LBBox3fa([&] (size_t itime) { return bounds(g,sx,sy,itime); }, dt, time_range, fnumTimeSegments);
  300. }
  301. __forceinline float projectedPrimitiveArea(const size_t i) const {
  302. return pos_inf;
  303. }
  304. public:
  305. BufferView<Grid> grids; //!< array of triangles
  306. BufferView<Vec3fa> vertices0; //!< fast access to first vertex buffer
  307. Device::vector<BufferView<Vec3fa>> vertices = device; //!< vertex array for each timestep
  308. Device::vector<RawBufferView> vertexAttribs = device; //!< vertex attributes
  309. #if defined(EMBREE_SYCL_SUPPORT)
  310. public:
  311. struct PrimID_XY { uint32_t primID; uint16_t x,y; };
  312. Device::vector<PrimID_XY> quadID_to_primID_xy = device; //!< maps a quad to the primitive ID and grid coordinates
  313. #endif
  314. };
  315. namespace isa
  316. {
  317. struct GridMeshISA : public GridMesh
  318. {
  319. GridMeshISA (Device* device)
  320. : GridMesh(device) {}
  321. LBBox3fa vlinearBounds(size_t buildID, const BBox1f& time_range, const SubGridBuildData * const sgrids) const override {
  322. const SubGridBuildData &subgrid = sgrids[buildID];
  323. const unsigned int primID = subgrid.primID;
  324. const size_t x = subgrid.x();
  325. const size_t y = subgrid.y();
  326. return linearBounds(grid(primID),x,y,time_range);
  327. }
  328. #if defined(EMBREE_SYCL_SUPPORT)
  329. PrimInfo createPrimRefArray(PrimRef* prims, const range<size_t>& r, size_t k, unsigned int geomID) const override
  330. {
  331. PrimInfo pinfo(empty);
  332. for (size_t j=r.begin(); j<r.end(); j++)
  333. {
  334. BBox3fa bounds = empty;
  335. const PrimID_XY& quad = quadID_to_primID_xy[j];
  336. if (!buildBoundsQuad(grids[quad.primID],quad.x,quad.y,bounds)) continue;
  337. const PrimRef prim(bounds,geomID,unsigned(j));
  338. pinfo.add_center2(prim);
  339. prims[k++] = prim;
  340. }
  341. return pinfo;
  342. }
  343. #endif
  344. PrimInfo createPrimRefArray(mvector<PrimRef>& prims, mvector<SubGridBuildData>& sgrids, const range<size_t>& r, size_t k, unsigned int geomID) const override
  345. {
  346. PrimInfo pinfo(empty);
  347. for (size_t j=r.begin(); j<r.end(); j++)
  348. {
  349. if (!valid(j)) continue;
  350. const GridMesh::Grid &g = grid(j);
  351. for (unsigned int y=0; y<g.resY-1u; y+=2)
  352. {
  353. for (unsigned int x=0; x<g.resX-1u; x+=2)
  354. {
  355. BBox3fa bounds = empty;
  356. if (!buildBounds(g,x,y,bounds)) continue; // get bounds of subgrid
  357. const PrimRef prim(bounds,(unsigned)geomID,(unsigned)k);
  358. pinfo.add_center2(prim);
  359. sgrids[k] = SubGridBuildData(x | g.get3x3FlagsX(x), y | g.get3x3FlagsY(y), unsigned(j));
  360. prims[k++] = prim;
  361. }
  362. }
  363. }
  364. return pinfo;
  365. }
  366. #if defined(EMBREE_SYCL_SUPPORT)
  367. PrimInfo createPrimRefArrayMB(PrimRef* prims, const BBox1f& time_range, const range<size_t>& r, size_t k, unsigned int geomID) const override
  368. {
  369. const BBox1f t0t1 = BBox1f::intersect(getTimeRange(), time_range);
  370. PrimInfo pinfo(empty);
  371. for (size_t j=r.begin(); j<r.end(); j++)
  372. {
  373. const PrimID_XY& quad = quadID_to_primID_xy[j];
  374. const LBBox3fa lbounds = linearBounds(grids[quad.primID],quad.x,quad.y,t0t1);
  375. const PrimRef prim(lbounds.bounds(), unsigned(geomID), unsigned(j));
  376. pinfo.add_center2(prim);
  377. prims[k++] = prim;
  378. }
  379. return pinfo;
  380. }
  381. #endif
  382. PrimInfoMB createPrimRefMBArray(mvector<PrimRefMB>& prims, mvector<SubGridBuildData>& sgrids, const BBox1f& t0t1, const range<size_t>& r, size_t k, unsigned int geomID) const override
  383. {
  384. PrimInfoMB pinfoMB(empty);
  385. for (size_t j=r.begin(); j<r.end(); j++)
  386. {
  387. if (!valid(j, timeSegmentRange(t0t1))) continue;
  388. const GridMesh::Grid &g = grid(j);
  389. for (unsigned int y=0; y<g.resY-1u; y+=2)
  390. {
  391. for (unsigned int x=0; x<g.resX-1u; x+=2)
  392. {
  393. const PrimRefMB prim(linearBounds(g,x,y,t0t1),numTimeSegments(),time_range,numTimeSegments(),unsigned(geomID),unsigned(k));
  394. pinfoMB.add_primref(prim);
  395. sgrids[k] = SubGridBuildData(x | g.get3x3FlagsX(x), y | g.get3x3FlagsY(y), unsigned(j));
  396. prims[k++] = prim;
  397. }
  398. }
  399. }
  400. return pinfoMB;
  401. }
  402. };
  403. }
  404. DECLARE_ISA_FUNCTION(GridMesh*, createGridMesh, Device*);
  405. }