// ======================================================================== // // Copyright 2009-2017 Intel Corporation // // // // Licensed under the Apache License, Version 2.0 (the "License"); // // you may not use this file except in compliance with the License. // // You may obtain a copy of the License at // // // // http://www.apache.org/licenses/LICENSE-2.0 // // // // Unless required by applicable law or agreed to in writing, software // // distributed under the License is distributed on an "AS IS" BASIS, // // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // // See the License for the specific language governing permissions and // // limitations under the License. // // ======================================================================== // #include "acceln.h" #include "ray.h" #include "../../include/embree2/rtcore_ray.h" #include "../../common/algorithms/parallel_for.h" namespace embree { AccelN::AccelN () : Accel(AccelData::TY_ACCELN), accels(nullptr), validAccels(nullptr), validIntersectorN(false) {} AccelN::~AccelN() { for (size_t i=0; ivalidAccels.size(); i++) This->validAccels[i]->intersect(ray,context); } void AccelN::intersect4 (const void* valid, void* ptr, RTCRay4& ray, IntersectContext* context) { AccelN* This = (AccelN*)ptr; for (size_t i=0; ivalidAccels.size(); i++) This->validAccels[i]->intersect4(valid,ray,context); } void AccelN::intersect8 (const void* valid, void* ptr, RTCRay8& ray, IntersectContext* context) { AccelN* This = (AccelN*)ptr; for (size_t i=0; ivalidAccels.size(); i++) This->validAccels[i]->intersect8(valid,ray,context); } void AccelN::intersect16 (const void* valid, void* ptr, RTCRay16& ray, IntersectContext* context) { AccelN* This = (AccelN*)ptr; for (size_t i=0; ivalidAccels.size(); i++) This->validAccels[i]->intersect16(valid,ray,context); } void AccelN::intersectN (void* ptr, RTCRay** ray, const size_t N, IntersectContext* context) { AccelN* This = (AccelN*)ptr; for (size_t i=0; ivalidAccels.size(); i++) This->validAccels[i]->intersectN(ray,N,context); } void AccelN::occluded (void* ptr, RTCRay& ray, IntersectContext* context) { AccelN* This = (AccelN*)ptr; for (size_t i=0; ivalidAccels.size(); i++) { This->validAccels[i]->occluded(ray,context); if (ray.geomID == 0) break; } } void AccelN::occluded4 (const void* valid, void* ptr, RTCRay4& ray, IntersectContext* context) { AccelN* This = (AccelN*)ptr; for (size_t i=0; ivalidAccels.size(); i++) { This->validAccels[i]->occluded4(valid,ray,context); #if defined(__SSE2__) vbool4 valid0 = ((vbool4*)valid)[0]; vbool4 hit0 = ((vint4*)ray.geomID)[0] == vint4(0); if (all(valid0,hit0)) break; #endif } } void AccelN::occluded8 (const void* valid, void* ptr, RTCRay8& ray, IntersectContext* context) { AccelN* This = (AccelN*)ptr; for (size_t i=0; ivalidAccels.size(); i++) { This->validAccels[i]->occluded8(valid,ray,context); #if defined(__SSE2__) // FIXME: use AVX code vbool4 valid0 = ((vbool4*)valid)[0]; vbool4 hit0 = ((vint4*)ray.geomID)[0] == vint4(0); vbool4 valid1 = ((vbool4*)valid)[1]; vbool4 hit1 = ((vint4*)ray.geomID)[1] == vint4(0); if (all(valid0,hit0) && all(valid1,hit1)) break; #endif } } void AccelN::occluded16 (const void* valid, void* ptr, RTCRay16& ray, IntersectContext* context) { AccelN* This = (AccelN*)ptr; for (size_t i=0; ivalidAccels.size(); i++) { This->validAccels[i]->occluded16(valid,ray,context); #if defined(__AVX512F__) // FIXME: this code gets never compiler with __AVX512F__ enabled vbool16 valid0 = ((vbool16*)valid)[0]; vbool16 hit0 = ((vint16*)ray.geomID)[0] == vint16(0); if (all(valid0,hit0)) break; #endif } } void AccelN::occludedN (void* ptr, RTCRay** ray, const size_t N, IntersectContext* context) { AccelN* This = (AccelN*)ptr; size_t M = N; for (size_t i=0; ivalidAccels.size(); i++) { This->validAccels[i]->occludedN(ray,M,context); /* only do this optimization if input rays are given in AOS format */ if (context->flags == IntersectContext::INPUT_RAY_DATA_AOS) Ray::filterOutOccluded((Ray**)ray,M); if (M == 0) break; } } void AccelN::print(size_t ident) { for (size_t i=0; iintersectors.print(ident+2); } } void AccelN::immutable() { for (size_t i=0; iimmutable(); } void AccelN::build () { /* build all acceleration structures in parallel */ parallel_for (accels.size(), [&] (size_t i) { accels[i]->build(); }); /* create list of non-empty acceleration structures */ validAccels.clear(); validIntersectorN = true; for (size_t i=0; ibounds.empty()) continue; validAccels.push_back(accels[i]); if (!accels[i]->intersectors.intersectorN) validIntersectorN = false; } if (validAccels.size() == 1) { intersectors = validAccels[0]->intersectors; } else { intersectors.ptr = this; intersectors.intersector1 = Intersector1(&intersect,&occluded,"AccelN::intersector1"); intersectors.intersector4 = Intersector4(&intersect4,&occluded4,"AccelN::intersector4"); intersectors.intersector8 = Intersector8(&intersect8,&occluded8,"AccelN::intersector8"); intersectors.intersector16 = Intersector16(&intersect16,&occluded16,"AccelN::intersector16"); intersectors.intersectorN = IntersectorN(&intersectN,&occludedN,"AccelN::intersectorN"); } /*! calculate bounds */ bounds = empty; for (size_t i=0; ibounds); } void AccelN::select(bool filter4, bool filter8, bool filter16, bool filterN) { for (size_t i=0; iintersectors.select(filter4,filter8,filter16,filterN); } void AccelN::deleteGeometry(size_t geomID) { for (size_t i=0; ideleteGeometry(geomID); } void AccelN::clear() { for (size_t i=0; iclear(); } }