coneline_intersector.h source code [Godot/thirdparty/embree/kernels/geometry/coneline_intersector.h]

1	// Copyright 2009-2021 Intel Corporation
2	// SPDX-License-Identifier: Apache-2.0
3
4	#pragma once
5
6	#include "../common/ray.h"
7	#include "curve_intersector_precalculations.h"
8
9	namespace embree
10	{
11	namespace isa
12	{
13	namespace __coneline_internal
14	{
15	template<int M, typename Epilog, typename ray_tfar_func>
16	static __forceinline bool intersectCone(const vbool<M>& valid_i,
17	const Vec3vf<M>& ray_org_in, const Vec3vf<M>& ray_dir,
18	const vfloat<M>& ray_tnear, const ray_tfar_func& ray_tfar,
19	const Vec4vf<M>& v0, const Vec4vf<M>& v1,
20	const vbool<M>& cL, const vbool<M>& cR,
21	const Epilog& epilog)
22	{
23	vbool<M> valid = valid_i;
24
25	/ move ray origin closer to make calculations numerically stable /
26	const vfloat<M> dOdO = sqr(ray_dir);
27	const vfloat<M> rcp_dOdO = rcp(dOdO);
28	const Vec3vf<M> center = vfloat<M>(`0.5f`)*(v0.xyz()+v1.xyz());
29	const vfloat<M> dt = dot(center-ray_org_in,ray_dir)*rcp_dOdO;
30	const Vec3vf<M> ray_org = ray_org_in + dt*ray_dir;
31
32	const Vec3vf<M> dP = v1.xyz() - v0.xyz();
33	const Vec3vf<M> p0 = ray_org - v0.xyz();
34	const Vec3vf<M> p1 = ray_org - v1.xyz();
35
36	const vfloat<M> dPdP = sqr(dP);
37	const vfloat<M> dP0 = dot(p0,dP);
38	const vfloat<M> dP1 = dot(p1,dP);
39	const vfloat<M> dOdP = dot(ray_dir,dP);
40
41	// intersect cone body
42	const vfloat<M> dr = v0.w - v1.w;
43	const vfloat<M> hy = dPdP + sqr(dr);
44	const vfloat<M> dO0 = dot(ray_dir,p0);
45	const vfloat<M> OO = sqr(p0);
46	const vfloat<M> dPdP2 = sqr(dPdP);
47	const vfloat<M> dPdPr0 = dPdP*v0.w;
48
49	const vfloat<M> A = dPdP2 - sqr(dOdP)*hy;
50	const vfloat<M> B = dPdP2dO0 - dP0dOdPhy + dPdPr0(dr*dOdP);
51	const vfloat<M> C = dPdP2OO - sqr(dP0)hy + dPdPr0(`2.0f`dr*dP0 - dPdPr0);
52
53	const vfloat<M> D = BB - AC;
54	valid &= D >= `0.0f`;
55	if (unlikely(none(valid))) {
56	return false;
57	}
58
59	/ standard case for "non-parallel" rays /
60	const vfloat<M> Q = sqrt(D);
61	const vfloat<M> rcp_A = rcp(A);
62	/ special case for rays that are "parallel" to the cone - assume miss /
63	const vbool<M> isParallel = abs(A) <= min_rcp_input;
64
65	vfloat<M> t_cone_lower = select (isParallel, neg_inf, (-B-Q)*rcp_A);
66	vfloat<M> t_cone_upper = select (isParallel, pos_inf, (-B+Q)*rcp_A);
67	const vfloat<M> y_lower = dP0 + t_cone_lower*dOdP;
68	const vfloat<M> y_upper = dP0 + t_cone_upper*dOdP;
69	t_cone_lower = select(valid & y_lower > `0.0f` & y_lower < dPdP, t_cone_lower, pos_inf);
70	t_cone_upper = select(valid & y_upper > `0.0f` & y_upper < dPdP, t_cone_upper, neg_inf);
71
72	const vbool<M> hitDisk0 = valid & cL;
73	const vbool<M> hitDisk1 = valid & cR;
74	const vfloat<M> rcp_dOdP = rcp(dOdP);
75	const vfloat<M> t_disk0 = select (hitDisk0, select (sqr(p0dOdP-ray_dirdP0)<(sqr(v0.w)sqr(dOdP)), -dP0rcp_dOdP, pos_inf), pos_inf);
76	const vfloat<M> t_disk1 = select (hitDisk1, select (sqr(p1dOdP-ray_dirdP1)<(sqr(v1.w)sqr(dOdP)), -dP1rcp_dOdP, pos_inf), pos_inf);
77	const vfloat<M> t_disk_lower = min(t_disk0, t_disk1);
78	const vfloat<M> t_disk_upper = max(t_disk0, t_disk1);
79
80	const vfloat<M> t_lower = min(t_cone_lower, t_disk_lower);
81	const vfloat<M> t_upper = max(t_cone_upper, select(t_lower==t_disk_lower,
82	select(t_disk_upper==vfloat<M>(pos_inf),neg_inf,t_disk_upper),
83	select(t_disk_lower==vfloat<M>(pos_inf),neg_inf,t_disk_lower)));
84
85	const vbool<M> valid_lower = valid & ray_tnear <= dt+t_lower & dt+t_lower <= ray_tfar() & t_lower != vfloat<M>(pos_inf);
86	const vbool<M> valid_upper = valid & ray_tnear <= dt+t_upper & dt+t_upper <= ray_tfar() & t_upper != vfloat<M>(neg_inf);
87
88	const vbool<M> valid_first = valid_lower \| valid_upper;
89	if (unlikely(none(valid_first)))
90	return false;
91
92	const vfloat<M> t_first = select(valid_lower, t_lower, t_upper);
93	const vfloat<M> y_first = select(valid_lower, y_lower, y_upper);
94
95	const vfloat<M> rcp_dPdP = rcp(dPdP);
96	const Vec3vf<M> dP2drr0dP = dPdPdrv0.w*dP;
97	const Vec3vf<M> dPhy = dP*hy;
98	const vbool<M> cone_hit_first = valid & (t_first == t_cone_lower \| t_first == t_cone_upper);
99	const vbool<M> disk0_hit_first = valid & (t_first == t_disk0);
100	const Vec3vf<M> Ng_first = select(cone_hit_first, dPdP2(p0+t_firstray_dir)+dP2drr0dP-dPhy*y_first, select(disk0_hit_first, -dP, dP));
101	const vfloat<M> u_first = select(cone_hit_first, y_first*rcp_dPdP, select(disk0_hit_first, vfloat<M>(zero), vfloat<M>(one)));
102
103	/ invoke intersection filter for first hit /
104	RoundLineIntersectorHitM<M> hit(u_first,zero,dt+t_first,Ng_first);
105	const bool is_hit_first = epilog(valid_first, hit);
106
107	/ check for possible second hits before potentially accepted hit /
108	const vfloat<M> t_second = t_upper;
109	const vfloat<M> y_second = y_upper;
110	const vbool<M> valid_second = valid_lower & valid_upper & (dt+t_upper <= ray_tfar());
111	if (unlikely(none(valid_second)))
112	return is_hit_first;
113
114	/ invoke intersection filter for second hit /
115	const vbool<M> cone_hit_second = t_second == t_cone_lower \| t_second == t_cone_upper;
116	const vbool<M> disk0_hit_second = t_second == t_disk0;
117	const Vec3vf<M> Ng_second = select(cone_hit_second, dPdP2(p0+t_secondray_dir)+dP2drr0dP-dPhy*y_second, select(disk0_hit_second, -dP, dP));
118	const vfloat<M> u_second = select(cone_hit_second, y_second*rcp_dPdP, select(disk0_hit_first, vfloat<M>(zero), vfloat<M>(one)));
119
120	hit = RoundLineIntersectorHitM<M>(u_second,zero,dt+t_second,Ng_second);
121	const bool is_hit_second = epilog(valid_second, hit);
122
123	return is_hit_first \| is_hit_second;
124	}
125	}
126
127	template<int M>
128	struct ConeLineIntersectorHitM
129	{
130	__forceinline ConeLineIntersectorHitM() {}
131
132	__forceinline ConeLineIntersectorHitM(const vfloat<M>& u, const vfloat<M>& v, const vfloat<M>& t, const Vec3vf<M>& Ng)
133	: vu(u), vv(v), vt(t), vNg(Ng) {}
134
135	__forceinline void finalize() {}
136
137	__forceinline Vec2f uv (const size_t i) const { return Vec2f(vu[i],vv[i]); }
138	__forceinline float t (const size_t i) const { return vt[i]; }
139	__forceinline Vec3fa Ng(const size_t i) const { return Vec3fa(vNg.x[i],vNg.y[i],vNg.z[i]); }
140
141	public:
142	vfloat<M> vu;
143	vfloat<M> vv;
144	vfloat<M> vt;
145	Vec3vf<M> vNg;
146	};
147
148	template<int M>
149	struct ConeCurveIntersector1
150	{
151	typedef CurvePrecalculations1 Precalculations;
152
153	struct ray_tfar {
154	Ray& ray;
155	__forceinline ray_tfar(Ray& ray) : ray(ray) {}
156	__forceinline vfloat<M> operator() () const { return ray.tfar; };
157	};
158
159	template<typename Epilog>
160	static __forceinline bool intersect(const vbool<M>& valid_i,
161	Ray& ray,
162	IntersectContext* context,
163	const LineSegments* geom,
164	const Precalculations& pre,
165	const Vec4vf<M>& v0i, const Vec4vf<M>& v1i,
166	const vbool<M>& cL, const vbool<M>& cR,
167	const Epilog& epilog)
168	{
169	const Vec3vf<M> ray_org(ray.org.x, ray.org.y, ray.org.z);
170	const Vec3vf<M> ray_dir(ray.dir.x, ray.dir.y, ray.dir.z);
171	const vfloat<M> ray_tnear(ray.tnear());
172	const Vec4vf<M> v0 = enlargeRadiusToMinWidth<M>(context,geom,ray_org,v0i);
173	const Vec4vf<M> v1 = enlargeRadiusToMinWidth<M>(context,geom,ray_org,v1i);
174	return __coneline_internal::intersectCone<M>(valid_i,ray_org,ray_dir,ray_tnear,ray_tfar(ray),v0,v1,cL,cR,epilog);
175	}
176	};
177
178	template<int M, int K>
179	struct ConeCurveIntersectorK
180	{
181	typedef CurvePrecalculationsK<K> Precalculations;
182
183	struct ray_tfar {
184	RayK<K>& ray;
185	size_t k;
186	__forceinline ray_tfar(RayK<K>& ray, size_t k) : ray(ray), k(k) {}
187	__forceinline vfloat<M> operator() () const { return ray.tfar[k]; };
188	};
189
190	template<typename Epilog>
191	static __forceinline bool intersect(const vbool<M>& valid_i,
192	RayK<K>& ray, size_t k,
193	IntersectContext* context,
194	const LineSegments* geom,
195	const Precalculations& pre,
196	const Vec4vf<M>& v0i, const Vec4vf<M>& v1i,
197	const vbool<M>& cL, const vbool<M>& cR,
198	const Epilog& epilog)
199	{
200	const Vec3vf<M> ray_org(ray.org.x[k], ray.org.y[k], ray.org.z[k]);
201	const Vec3vf<M> ray_dir(ray.dir.x[k], ray.dir.y[k], ray.dir.z[k]);
202	const vfloat<M> ray_tnear = ray.tnear()[k];
203	const Vec4vf<M> v0 = enlargeRadiusToMinWidth<M>(context,geom,ray_org,v0i);
204	const Vec4vf<M> v1 = enlargeRadiusToMinWidth<M>(context,geom,ray_org,v1i);
205	return __coneline_internal::intersectCone<M>(valid_i,ray_org,ray_dir,ray_tnear,ray_tfar(ray,k),v0,v1,cL,cR,epilog);
206	}
207	};
208	}
209	}
210

Browse the source code of Godot/thirdparty/embree/kernels/geometry/coneline_intersector.h