#6 [DO NOT SQUASH] Performance improvements for vector.lua

오픈
pgimeno pgimeno/pg-accelerate-dir2rot 에서 pgimeno/master 로 2 commits 를 머지하려 합니다
1개의 변경된 파일76개의 추가작업 그리고 38개의 파일을 삭제
  1. 76 38
      builtin/common/vector.lua

+ 76 - 38
builtin/common/vector.lua

@@ -1,6 +1,18 @@
 
 vector = {}
 
+-- Cache math functions in locals
+local vector = vector
+local math_sin = math.sin
+local math_cos = math.cos
+local math_asin = math.asin
+local math_atan2 = math.atan2
+local math_pi = math.pi
+local math_sqrt = math.sqrt
+local math_floor = math.floor
+local math_hypot = math.hypot
+assert(math_hypot, "Wrong loading order")
+
 function vector.new(a, b, c)
 	if type(a) == "table" then
 		assert(a.x and a.y and a.z, "Invalid vector passed to vector.new()")
@@ -19,7 +31,7 @@ function vector.equals(a, b)
 end
 
 function vector.length(v)
-	return math.hypot(v.x, math.hypot(v.y, v.z))
+	return math_hypot(v.x, math_hypot(v.y, v.z))
 end
 
 function vector.normalize(v)
@@ -33,17 +45,17 @@ end
 
 function vector.floor(v)
 	return {
-		x = math.floor(v.x),
-		y = math.floor(v.y),
-		z = math.floor(v.z)
+		x = math_floor(v.x),
+		y = math_floor(v.y),
+		z = math_floor(v.z)
 	}
 end
 
 function vector.round(v)
 	return {
-		x = math.floor(v.x + 0.5),
-		y = math.floor(v.y + 0.5),
-		z = math.floor(v.z + 0.5)
+		x = math_floor(v.x + 0.5),
+		y = math_floor(v.y + 0.5),
+		z = math_floor(v.z + 0.5)
 	}
 end
 
@@ -59,7 +71,7 @@ function vector.distance(a, b)
 	local x = a.x - b.x
 	local y = a.y - b.y
 	local z = a.z - b.z
-	return math.hypot(x, math.hypot(y, z))
+	return math_hypot(x, math_hypot(y, z))
 end
 
 function vector.direction(pos1, pos2)
@@ -74,7 +86,7 @@ function vector.angle(a, b)
 	local dotp = vector.dot(a, b)
 	local cp = vector.cross(a, b)
 	local crossplen = vector.length(cp)
-	return math.atan2(crossplen, dotp)
+	return math_atan2(crossplen, dotp)
 end
 
 function vector.dot(a, b)
@@ -143,18 +155,18 @@ function vector.sort(a, b)
 end
 
 local function sin(x)
-	if x % math.pi == 0 then
+	if x % math_pi == 0 then
 		return 0
 	else
-		return math.sin(x)
+		return math_sin(x)
 	end
 end
 
 local function cos(x)
-	if x % math.pi == math.pi / 2 then
+	if x % math_pi == math_pi / 2 then
 		return 0
 	else
-		return math.cos(x)
+		return math_cos(x)
 	end
 end
 
@@ -178,7 +190,7 @@ function vector.rotate(v, rot)
 	local sinroll = sin(-rot.z)
 	local cospitch = cos(rot.x)
 	local cosyaw = cos(rot.y)
-	local cosroll = math.cos(rot.z)
+	local cosroll = cos(rot.z)
 	-- Rotation matrix that applies yaw, pitch and roll
 	local matrix = {
 		{
@@ -205,32 +217,58 @@ function vector.rotate(v, rot)
 	)
 end
 
+-- dir_to_rotation implementation
+
+-- Excerpt from PR #8515, converted to specify the matrix as multiple args.
+local function m3arg_to_pitch_yaw_roll(m11, m12, m13, m21, m22, m23, m31, m32, m33)
+	local y = math_atan2(-m13, m33)
+	local c2 = math_sqrt(m21^2 + m22^2)
+	local x = math_atan2(m23, c2)
+	local s1 = math_sin(y)
+	local c1 = math_cos(y)
+	local z = math_atan2(s1 * m32 + c1 * m12, s1 * m31 + c1 * m11)
+	return x, y, z
+end
+
+-- Cross product with one argument per component.
+local function v3arg_cross(x1, y1, z1, x2, y2, z2)
+	return y1*z2 - z1*y2, z1*x2 - x1*z2, x1*y2 - y1*x2
+end
+
+-- Normalization with one argument per component, returning length.
+local function v3arg_normalize(x, y, z)
+	local len = math_hypot(x, math_hypot(y, z))
+	return x / len, y / len, z / len, len
+end
+
 function vector.dir_to_rotation(forward, up)
-	forward = vector.normalize(forward)
-	local rot = {x = math.asin(forward.y), y = -math.atan2(forward.x, forward.z), z = 0}
+	-- Normalize forward, defaulting to 0,0,1.
+	local fx, fy, fz, len = v3arg_normalize(forward.x, forward.y, forward.z)
+	if len == 0 then
+		-- Zero length
+		fx, fy, fz = 0, 0, 1
+	end
+
 	if not up then
-		return rot
+		return {x = math_asin(fy), y = -math_atan2(fx, fz), z = 0}
 	end
-	assert(vector.dot(forward, up) < 0.000001,
-			"Invalid vectors passed to vector.dir_to_rotation().")
-	up = vector.normalize(up)
-	-- Calculate vector pointing up with roll = 0, just based on forward vector.
-	local forwup = vector.rotate({x = 0, y = 1, z = 0}, rot)
-	-- 'forwup' and 'up' are now in a plane with 'forward' as normal.
-	-- The angle between them is the absolute of the roll value we're looking for.
-	rot.z = vector.angle(forwup, up)
-
-	-- Since vector.angle never returns a negative value or a value greater
-	-- than math.pi, rot.z has to be inverted sometimes.
-	-- To determine wether this is the case, we rotate the up vector back around
-	-- the forward vector and check if it worked out.
-	local back = vector.rotate_around_axis(up, forward, -rot.z)
-
-	-- We don't use vector.equals for this because of floating point imprecision.
-	if (back.x - forwup.x) * (back.x - forwup.x) +
-			(back.y - forwup.y) * (back.y - forwup.y) +
-			(back.z - forwup.z) * (back.z - forwup.z) > 0.0000001 then
-		rot.z = -rot.z
+	local ux, uy, uz = up.x, up.y, up.z
+
+	-- Synthesize a right vector via cross product of up and forward.
+	local rx, ry, rz = v3arg_cross(ux, uy, uz, fx, fy, fz)
+
+	-- Normalize right, defaulting to 1,0,0.
+	rx, ry, rz, len = v3arg_normalize(rx, ry, rz)
+	if len == 0 then
+		-- Zero length
+		rx, ry, rz = 1, 0, 0
 	end
-	return rot
+
+	-- Calculate a new up vector as cross product of forward and right.
+	-- The resulting up vector is guaranteed to be normalized.
+	ux, uy, uz = v3arg_cross(fx, fy, fz,  rx, ry, rz)
+
+	-- We have an orthogonal matrix now; convert it to Euler.
+	local x, y, z = m3arg_to_pitch_yaw_roll(rx, ux, fx, ry, uy, fy, rz, uz, fz)
+	return {x = x, y = y, z = z}
 end