[PATCH v5 2/3] vkd3d-shader/hlsl: Implement atan.

2 Nov 2023

From: Petrichor Park ppark@codeweavers.com
---
 libs/vkd3d-shader/hlsl.y            | 48 +++++++++++++++++++++++++++++
 tests/hlsl/inverse-trig.shader_test | 10 +++---
 2 files changed, 53 insertions(+), 5 deletions(-)

diff --git a/libs/vkd3d-shader/hlsl.y b/libs/vkd3d-shader/hlsl.y
index f21aba6ec..3511c4a68 100644
--- a/libs/vkd3d-shader/hlsl.y
+++ b/libs/vkd3d-shader/hlsl.y
@@ -2742,6 +2742,53 @@ static bool intrinsic_asin(struct hlsl_ctx *ctx,
     return write_acos_or_asin(ctx, params, loc, true);
 }
+static bool intrinsic_atan(struct hlsl_ctx *ctx,
+        const struct parse_initializer *params, const struct vkd3d_shader_location *loc)
+{
+    struct hlsl_ir_function_decl *func;
+    struct hlsl_type *type;
+    char *body;
+
+    static const char template[] =
+            "%s atan(%s x)\n"
+            "{\n"
+            "    %s abs_arg = abs(x);\n"
+            "    %s input = (abs_arg < 1.0) ? x : 1.0 / x;\n"
+            /* HLSL pow(x, y) always returns NaN if x<0. So write out the powers longhand. */
+            "    %s x2 = input * input;\n"
+            "    %s x3 = input * x2;\n"
+            "    %s x5 =    x3 * x2;\n"
+            "    %s x7 =    x5 * x2;\n"
+            "    %s x9 =    x7 * x2;\n"
+            "    %s poly_approx = \n"
+            "        0.020265052 * x9\n"
+            "        + -0.0840074 * x7\n"
+            "        + 0.17941668 * x5\n"
+            "        + -0.3301321 * x3\n"
+            "        + 0.99985593 * input;\n"
+            "    return (abs_arg < 1.0)\n"
+            "        ? poly_approx\n"
+            "        : (((x < 0.0 ? -1 : 1) * 3.14159265 / 2.0) - poly_approx);\n"
+            "}";
+
+    if (!(type = elementwise_intrinsic_get_common_type(ctx, params, loc)))
+        return false;
+    type = hlsl_get_numeric_type(ctx, type->class, HLSL_TYPE_FLOAT, type->dimx, type->dimy);
+
+
+    if (!(body = hlsl_sprintf_alloc(ctx, template, type->name, type->name,
+            type->name, type->name,
+            type->name, type->name, type->name, type->name, type->name,
+            type->name)))
+        return false;
+    func = hlsl_compile_internal_function(ctx, "atan", body);
+    vkd3d_free(body);
+    if (!func)
+        return false;
+
+    return add_user_call(ctx, func, params, loc);
+}
+
 /* Find the type corresponding to the given source type, with the same
  * dimensions but a different base type. */
 static struct hlsl_type *convert_numeric_type(const struct hlsl_ctx *ctx,
@@ -3842,6 +3889,7 @@ intrinsic_functions[] =
     {"asfloat",                             1, true,  intrinsic_asfloat},
     {"asin",                                1, true,  intrinsic_asin},
     {"asuint",                             -1, true,  intrinsic_asuint},
+    {"atan",                                1, true,  intrinsic_atan},
     {"clamp",                               3, true,  intrinsic_clamp},
     {"clip",                                1, true,  intrinsic_clip},
     {"cos",                                 1, true,  intrinsic_cos},
diff --git a/tests/hlsl/inverse-trig.shader_test b/tests/hlsl/inverse-trig.shader_test
index 7be7c5e7d..8820ec002 100644
--- a/tests/hlsl/inverse-trig.shader_test
+++ b/tests/hlsl/inverse-trig.shader_test
@@ -5,17 +5,17 @@ float4 main() : sv_target
 {
     // Add 10 to avoid epsilon problems near 0
     // Note that this means -8.5odd means -pi/2
-    return float4(asin(a.x), acos(a.y), 0.0, 0) + 10.0;
+    return float4(asin(a.x), acos(a.y), atan(a.z), 0) + 10.0;
 }
[test]
 uniform 0 float4 -1.0 -1.0 -1.0 0.0
 draw quad
-probe all rgba (8.429203673, 13.141592654, 10.0, 10.0) 256
+probe all rgba (8.429203673, 13.141592654, 9.214601837, 10.0) 256
uniform 0 float4 -0.5 -0.5 -0.5 0.0
 draw quad
-probe all rgba (9.476401224, 12.09439510, 10.0, 10.0) 256
+probe all rgba (9.476401224, 12.09439510, 9.536352391, 10.0) 256
uniform 0 float4 0.0 0.0 0.0 0.0
 draw quad
@@ -23,8 +23,8 @@ probe all rgba (10.0, 11.570796327, 10.0, 10.0) 256
uniform 0 float4 0.5 0.5 0.5 0.0
 draw quad
-probe all rgba (10.52359878, 11.04719755, 10.0, 10.0) 256
+probe all rgba (10.52359878, 11.04719755, 10.46364761, 10.0) 256
uniform 0 float4 1.0 1.0 1.0 0.0
 draw quad
-probe all rgba (11.570796327, 10.0, 10.0, 10.0) 256
+probe all rgba (11.570796327, 10.0, 10.7853981634, 10.0) 256
-- 
GitLab


https://gitlab.winehq.org/wine/vkd3d/-/merge_requests/364

    

2025

2024

2023

2022

[PATCH v5 2/3] vkd3d-shader/hlsl: Implement atan.