@luma.gl/shadertools 9.1.9 → 9.2.0-alpha.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/dist.dev.js +1614 -3716
- package/dist/dist.min.js +278 -484
- package/dist/index.cjs +366 -804
- package/dist/index.cjs.map +4 -4
- package/dist/index.d.ts +0 -6
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +0 -10
- package/dist/index.js.map +1 -1
- package/dist/lib/shader-assembly/assemble-shaders.d.ts +6 -4
- package/dist/lib/shader-assembly/assemble-shaders.d.ts.map +1 -1
- package/dist/lib/shader-assembly/assemble-shaders.js +14 -9
- package/dist/lib/shader-assembly/assemble-shaders.js.map +1 -1
- package/dist/lib/shader-assembly/platform-info.d.ts +1 -1
- package/dist/lib/shader-assembly/platform-info.d.ts.map +1 -1
- package/dist/lib/shader-module/shader-module.d.ts +1 -1
- package/dist/lib/shader-module/shader-module.d.ts.map +1 -1
- package/dist/lib/wgsl/get-shader-layout-wgsl.d.ts.map +1 -1
- package/dist/lib/wgsl/get-shader-layout-wgsl.js +3 -1
- package/dist/lib/wgsl/get-shader-layout-wgsl.js.map +1 -1
- package/dist/modules/engine/project/project.d.ts.map +1 -1
- package/dist/modules/engine/project/project.js +4 -2
- package/dist/modules/engine/project/project.js.map +1 -1
- package/dist/modules/lighting/gouraud-material/gouraud-material.js +1 -1
- package/dist/modules/lighting/gouraud-material/gouraud-material.js.map +1 -1
- package/dist/modules/lighting/lights/{lighting-uniforms-glsl.d.ts → lighting-glsl.d.ts} +1 -1
- package/dist/modules/lighting/lights/lighting-glsl.d.ts.map +1 -0
- package/dist/modules/lighting/lights/{lighting-uniforms-glsl.js → lighting-glsl.js} +1 -1
- package/dist/modules/lighting/lights/lighting-glsl.js.map +1 -0
- package/dist/modules/lighting/lights/{lighting-uniforms-wgsl.d.ts → lighting-wgsl.d.ts} +1 -1
- package/dist/modules/lighting/lights/lighting-wgsl.d.ts.map +1 -0
- package/dist/modules/lighting/lights/{lighting-uniforms-wgsl.js → lighting-wgsl.js} +1 -1
- package/dist/modules/lighting/lights/lighting-wgsl.js.map +1 -0
- package/dist/modules/lighting/lights/lighting.d.ts +1 -3
- package/dist/modules/lighting/lights/lighting.d.ts.map +1 -1
- package/dist/modules/lighting/lights/lighting.js +4 -4
- package/dist/modules/lighting/lights/lighting.js.map +1 -1
- package/dist/modules/lighting/no-material/dirlight.d.ts.map +1 -1
- package/dist/modules/lighting/no-material/dirlight.js +1 -2
- package/dist/modules/lighting/no-material/dirlight.js.map +1 -1
- package/dist/modules/lighting/pbr-material/{pbr-fragment-glsl.d.ts → pbr-material-glsl.d.ts} +2 -1
- package/dist/modules/lighting/pbr-material/pbr-material-glsl.d.ts.map +1 -0
- package/dist/modules/lighting/pbr-material/{pbr-fragment-glsl.js → pbr-material-glsl.js} +36 -1
- package/dist/modules/lighting/pbr-material/pbr-material-glsl.js.map +1 -0
- package/dist/modules/lighting/pbr-material/pbr-material-wgsl.d.ts +3 -0
- package/dist/modules/lighting/pbr-material/pbr-material-wgsl.d.ts.map +1 -0
- package/dist/modules/lighting/pbr-material/pbr-material-wgsl.js +487 -0
- package/dist/modules/lighting/pbr-material/pbr-material-wgsl.js.map +1 -0
- package/dist/modules/lighting/pbr-material/pbr-material.d.ts +11 -4
- package/dist/modules/lighting/pbr-material/pbr-material.d.ts.map +1 -1
- package/dist/modules/lighting/pbr-material/pbr-material.js +12 -12
- package/dist/modules/lighting/pbr-material/pbr-material.js.map +1 -1
- package/dist/modules/lighting/pbr-material/pbr-projection.d.ts.map +1 -1
- package/dist/modules/lighting/pbr-material/pbr-projection.js.map +1 -1
- package/dist/modules/lighting/phong-material/phong-material.js +1 -1
- package/dist/modules/lighting/phong-material/phong-material.js.map +1 -1
- package/dist/modules/lighting/phong-material/phong-shaders-glsl.d.ts +1 -1
- package/dist/modules/lighting/phong-material/phong-shaders-glsl.d.ts.map +1 -1
- package/dist/modules/lighting/phong-material/phong-shaders-glsl.js +2 -0
- package/dist/modules/lighting/phong-material/phong-shaders-glsl.js.map +1 -1
- package/dist/modules/math/random/random.d.ts +1 -0
- package/dist/modules/math/random/random.d.ts.map +1 -1
- package/dist/modules/math/random/random.js +7 -0
- package/dist/modules/math/random/random.js.map +1 -1
- package/package.json +3 -3
- package/src/index.ts +0 -17
- package/src/lib/shader-assembly/assemble-shaders.ts +12 -11
- package/src/lib/shader-assembly/platform-info.ts +1 -1
- package/src/lib/shader-module/shader-module.ts +1 -1
- package/src/lib/wgsl/get-shader-layout-wgsl.ts +7 -5
- package/src/modules/engine/project/project.ts +8 -5
- package/src/modules/lighting/gouraud-material/gouraud-material.ts +1 -1
- package/src/modules/lighting/lights/lighting.ts +4 -4
- package/src/modules/lighting/no-material/dirlight.ts +2 -3
- package/src/modules/lighting/pbr-material/{pbr-fragment-glsl.ts → pbr-material-glsl.ts} +36 -1
- package/src/modules/lighting/pbr-material/pbr-material-wgsl.ts +490 -0
- package/src/modules/lighting/pbr-material/pbr-material.ts +12 -12
- package/src/modules/lighting/pbr-material/pbr-projection.ts +0 -2
- package/src/modules/lighting/phong-material/phong-material.ts +1 -1
- package/src/modules/lighting/phong-material/phong-shaders-glsl.ts +2 -0
- package/src/modules/math/random/random.ts +8 -0
- package/dist/modules/lighting/lights/lighting-uniforms-glsl.d.ts.map +0 -1
- package/dist/modules/lighting/lights/lighting-uniforms-glsl.js.map +0 -1
- package/dist/modules/lighting/lights/lighting-uniforms-wgsl.d.ts.map +0 -1
- package/dist/modules/lighting/lights/lighting-uniforms-wgsl.js.map +0 -1
- package/dist/modules/lighting/pbr-material/pbr-fragment-glsl.d.ts.map +0 -1
- package/dist/modules/lighting/pbr-material/pbr-fragment-glsl.js.map +0 -1
- package/dist/modules/lighting/pbr-material/pbr-uniforms-glsl.d.ts +0 -2
- package/dist/modules/lighting/pbr-material/pbr-uniforms-glsl.d.ts.map +0 -1
- package/dist/modules/lighting/pbr-material/pbr-uniforms-glsl.js +0 -67
- package/dist/modules/lighting/pbr-material/pbr-uniforms-glsl.js.map +0 -1
- package/dist/modules/lighting/pbr-material/pbr-vertex-glsl.d.ts +0 -2
- package/dist/modules/lighting/pbr-material/pbr-vertex-glsl.d.ts.map +0 -1
- package/dist/modules/lighting/pbr-material/pbr-vertex-glsl.js +0 -39
- package/dist/modules/lighting/pbr-material/pbr-vertex-glsl.js.map +0 -1
- package/dist/modules/module-injectors.d.ts +0 -3
- package/dist/modules/module-injectors.d.ts.map +0 -1
- package/dist/modules/module-injectors.js +0 -31
- package/dist/modules/module-injectors.js.map +0 -1
- package/dist/modules-webgl1/geometry/geometry.d.ts +0 -9
- package/dist/modules-webgl1/geometry/geometry.d.ts.map +0 -1
- package/dist/modules-webgl1/geometry/geometry.js +0 -39
- package/dist/modules-webgl1/geometry/geometry.js.map +0 -1
- package/dist/modules-webgl1/lighting/dirlight/dirlight.d.ts +0 -10
- package/dist/modules-webgl1/lighting/dirlight/dirlight.d.ts.map +0 -1
- package/dist/modules-webgl1/lighting/dirlight/dirlight.js +0 -38
- package/dist/modules-webgl1/lighting/dirlight/dirlight.js.map +0 -1
- package/dist/modules-webgl1/lighting/lights/lights-glsl.d.ts +0 -2
- package/dist/modules-webgl1/lighting/lights/lights-glsl.d.ts.map +0 -1
- package/dist/modules-webgl1/lighting/lights/lights-glsl.js +0 -40
- package/dist/modules-webgl1/lighting/lights/lights-glsl.js.map +0 -1
- package/dist/modules-webgl1/lighting/lights/lights.d.ts +0 -38
- package/dist/modules-webgl1/lighting/lights/lights.d.ts.map +0 -1
- package/dist/modules-webgl1/lighting/lights/lights.js +0 -93
- package/dist/modules-webgl1/lighting/lights/lights.js.map +0 -1
- package/dist/modules-webgl1/lighting/pbr/pbr-fragment-glsl.d.ts +0 -2
- package/dist/modules-webgl1/lighting/pbr/pbr-fragment-glsl.d.ts.map +0 -1
- package/dist/modules-webgl1/lighting/pbr/pbr-fragment-glsl.js +0 -393
- package/dist/modules-webgl1/lighting/pbr/pbr-fragment-glsl.js.map +0 -1
- package/dist/modules-webgl1/lighting/pbr/pbr-vertex-glsl.d.ts +0 -2
- package/dist/modules-webgl1/lighting/pbr/pbr-vertex-glsl.d.ts.map +0 -1
- package/dist/modules-webgl1/lighting/pbr/pbr-vertex-glsl.js +0 -43
- package/dist/modules-webgl1/lighting/pbr/pbr-vertex-glsl.js.map +0 -1
- package/dist/modules-webgl1/lighting/pbr/pbr.d.ts +0 -23
- package/dist/modules-webgl1/lighting/pbr/pbr.d.ts.map +0 -1
- package/dist/modules-webgl1/lighting/pbr/pbr.js +0 -21
- package/dist/modules-webgl1/lighting/pbr/pbr.js.map +0 -1
- package/dist/modules-webgl1/lighting/phong-lighting/phong-lighting-glsl.d.ts +0 -2
- package/dist/modules-webgl1/lighting/phong-lighting/phong-lighting-glsl.d.ts.map +0 -1
- package/dist/modules-webgl1/lighting/phong-lighting/phong-lighting-glsl.js +0 -79
- package/dist/modules-webgl1/lighting/phong-lighting/phong-lighting-glsl.js.map +0 -1
- package/dist/modules-webgl1/lighting/phong-lighting/phong-lighting.d.ts +0 -45
- package/dist/modules-webgl1/lighting/phong-lighting/phong-lighting.d.ts.map +0 -1
- package/dist/modules-webgl1/lighting/phong-lighting/phong-lighting.js +0 -44
- package/dist/modules-webgl1/lighting/phong-lighting/phong-lighting.js.map +0 -1
- package/dist/modules-webgl1/math/fp64/fp64-arithmetic-glsl.d.ts +0 -2
- package/dist/modules-webgl1/math/fp64/fp64-arithmetic-glsl.d.ts.map +0 -1
- package/dist/modules-webgl1/math/fp64/fp64-arithmetic-glsl.js +0 -171
- package/dist/modules-webgl1/math/fp64/fp64-arithmetic-glsl.js.map +0 -1
- package/dist/modules-webgl1/math/fp64/fp64-functions-glsl.d.ts +0 -2
- package/dist/modules-webgl1/math/fp64/fp64-functions-glsl.d.ts.map +0 -1
- package/dist/modules-webgl1/math/fp64/fp64-functions-glsl.js +0 -675
- package/dist/modules-webgl1/math/fp64/fp64-functions-glsl.js.map +0 -1
- package/dist/modules-webgl1/math/fp64/fp64.d.ts +0 -35
- package/dist/modules-webgl1/math/fp64/fp64.d.ts.map +0 -1
- package/dist/modules-webgl1/math/fp64/fp64.js +0 -38
- package/dist/modules-webgl1/math/fp64/fp64.js.map +0 -1
- package/dist/modules-webgl1/project/project.d.ts +0 -20
- package/dist/modules-webgl1/project/project.d.ts.map +0 -1
- package/dist/modules-webgl1/project/project.js +0 -114
- package/dist/modules-webgl1/project/project.js.map +0 -1
- package/src/modules/lighting/pbr-material/pbr-uniforms-glsl.ts +0 -67
- package/src/modules/lighting/pbr-material/pbr-vertex-glsl.ts +0 -39
- package/src/modules/module-injectors.ts +0 -32
- package/src/modules-webgl1/geometry/geometry.ts +0 -41
- package/src/modules-webgl1/lighting/dirlight/dirlight.ts +0 -50
- package/src/modules-webgl1/lighting/lights/lights-glsl.ts +0 -40
- package/src/modules-webgl1/lighting/lights/lights.ts +0 -143
- package/src/modules-webgl1/lighting/pbr/README.md +0 -12
- package/src/modules-webgl1/lighting/pbr/pbr-fragment-glsl.ts +0 -396
- package/src/modules-webgl1/lighting/pbr/pbr-vertex-glsl.ts +0 -43
- package/src/modules-webgl1/lighting/pbr/pbr.ts +0 -23
- package/src/modules-webgl1/lighting/phong-lighting/phong-lighting-glsl.ts +0 -79
- package/src/modules-webgl1/lighting/phong-lighting/phong-lighting.ts +0 -64
- package/src/modules-webgl1/math/fp64/fp64-arithmetic-glsl.ts +0 -171
- package/src/modules-webgl1/math/fp64/fp64-functions-glsl.ts +0 -675
- package/src/modules-webgl1/math/fp64/fp64.ts +0 -44
- package/src/modules-webgl1/project/README.md +0 -52
- package/src/modules-webgl1/project/project.ts +0 -135
- /package/src/modules/lighting/lights/{lighting-uniforms-glsl.ts → lighting-glsl.ts} +0 -0
- /package/src/modules/lighting/lights/{lighting-uniforms-wgsl.ts → lighting-wgsl.ts} +0 -0
|
@@ -1,675 +0,0 @@
|
|
|
1
|
-
// luma.gl
|
|
2
|
-
// SPDX-License-Identifier: MIT
|
|
3
|
-
// Copyright (c) vis.gl contributors
|
|
4
|
-
|
|
5
|
-
export const fp64functionShader = /* glsl */ `\
|
|
6
|
-
const vec2 E_FP64 = vec2(2.7182817459106445e+00, 8.254840366817007e-08);
|
|
7
|
-
const vec2 LOG2_FP64 = vec2(0.6931471824645996e+00, -1.9046542121259336e-09);
|
|
8
|
-
const vec2 PI_FP64 = vec2(3.1415927410125732, -8.742278012618954e-8);
|
|
9
|
-
const vec2 TWO_PI_FP64 = vec2(6.2831854820251465, -1.7484556025237907e-7);
|
|
10
|
-
const vec2 PI_2_FP64 = vec2(1.5707963705062866, -4.371139006309477e-8);
|
|
11
|
-
const vec2 PI_4_FP64 = vec2(0.7853981852531433, -2.1855695031547384e-8);
|
|
12
|
-
const vec2 PI_16_FP64 = vec2(0.19634954631328583, -5.463923757886846e-9);
|
|
13
|
-
const vec2 PI_16_2_FP64 = vec2(0.39269909262657166, -1.0927847515773692e-8);
|
|
14
|
-
const vec2 PI_16_3_FP64 = vec2(0.5890486240386963, -1.4906100798128818e-9);
|
|
15
|
-
const vec2 PI_180_FP64 = vec2(0.01745329238474369, 1.3519960498364902e-10);
|
|
16
|
-
|
|
17
|
-
const vec2 SIN_TABLE_0_FP64 = vec2(0.19509032368659973, -1.6704714833615242e-9);
|
|
18
|
-
const vec2 SIN_TABLE_1_FP64 = vec2(0.3826834261417389, 6.22335089017767e-9);
|
|
19
|
-
const vec2 SIN_TABLE_2_FP64 = vec2(0.5555702447891235, -1.1769521357507529e-8);
|
|
20
|
-
const vec2 SIN_TABLE_3_FP64 = vec2(0.7071067690849304, 1.2101617041793133e-8);
|
|
21
|
-
|
|
22
|
-
const vec2 COS_TABLE_0_FP64 = vec2(0.9807852506637573, 2.9739473106360492e-8);
|
|
23
|
-
const vec2 COS_TABLE_1_FP64 = vec2(0.9238795042037964, 2.8307490351764386e-8);
|
|
24
|
-
const vec2 COS_TABLE_2_FP64 = vec2(0.8314695954322815, 1.6870263741530778e-8);
|
|
25
|
-
const vec2 COS_TABLE_3_FP64 = vec2(0.7071067690849304, 1.2101617152815436e-8);
|
|
26
|
-
|
|
27
|
-
const vec2 INVERSE_FACTORIAL_3_FP64 = vec2(1.666666716337204e-01, -4.967053879312289e-09); // 1/3!
|
|
28
|
-
const vec2 INVERSE_FACTORIAL_4_FP64 = vec2(4.16666679084301e-02, -1.2417634698280722e-09); // 1/4!
|
|
29
|
-
const vec2 INVERSE_FACTORIAL_5_FP64 = vec2(8.333333767950535e-03, -4.34617203337595e-10); // 1/5!
|
|
30
|
-
const vec2 INVERSE_FACTORIAL_6_FP64 = vec2(1.3888889225199819e-03, -3.3631094437103215e-11); // 1/6!
|
|
31
|
-
const vec2 INVERSE_FACTORIAL_7_FP64 = vec2(1.9841270113829523e-04, -2.725596874933456e-12); // 1/7!
|
|
32
|
-
const vec2 INVERSE_FACTORIAL_8_FP64 = vec2(2.4801587642286904e-05, -3.406996025904184e-13); // 1/8!
|
|
33
|
-
const vec2 INVERSE_FACTORIAL_9_FP64 = vec2(2.75573188446287533e-06, 3.7935713937038186e-14); // 1/9!
|
|
34
|
-
const vec2 INVERSE_FACTORIAL_10_FP64 = vec2(2.755731998149713e-07, -7.575112367869873e-15); // 1/10!
|
|
35
|
-
|
|
36
|
-
float nint(float d) {
|
|
37
|
-
if (d == floor(d)) return d;
|
|
38
|
-
return floor(d + 0.5);
|
|
39
|
-
}
|
|
40
|
-
|
|
41
|
-
vec2 nint_fp64(vec2 a) {
|
|
42
|
-
float hi = nint(a.x);
|
|
43
|
-
float lo;
|
|
44
|
-
vec2 tmp;
|
|
45
|
-
if (hi == a.x) {
|
|
46
|
-
lo = nint(a.y);
|
|
47
|
-
tmp = quickTwoSum(hi, lo);
|
|
48
|
-
} else {
|
|
49
|
-
lo = 0.0;
|
|
50
|
-
if (abs(hi - a.x) == 0.5 && a.y < 0.0) {
|
|
51
|
-
hi -= 1.0;
|
|
52
|
-
}
|
|
53
|
-
tmp = vec2(hi, lo);
|
|
54
|
-
}
|
|
55
|
-
return tmp;
|
|
56
|
-
}
|
|
57
|
-
|
|
58
|
-
/* k_power controls how much range reduction we would like to have
|
|
59
|
-
Range reduction uses the following method:
|
|
60
|
-
assume a = k_power * r + m * log(2), k and m being integers.
|
|
61
|
-
Set k_power = 4 (we can choose other k to trade accuracy with performance.
|
|
62
|
-
we only need to calculate exp(r) and using exp(a) = 2^m * exp(r)^k_power;
|
|
63
|
-
*/
|
|
64
|
-
|
|
65
|
-
vec2 exp_fp64(vec2 a) {
|
|
66
|
-
// We need to make sure these two numbers match
|
|
67
|
-
// as bit-wise shift is not available in GLSL 1.0
|
|
68
|
-
const int k_power = 4;
|
|
69
|
-
const float k = 16.0;
|
|
70
|
-
|
|
71
|
-
const float inv_k = 1.0 / k;
|
|
72
|
-
|
|
73
|
-
if (a.x <= -88.0) return vec2(0.0, 0.0);
|
|
74
|
-
if (a.x >= 88.0) return vec2(1.0 / 0.0, 1.0 / 0.0);
|
|
75
|
-
if (a.x == 0.0 && a.y == 0.0) return vec2(1.0, 0.0);
|
|
76
|
-
if (a.x == 1.0 && a.y == 0.0) return E_FP64;
|
|
77
|
-
|
|
78
|
-
float m = floor(a.x / LOG2_FP64.x + 0.5);
|
|
79
|
-
vec2 r = sub_fp64(a, mul_fp64(LOG2_FP64, vec2(m, 0.0))) * inv_k;
|
|
80
|
-
vec2 s, t, p;
|
|
81
|
-
|
|
82
|
-
p = mul_fp64(r, r);
|
|
83
|
-
s = sum_fp64(r, p * 0.5);
|
|
84
|
-
p = mul_fp64(p, r);
|
|
85
|
-
t = mul_fp64(p, INVERSE_FACTORIAL_3_FP64);
|
|
86
|
-
|
|
87
|
-
s = sum_fp64(s, t);
|
|
88
|
-
p = mul_fp64(p, r);
|
|
89
|
-
t = mul_fp64(p, INVERSE_FACTORIAL_4_FP64);
|
|
90
|
-
|
|
91
|
-
s = sum_fp64(s, t);
|
|
92
|
-
p = mul_fp64(p, r);
|
|
93
|
-
t = mul_fp64(p, INVERSE_FACTORIAL_5_FP64);
|
|
94
|
-
|
|
95
|
-
// s = sum_fp64(s, t);
|
|
96
|
-
// p = mul_fp64(p, r);
|
|
97
|
-
// t = mul_fp64(p, INVERSE_FACTORIAL_6_FP64);
|
|
98
|
-
|
|
99
|
-
// s = sum_fp64(s, t);
|
|
100
|
-
// p = mul_fp64(p, r);
|
|
101
|
-
// t = mul_fp64(p, INVERSE_FACTORIAL_7_FP64);
|
|
102
|
-
|
|
103
|
-
s = sum_fp64(s, t);
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
// At this point, s = exp(r) - 1; but after following 4 recursions, we will get exp(r) ^ 512 - 1.
|
|
107
|
-
for (int i = 0; i < k_power; i++) {
|
|
108
|
-
s = sum_fp64(s * 2.0, mul_fp64(s, s));
|
|
109
|
-
}
|
|
110
|
-
|
|
111
|
-
#if defined(NVIDIA_FP64_WORKAROUND) || defined(INTEL_FP64_WORKAROUND)
|
|
112
|
-
s = sum_fp64(s, vec2(ONE, 0.0));
|
|
113
|
-
#else
|
|
114
|
-
s = sum_fp64(s, vec2(1.0, 0.0));
|
|
115
|
-
#endif
|
|
116
|
-
|
|
117
|
-
return s * pow(2.0, m);
|
|
118
|
-
// return r;
|
|
119
|
-
}
|
|
120
|
-
|
|
121
|
-
vec2 log_fp64(vec2 a)
|
|
122
|
-
{
|
|
123
|
-
if (a.x == 1.0 && a.y == 0.0) return vec2(0.0, 0.0);
|
|
124
|
-
if (a.x <= 0.0) return vec2(0.0 / 0.0, 0.0 / 0.0);
|
|
125
|
-
vec2 x = vec2(log(a.x), 0.0);
|
|
126
|
-
vec2 s;
|
|
127
|
-
#if defined(NVIDIA_FP64_WORKAROUND) || defined(INTEL_FP64_WORKAROUND)
|
|
128
|
-
s = vec2(ONE, 0.0);
|
|
129
|
-
#else
|
|
130
|
-
s = vec2(1.0, 0.0);
|
|
131
|
-
#endif
|
|
132
|
-
|
|
133
|
-
x = sub_fp64(sum_fp64(x, mul_fp64(a, exp_fp64(-x))), s);
|
|
134
|
-
return x;
|
|
135
|
-
}
|
|
136
|
-
|
|
137
|
-
vec2 sin_taylor_fp64(vec2 a) {
|
|
138
|
-
vec2 r, s, t, x;
|
|
139
|
-
|
|
140
|
-
if (a.x == 0.0 && a.y == 0.0) {
|
|
141
|
-
return vec2(0.0, 0.0);
|
|
142
|
-
}
|
|
143
|
-
|
|
144
|
-
x = -mul_fp64(a, a);
|
|
145
|
-
s = a;
|
|
146
|
-
r = a;
|
|
147
|
-
|
|
148
|
-
r = mul_fp64(r, x);
|
|
149
|
-
t = mul_fp64(r, INVERSE_FACTORIAL_3_FP64);
|
|
150
|
-
s = sum_fp64(s, t);
|
|
151
|
-
|
|
152
|
-
r = mul_fp64(r, x);
|
|
153
|
-
t = mul_fp64(r, INVERSE_FACTORIAL_5_FP64);
|
|
154
|
-
s = sum_fp64(s, t);
|
|
155
|
-
|
|
156
|
-
/* keep the following commented code in case we need them
|
|
157
|
-
for extra accuracy from the Taylor expansion*/
|
|
158
|
-
|
|
159
|
-
// r = mul_fp64(r, x);
|
|
160
|
-
// t = mul_fp64(r, INVERSE_FACTORIAL_7_FP64);
|
|
161
|
-
// s = sum_fp64(s, t);
|
|
162
|
-
|
|
163
|
-
// r = mul_fp64(r, x);
|
|
164
|
-
// t = mul_fp64(r, INVERSE_FACTORIAL_9_FP64);
|
|
165
|
-
// s = sum_fp64(s, t);
|
|
166
|
-
|
|
167
|
-
return s;
|
|
168
|
-
}
|
|
169
|
-
|
|
170
|
-
vec2 cos_taylor_fp64(vec2 a) {
|
|
171
|
-
vec2 r, s, t, x;
|
|
172
|
-
|
|
173
|
-
if (a.x == 0.0 && a.y == 0.0) {
|
|
174
|
-
return vec2(1.0, 0.0);
|
|
175
|
-
}
|
|
176
|
-
|
|
177
|
-
x = -mul_fp64(a, a);
|
|
178
|
-
r = x;
|
|
179
|
-
s = sum_fp64(vec2(1.0, 0.0), r * 0.5);
|
|
180
|
-
|
|
181
|
-
r = mul_fp64(r, x);
|
|
182
|
-
t = mul_fp64(r, INVERSE_FACTORIAL_4_FP64);
|
|
183
|
-
s = sum_fp64(s, t);
|
|
184
|
-
|
|
185
|
-
r = mul_fp64(r, x);
|
|
186
|
-
t = mul_fp64(r, INVERSE_FACTORIAL_6_FP64);
|
|
187
|
-
s = sum_fp64(s, t);
|
|
188
|
-
|
|
189
|
-
/* keep the following commented code in case we need them
|
|
190
|
-
for extra accuracy from the Taylor expansion*/
|
|
191
|
-
|
|
192
|
-
// r = mul_fp64(r, x);
|
|
193
|
-
// t = mul_fp64(r, INVERSE_FACTORIAL_8_FP64);
|
|
194
|
-
// s = sum_fp64(s, t);
|
|
195
|
-
|
|
196
|
-
// r = mul_fp64(r, x);
|
|
197
|
-
// t = mul_fp64(r, INVERSE_FACTORIAL_10_FP64);
|
|
198
|
-
// s = sum_fp64(s, t);
|
|
199
|
-
|
|
200
|
-
return s;
|
|
201
|
-
}
|
|
202
|
-
|
|
203
|
-
void sincos_taylor_fp64(vec2 a, out vec2 sin_t, out vec2 cos_t) {
|
|
204
|
-
if (a.x == 0.0 && a.y == 0.0) {
|
|
205
|
-
sin_t = vec2(0.0, 0.0);
|
|
206
|
-
cos_t = vec2(1.0, 0.0);
|
|
207
|
-
}
|
|
208
|
-
|
|
209
|
-
sin_t = sin_taylor_fp64(a);
|
|
210
|
-
cos_t = sqrt_fp64(sub_fp64(vec2(1.0, 0.0), mul_fp64(sin_t, sin_t)));
|
|
211
|
-
}
|
|
212
|
-
|
|
213
|
-
vec2 sin_fp64(vec2 a) {
|
|
214
|
-
if (a.x == 0.0 && a.y == 0.0) {
|
|
215
|
-
return vec2(0.0, 0.0);
|
|
216
|
-
}
|
|
217
|
-
|
|
218
|
-
// 2pi range reduction
|
|
219
|
-
vec2 z = nint_fp64(div_fp64(a, TWO_PI_FP64));
|
|
220
|
-
vec2 r = sub_fp64(a, mul_fp64(TWO_PI_FP64, z));
|
|
221
|
-
|
|
222
|
-
vec2 t;
|
|
223
|
-
float q = floor(r.x / PI_2_FP64.x + 0.5);
|
|
224
|
-
int j = int(q);
|
|
225
|
-
|
|
226
|
-
if (j < -2 || j > 2) {
|
|
227
|
-
return vec2(0.0 / 0.0, 0.0 / 0.0);
|
|
228
|
-
}
|
|
229
|
-
|
|
230
|
-
t = sub_fp64(r, mul_fp64(PI_2_FP64, vec2(q, 0.0)));
|
|
231
|
-
|
|
232
|
-
q = floor(t.x / PI_16_FP64.x + 0.5);
|
|
233
|
-
int k = int(q);
|
|
234
|
-
|
|
235
|
-
if (k == 0) {
|
|
236
|
-
if (j == 0) {
|
|
237
|
-
return sin_taylor_fp64(t);
|
|
238
|
-
} else if (j == 1) {
|
|
239
|
-
return cos_taylor_fp64(t);
|
|
240
|
-
} else if (j == -1) {
|
|
241
|
-
return -cos_taylor_fp64(t);
|
|
242
|
-
} else {
|
|
243
|
-
return -sin_taylor_fp64(t);
|
|
244
|
-
}
|
|
245
|
-
}
|
|
246
|
-
|
|
247
|
-
int abs_k = int(abs(float(k)));
|
|
248
|
-
|
|
249
|
-
if (abs_k > 4) {
|
|
250
|
-
return vec2(0.0 / 0.0, 0.0 / 0.0);
|
|
251
|
-
} else {
|
|
252
|
-
t = sub_fp64(t, mul_fp64(PI_16_FP64, vec2(q, 0.0)));
|
|
253
|
-
}
|
|
254
|
-
|
|
255
|
-
vec2 u = vec2(0.0, 0.0);
|
|
256
|
-
vec2 v = vec2(0.0, 0.0);
|
|
257
|
-
|
|
258
|
-
#if defined(NVIDIA_FP64_WORKAROUND) || defined(INTEL_FP64_WORKAROUND)
|
|
259
|
-
if (abs(float(abs_k) - 1.0) < 0.5) {
|
|
260
|
-
u = COS_TABLE_0_FP64;
|
|
261
|
-
v = SIN_TABLE_0_FP64;
|
|
262
|
-
} else if (abs(float(abs_k) - 2.0) < 0.5) {
|
|
263
|
-
u = COS_TABLE_1_FP64;
|
|
264
|
-
v = SIN_TABLE_1_FP64;
|
|
265
|
-
} else if (abs(float(abs_k) - 3.0) < 0.5) {
|
|
266
|
-
u = COS_TABLE_2_FP64;
|
|
267
|
-
v = SIN_TABLE_2_FP64;
|
|
268
|
-
} else if (abs(float(abs_k) - 4.0) < 0.5) {
|
|
269
|
-
u = COS_TABLE_3_FP64;
|
|
270
|
-
v = SIN_TABLE_3_FP64;
|
|
271
|
-
}
|
|
272
|
-
#else
|
|
273
|
-
if (abs_k == 1) {
|
|
274
|
-
u = COS_TABLE_0_FP64;
|
|
275
|
-
v = SIN_TABLE_0_FP64;
|
|
276
|
-
} else if (abs_k == 2) {
|
|
277
|
-
u = COS_TABLE_1_FP64;
|
|
278
|
-
v = SIN_TABLE_1_FP64;
|
|
279
|
-
} else if (abs_k == 3) {
|
|
280
|
-
u = COS_TABLE_2_FP64;
|
|
281
|
-
v = SIN_TABLE_2_FP64;
|
|
282
|
-
} else if (abs_k == 4) {
|
|
283
|
-
u = COS_TABLE_3_FP64;
|
|
284
|
-
v = SIN_TABLE_3_FP64;
|
|
285
|
-
}
|
|
286
|
-
#endif
|
|
287
|
-
|
|
288
|
-
vec2 sin_t, cos_t;
|
|
289
|
-
sincos_taylor_fp64(t, sin_t, cos_t);
|
|
290
|
-
|
|
291
|
-
|
|
292
|
-
|
|
293
|
-
vec2 result = vec2(0.0, 0.0);
|
|
294
|
-
if (j == 0) {
|
|
295
|
-
if (k > 0) {
|
|
296
|
-
result = sum_fp64(mul_fp64(u, sin_t), mul_fp64(v, cos_t));
|
|
297
|
-
} else {
|
|
298
|
-
result = sub_fp64(mul_fp64(u, sin_t), mul_fp64(v, cos_t));
|
|
299
|
-
}
|
|
300
|
-
} else if (j == 1) {
|
|
301
|
-
if (k > 0) {
|
|
302
|
-
result = sub_fp64(mul_fp64(u, cos_t), mul_fp64(v, sin_t));
|
|
303
|
-
} else {
|
|
304
|
-
result = sum_fp64(mul_fp64(u, cos_t), mul_fp64(v, sin_t));
|
|
305
|
-
}
|
|
306
|
-
} else if (j == -1) {
|
|
307
|
-
if (k > 0) {
|
|
308
|
-
result = sub_fp64(mul_fp64(v, sin_t), mul_fp64(u, cos_t));
|
|
309
|
-
} else {
|
|
310
|
-
result = -sum_fp64(mul_fp64(v, sin_t), mul_fp64(u, cos_t));
|
|
311
|
-
}
|
|
312
|
-
} else {
|
|
313
|
-
if (k > 0) {
|
|
314
|
-
result = -sum_fp64(mul_fp64(u, sin_t), mul_fp64(v, cos_t));
|
|
315
|
-
} else {
|
|
316
|
-
result = sub_fp64(mul_fp64(v, cos_t), mul_fp64(u, sin_t));
|
|
317
|
-
}
|
|
318
|
-
}
|
|
319
|
-
|
|
320
|
-
return result;
|
|
321
|
-
}
|
|
322
|
-
|
|
323
|
-
vec2 cos_fp64(vec2 a) {
|
|
324
|
-
if (a.x == 0.0 && a.y == 0.0) {
|
|
325
|
-
return vec2(1.0, 0.0);
|
|
326
|
-
}
|
|
327
|
-
|
|
328
|
-
// 2pi range reduction
|
|
329
|
-
vec2 z = nint_fp64(div_fp64(a, TWO_PI_FP64));
|
|
330
|
-
vec2 r = sub_fp64(a, mul_fp64(TWO_PI_FP64, z));
|
|
331
|
-
|
|
332
|
-
vec2 t;
|
|
333
|
-
float q = floor(r.x / PI_2_FP64.x + 0.5);
|
|
334
|
-
int j = int(q);
|
|
335
|
-
|
|
336
|
-
if (j < -2 || j > 2) {
|
|
337
|
-
return vec2(0.0 / 0.0, 0.0 / 0.0);
|
|
338
|
-
}
|
|
339
|
-
|
|
340
|
-
t = sub_fp64(r, mul_fp64(PI_2_FP64, vec2(q, 0.0)));
|
|
341
|
-
|
|
342
|
-
q = floor(t.x / PI_16_FP64.x + 0.5);
|
|
343
|
-
int k = int(q);
|
|
344
|
-
|
|
345
|
-
if (k == 0) {
|
|
346
|
-
if (j == 0) {
|
|
347
|
-
return cos_taylor_fp64(t);
|
|
348
|
-
} else if (j == 1) {
|
|
349
|
-
return -sin_taylor_fp64(t);
|
|
350
|
-
} else if (j == -1) {
|
|
351
|
-
return sin_taylor_fp64(t);
|
|
352
|
-
} else {
|
|
353
|
-
return -cos_taylor_fp64(t);
|
|
354
|
-
}
|
|
355
|
-
}
|
|
356
|
-
|
|
357
|
-
int abs_k = int(abs(float(k)));
|
|
358
|
-
|
|
359
|
-
if (abs_k > 4) {
|
|
360
|
-
return vec2(0.0 / 0.0, 0.0 / 0.0);
|
|
361
|
-
} else {
|
|
362
|
-
t = sub_fp64(t, mul_fp64(PI_16_FP64, vec2(q, 0.0)));
|
|
363
|
-
}
|
|
364
|
-
|
|
365
|
-
vec2 u = vec2(0.0, 0.0);
|
|
366
|
-
vec2 v = vec2(0.0, 0.0);
|
|
367
|
-
|
|
368
|
-
#if defined(NVIDIA_FP64_WORKAROUND) || defined(INTEL_FP64_WORKAROUND)
|
|
369
|
-
if (abs(float(abs_k) - 1.0) < 0.5) {
|
|
370
|
-
u = COS_TABLE_0_FP64;
|
|
371
|
-
v = SIN_TABLE_0_FP64;
|
|
372
|
-
} else if (abs(float(abs_k) - 2.0) < 0.5) {
|
|
373
|
-
u = COS_TABLE_1_FP64;
|
|
374
|
-
v = SIN_TABLE_1_FP64;
|
|
375
|
-
} else if (abs(float(abs_k) - 3.0) < 0.5) {
|
|
376
|
-
u = COS_TABLE_2_FP64;
|
|
377
|
-
v = SIN_TABLE_2_FP64;
|
|
378
|
-
} else if (abs(float(abs_k) - 4.0) < 0.5) {
|
|
379
|
-
u = COS_TABLE_3_FP64;
|
|
380
|
-
v = SIN_TABLE_3_FP64;
|
|
381
|
-
}
|
|
382
|
-
#else
|
|
383
|
-
if (abs_k == 1) {
|
|
384
|
-
u = COS_TABLE_0_FP64;
|
|
385
|
-
v = SIN_TABLE_0_FP64;
|
|
386
|
-
} else if (abs_k == 2) {
|
|
387
|
-
u = COS_TABLE_1_FP64;
|
|
388
|
-
v = SIN_TABLE_1_FP64;
|
|
389
|
-
} else if (abs_k == 3) {
|
|
390
|
-
u = COS_TABLE_2_FP64;
|
|
391
|
-
v = SIN_TABLE_2_FP64;
|
|
392
|
-
} else if (abs_k == 4) {
|
|
393
|
-
u = COS_TABLE_3_FP64;
|
|
394
|
-
v = SIN_TABLE_3_FP64;
|
|
395
|
-
}
|
|
396
|
-
#endif
|
|
397
|
-
|
|
398
|
-
vec2 sin_t, cos_t;
|
|
399
|
-
sincos_taylor_fp64(t, sin_t, cos_t);
|
|
400
|
-
|
|
401
|
-
vec2 result = vec2(0.0, 0.0);
|
|
402
|
-
if (j == 0) {
|
|
403
|
-
if (k > 0) {
|
|
404
|
-
result = sub_fp64(mul_fp64(u, cos_t), mul_fp64(v, sin_t));
|
|
405
|
-
} else {
|
|
406
|
-
result = sum_fp64(mul_fp64(u, cos_t), mul_fp64(v, sin_t));
|
|
407
|
-
}
|
|
408
|
-
} else if (j == 1) {
|
|
409
|
-
if (k > 0) {
|
|
410
|
-
result = -sum_fp64(mul_fp64(u, sin_t), mul_fp64(v, cos_t));
|
|
411
|
-
} else {
|
|
412
|
-
result = sub_fp64(mul_fp64(v, cos_t), mul_fp64(u, sin_t));
|
|
413
|
-
}
|
|
414
|
-
} else if (j == -1) {
|
|
415
|
-
if (k > 0) {
|
|
416
|
-
result = sum_fp64(mul_fp64(u, sin_t), mul_fp64(v, cos_t));
|
|
417
|
-
} else {
|
|
418
|
-
result = sub_fp64(mul_fp64(u, sin_t), mul_fp64(v, cos_t));
|
|
419
|
-
}
|
|
420
|
-
} else {
|
|
421
|
-
if (k > 0) {
|
|
422
|
-
result = sub_fp64(mul_fp64(v, sin_t), mul_fp64(u, cos_t));
|
|
423
|
-
} else {
|
|
424
|
-
result = -sum_fp64(mul_fp64(u, cos_t), mul_fp64(v, sin_t));
|
|
425
|
-
}
|
|
426
|
-
}
|
|
427
|
-
|
|
428
|
-
return result;
|
|
429
|
-
}
|
|
430
|
-
|
|
431
|
-
vec2 tan_fp64(vec2 a) {
|
|
432
|
-
vec2 sin_a;
|
|
433
|
-
vec2 cos_a;
|
|
434
|
-
|
|
435
|
-
if (a.x == 0.0 && a.y == 0.0) {
|
|
436
|
-
return vec2(0.0, 0.0);
|
|
437
|
-
}
|
|
438
|
-
|
|
439
|
-
// 2pi range reduction
|
|
440
|
-
vec2 z = nint_fp64(div_fp64(a, TWO_PI_FP64));
|
|
441
|
-
vec2 r = sub_fp64(a, mul_fp64(TWO_PI_FP64, z));
|
|
442
|
-
|
|
443
|
-
vec2 t;
|
|
444
|
-
float q = floor(r.x / PI_2_FP64.x + 0.5);
|
|
445
|
-
int j = int(q);
|
|
446
|
-
|
|
447
|
-
|
|
448
|
-
if (j < -2 || j > 2) {
|
|
449
|
-
return vec2(0.0 / 0.0, 0.0 / 0.0);
|
|
450
|
-
}
|
|
451
|
-
|
|
452
|
-
t = sub_fp64(r, mul_fp64(PI_2_FP64, vec2(q, 0.0)));
|
|
453
|
-
|
|
454
|
-
q = floor(t.x / PI_16_FP64.x + 0.5);
|
|
455
|
-
int k = int(q);
|
|
456
|
-
int abs_k = int(abs(float(k)));
|
|
457
|
-
|
|
458
|
-
// We just can't get PI/16 * 3.0 very accurately.
|
|
459
|
-
// so let's just store it
|
|
460
|
-
if (abs_k > 4) {
|
|
461
|
-
return vec2(0.0 / 0.0, 0.0 / 0.0);
|
|
462
|
-
} else {
|
|
463
|
-
t = sub_fp64(t, mul_fp64(PI_16_FP64, vec2(q, 0.0)));
|
|
464
|
-
}
|
|
465
|
-
|
|
466
|
-
|
|
467
|
-
vec2 u = vec2(0.0, 0.0);
|
|
468
|
-
vec2 v = vec2(0.0, 0.0);
|
|
469
|
-
|
|
470
|
-
vec2 sin_t, cos_t;
|
|
471
|
-
vec2 s, c;
|
|
472
|
-
sincos_taylor_fp64(t, sin_t, cos_t);
|
|
473
|
-
|
|
474
|
-
if (k == 0) {
|
|
475
|
-
s = sin_t;
|
|
476
|
-
c = cos_t;
|
|
477
|
-
} else {
|
|
478
|
-
#if defined(NVIDIA_FP64_WORKAROUND) || defined(INTEL_FP64_WORKAROUND)
|
|
479
|
-
if (abs(float(abs_k) - 1.0) < 0.5) {
|
|
480
|
-
u = COS_TABLE_0_FP64;
|
|
481
|
-
v = SIN_TABLE_0_FP64;
|
|
482
|
-
} else if (abs(float(abs_k) - 2.0) < 0.5) {
|
|
483
|
-
u = COS_TABLE_1_FP64;
|
|
484
|
-
v = SIN_TABLE_1_FP64;
|
|
485
|
-
} else if (abs(float(abs_k) - 3.0) < 0.5) {
|
|
486
|
-
u = COS_TABLE_2_FP64;
|
|
487
|
-
v = SIN_TABLE_2_FP64;
|
|
488
|
-
} else if (abs(float(abs_k) - 4.0) < 0.5) {
|
|
489
|
-
u = COS_TABLE_3_FP64;
|
|
490
|
-
v = SIN_TABLE_3_FP64;
|
|
491
|
-
}
|
|
492
|
-
#else
|
|
493
|
-
if (abs_k == 1) {
|
|
494
|
-
u = COS_TABLE_0_FP64;
|
|
495
|
-
v = SIN_TABLE_0_FP64;
|
|
496
|
-
} else if (abs_k == 2) {
|
|
497
|
-
u = COS_TABLE_1_FP64;
|
|
498
|
-
v = SIN_TABLE_1_FP64;
|
|
499
|
-
} else if (abs_k == 3) {
|
|
500
|
-
u = COS_TABLE_2_FP64;
|
|
501
|
-
v = SIN_TABLE_2_FP64;
|
|
502
|
-
} else if (abs_k == 4) {
|
|
503
|
-
u = COS_TABLE_3_FP64;
|
|
504
|
-
v = SIN_TABLE_3_FP64;
|
|
505
|
-
}
|
|
506
|
-
#endif
|
|
507
|
-
if (k > 0) {
|
|
508
|
-
s = sum_fp64(mul_fp64(u, sin_t), mul_fp64(v, cos_t));
|
|
509
|
-
c = sub_fp64(mul_fp64(u, cos_t), mul_fp64(v, sin_t));
|
|
510
|
-
} else {
|
|
511
|
-
s = sub_fp64(mul_fp64(u, sin_t), mul_fp64(v, cos_t));
|
|
512
|
-
c = sum_fp64(mul_fp64(u, cos_t), mul_fp64(v, sin_t));
|
|
513
|
-
}
|
|
514
|
-
}
|
|
515
|
-
|
|
516
|
-
if (j == 0) {
|
|
517
|
-
sin_a = s;
|
|
518
|
-
cos_a = c;
|
|
519
|
-
} else if (j == 1) {
|
|
520
|
-
sin_a = c;
|
|
521
|
-
cos_a = -s;
|
|
522
|
-
} else if (j == -1) {
|
|
523
|
-
sin_a = -c;
|
|
524
|
-
cos_a = s;
|
|
525
|
-
} else {
|
|
526
|
-
sin_a = -s;
|
|
527
|
-
cos_a = -c;
|
|
528
|
-
}
|
|
529
|
-
return div_fp64(sin_a, cos_a);
|
|
530
|
-
}
|
|
531
|
-
|
|
532
|
-
vec2 radians_fp64(vec2 degree) {
|
|
533
|
-
return mul_fp64(degree, PI_180_FP64);
|
|
534
|
-
}
|
|
535
|
-
|
|
536
|
-
vec2 mix_fp64(vec2 a, vec2 b, float x) {
|
|
537
|
-
vec2 range = sub_fp64(b, a);
|
|
538
|
-
return sum_fp64(a, mul_fp64(range, vec2(x, 0.0)));
|
|
539
|
-
}
|
|
540
|
-
|
|
541
|
-
// Vector functions
|
|
542
|
-
// vec2 functions
|
|
543
|
-
void vec2_sum_fp64(vec2 a[2], vec2 b[2], out vec2 out_val[2]) {
|
|
544
|
-
out_val[0] = sum_fp64(a[0], b[0]);
|
|
545
|
-
out_val[1] = sum_fp64(a[1], b[1]);
|
|
546
|
-
}
|
|
547
|
-
|
|
548
|
-
void vec2_sub_fp64(vec2 a[2], vec2 b[2], out vec2 out_val[2]) {
|
|
549
|
-
out_val[0] = sub_fp64(a[0], b[0]);
|
|
550
|
-
out_val[1] = sub_fp64(a[1], b[1]);
|
|
551
|
-
}
|
|
552
|
-
|
|
553
|
-
void vec2_mul_fp64(vec2 a[2], vec2 b[2], out vec2 out_val[2]) {
|
|
554
|
-
out_val[0] = mul_fp64(a[0], b[0]);
|
|
555
|
-
out_val[1] = mul_fp64(a[1], b[1]);
|
|
556
|
-
}
|
|
557
|
-
|
|
558
|
-
void vec2_div_fp64(vec2 a[2], vec2 b[2], out vec2 out_val[2]) {
|
|
559
|
-
out_val[0] = div_fp64(a[0], b[0]);
|
|
560
|
-
out_val[1] = div_fp64(a[1], b[1]);
|
|
561
|
-
}
|
|
562
|
-
|
|
563
|
-
void vec2_mix_fp64(vec2 x[2], vec2 y[2], float a, out vec2 out_val[2]) {
|
|
564
|
-
vec2 range[2];
|
|
565
|
-
vec2_sub_fp64(y, x, range);
|
|
566
|
-
vec2 portion[2];
|
|
567
|
-
portion[0] = range[0] * a;
|
|
568
|
-
portion[1] = range[1] * a;
|
|
569
|
-
vec2_sum_fp64(x, portion, out_val);
|
|
570
|
-
}
|
|
571
|
-
|
|
572
|
-
vec2 vec2_length_fp64(vec2 x[2]) {
|
|
573
|
-
return sqrt_fp64(sum_fp64(mul_fp64(x[0], x[0]), mul_fp64(x[1], x[1])));
|
|
574
|
-
}
|
|
575
|
-
|
|
576
|
-
void vec2_normalize_fp64(vec2 x[2], out vec2 out_val[2]) {
|
|
577
|
-
vec2 length = vec2_length_fp64(x);
|
|
578
|
-
vec2 length_vec2[2];
|
|
579
|
-
length_vec2[0] = length;
|
|
580
|
-
length_vec2[1] = length;
|
|
581
|
-
|
|
582
|
-
vec2_div_fp64(x, length_vec2, out_val);
|
|
583
|
-
}
|
|
584
|
-
|
|
585
|
-
vec2 vec2_distance_fp64(vec2 x[2], vec2 y[2]) {
|
|
586
|
-
vec2 diff[2];
|
|
587
|
-
vec2_sub_fp64(x, y, diff);
|
|
588
|
-
return vec2_length_fp64(diff);
|
|
589
|
-
}
|
|
590
|
-
|
|
591
|
-
vec2 vec2_dot_fp64(vec2 a[2], vec2 b[2]) {
|
|
592
|
-
vec2 v[2];
|
|
593
|
-
|
|
594
|
-
v[0] = mul_fp64(a[0], b[0]);
|
|
595
|
-
v[1] = mul_fp64(a[1], b[1]);
|
|
596
|
-
|
|
597
|
-
return sum_fp64(v[0], v[1]);
|
|
598
|
-
}
|
|
599
|
-
|
|
600
|
-
// vec3 functions
|
|
601
|
-
void vec3_sub_fp64(vec2 a[3], vec2 b[3], out vec2 out_val[3]) {
|
|
602
|
-
for (int i = 0; i < 3; i++) {
|
|
603
|
-
out_val[i] = sum_fp64(a[i], b[i]);
|
|
604
|
-
}
|
|
605
|
-
}
|
|
606
|
-
|
|
607
|
-
void vec3_sum_fp64(vec2 a[3], vec2 b[3], out vec2 out_val[3]) {
|
|
608
|
-
for (int i = 0; i < 3; i++) {
|
|
609
|
-
out_val[i] = sum_fp64(a[i], b[i]);
|
|
610
|
-
}
|
|
611
|
-
}
|
|
612
|
-
|
|
613
|
-
vec2 vec3_length_fp64(vec2 x[3]) {
|
|
614
|
-
return sqrt_fp64(sum_fp64(sum_fp64(mul_fp64(x[0], x[0]), mul_fp64(x[1], x[1])),
|
|
615
|
-
mul_fp64(x[2], x[2])));
|
|
616
|
-
}
|
|
617
|
-
|
|
618
|
-
vec2 vec3_distance_fp64(vec2 x[3], vec2 y[3]) {
|
|
619
|
-
vec2 diff[3];
|
|
620
|
-
vec3_sub_fp64(x, y, diff);
|
|
621
|
-
return vec3_length_fp64(diff);
|
|
622
|
-
}
|
|
623
|
-
|
|
624
|
-
// vec4 functions
|
|
625
|
-
void vec4_fp64(vec4 a, out vec2 out_val[4]) {
|
|
626
|
-
out_val[0].x = a[0];
|
|
627
|
-
out_val[0].y = 0.0;
|
|
628
|
-
|
|
629
|
-
out_val[1].x = a[1];
|
|
630
|
-
out_val[1].y = 0.0;
|
|
631
|
-
|
|
632
|
-
out_val[2].x = a[2];
|
|
633
|
-
out_val[2].y = 0.0;
|
|
634
|
-
|
|
635
|
-
out_val[3].x = a[3];
|
|
636
|
-
out_val[3].y = 0.0;
|
|
637
|
-
}
|
|
638
|
-
|
|
639
|
-
void vec4_scalar_mul_fp64(vec2 a[4], vec2 b, out vec2 out_val[4]) {
|
|
640
|
-
out_val[0] = mul_fp64(a[0], b);
|
|
641
|
-
out_val[1] = mul_fp64(a[1], b);
|
|
642
|
-
out_val[2] = mul_fp64(a[2], b);
|
|
643
|
-
out_val[3] = mul_fp64(a[3], b);
|
|
644
|
-
}
|
|
645
|
-
|
|
646
|
-
void vec4_sum_fp64(vec2 a[4], vec2 b[4], out vec2 out_val[4]) {
|
|
647
|
-
for (int i = 0; i < 4; i++) {
|
|
648
|
-
out_val[i] = sum_fp64(a[i], b[i]);
|
|
649
|
-
}
|
|
650
|
-
}
|
|
651
|
-
|
|
652
|
-
void vec4_dot_fp64(vec2 a[4], vec2 b[4], out vec2 out_val) {
|
|
653
|
-
vec2 v[4];
|
|
654
|
-
|
|
655
|
-
v[0] = mul_fp64(a[0], b[0]);
|
|
656
|
-
v[1] = mul_fp64(a[1], b[1]);
|
|
657
|
-
v[2] = mul_fp64(a[2], b[2]);
|
|
658
|
-
v[3] = mul_fp64(a[3], b[3]);
|
|
659
|
-
|
|
660
|
-
out_val = sum_fp64(sum_fp64(v[0], v[1]), sum_fp64(v[2], v[3]));
|
|
661
|
-
}
|
|
662
|
-
|
|
663
|
-
void mat4_vec4_mul_fp64(vec2 b[16], vec2 a[4], out vec2 out_val[4]) {
|
|
664
|
-
vec2 tmp[4];
|
|
665
|
-
|
|
666
|
-
for (int i = 0; i < 4; i++)
|
|
667
|
-
{
|
|
668
|
-
for (int j = 0; j < 4; j++)
|
|
669
|
-
{
|
|
670
|
-
tmp[j] = b[j + i * 4];
|
|
671
|
-
}
|
|
672
|
-
vec4_dot_fp64(a, tmp, out_val[i]);
|
|
673
|
-
}
|
|
674
|
-
}
|
|
675
|
-
`;
|
|
@@ -1,44 +0,0 @@
|
|
|
1
|
-
// luma.gl
|
|
2
|
-
// SPDX-License-Identifier: MIT
|
|
3
|
-
// Copyright (c) vis.gl contributors
|
|
4
|
-
|
|
5
|
-
import {fp64ify, fp64LowPart, fp64ifyMatrix4} from '../../../modules/math/fp64/fp64-utils';
|
|
6
|
-
|
|
7
|
-
import {fp64arithmeticShader} from './fp64-arithmetic-glsl';
|
|
8
|
-
import {fp64functionShader} from './fp64-functions-glsl';
|
|
9
|
-
|
|
10
|
-
const CONST_UNIFORMS = {
|
|
11
|
-
// Used in LUMA_FP64_CODE_ELIMINATION_WORKAROUND
|
|
12
|
-
ONE: 1.0
|
|
13
|
-
};
|
|
14
|
-
export {fp64ify, fp64LowPart, fp64ifyMatrix4};
|
|
15
|
-
|
|
16
|
-
function getUniforms() {
|
|
17
|
-
return CONST_UNIFORMS;
|
|
18
|
-
}
|
|
19
|
-
|
|
20
|
-
/**
|
|
21
|
-
* 64bit arithmetic: add, sub, mul, div (small subset of fp64 module)
|
|
22
|
-
*/
|
|
23
|
-
export const fp64arithmetic = {
|
|
24
|
-
name: 'fp64-arithmetic',
|
|
25
|
-
vs: fp64arithmeticShader,
|
|
26
|
-
getUniforms,
|
|
27
|
-
fp64ify,
|
|
28
|
-
fp64LowPart,
|
|
29
|
-
fp64ifyMatrix4
|
|
30
|
-
};
|
|
31
|
-
|
|
32
|
-
/**
|
|
33
|
-
* Full 64 bit math library
|
|
34
|
-
*/
|
|
35
|
-
export const fp64 = {
|
|
36
|
-
name: 'fp64',
|
|
37
|
-
vs: fp64functionShader,
|
|
38
|
-
dependencies: [fp64arithmetic],
|
|
39
|
-
|
|
40
|
-
// Additional Functions
|
|
41
|
-
fp64ify,
|
|
42
|
-
fp64LowPart,
|
|
43
|
-
fp64ifyMatrix4
|
|
44
|
-
};
|