From: Chris Duncan Date: Tue, 14 Jan 2025 20:10:48 +0000 (-0800) Subject: Remove unnecessary v[10-11] scalars. X-Git-Url: https://zoso.dev/?a=commitdiff_plain;h=344d1ad843e03aab9b00f3b683918f35b964e74c;p=nano-pow.git Remove unnecessary v[10-11] scalars. --- diff --git a/src/shaders/compute.wgsl b/src/shaders/compute.wgsl index 540dc4d..d870fd0 100644 --- a/src/shaders/compute.wgsl +++ b/src/shaders/compute.wgsl @@ -231,8 +231,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -269,8 +269,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; @@ -279,8 +279,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -318,8 +318,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -532,8 +532,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { */ // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -566,16 +566,16 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; v11 = v_1011.y; // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -609,8 +609,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -1013,8 +1013,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -1051,8 +1051,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; @@ -1061,8 +1061,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -1096,8 +1096,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -1306,8 +1306,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { */ // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -1346,16 +1346,16 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; v11 = v_1011.y; // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -1389,8 +1389,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -1805,8 +1805,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -1839,8 +1839,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; @@ -1849,8 +1849,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -1888,8 +1888,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -2102,8 +2102,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { */ // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -2136,16 +2136,16 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; v11 = v_1011.y; // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -2179,8 +2179,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -2595,8 +2595,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -2633,8 +2633,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; @@ -2643,8 +2643,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -2682,8 +2682,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -2892,8 +2892,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { */ // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -2932,16 +2932,16 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; v11 = v_1011.y; // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -2975,8 +2975,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -3393,8 +3393,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -3427,8 +3427,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; @@ -3437,8 +3437,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -3472,8 +3472,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -3690,8 +3690,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { */ // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -3724,16 +3724,16 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; v11 = v_1011.y; // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -3773,8 +3773,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -4187,8 +4187,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -4221,8 +4221,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; @@ -4231,8 +4231,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -4266,8 +4266,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -4484,8 +4484,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { */ // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -4524,16 +4524,16 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; v11 = v_1011.y; // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -4567,8 +4567,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -4975,8 +4975,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -5013,8 +5013,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; @@ -5023,8 +5023,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -5058,8 +5058,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -5272,8 +5272,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { */ // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -5312,16 +5312,16 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; v11 = v_1011.y; // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -5355,8 +5355,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -5767,8 +5767,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -5801,8 +5801,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; @@ -5811,8 +5811,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -5846,8 +5846,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -6064,8 +6064,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { */ // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -6098,16 +6098,16 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; v11 = v_1011.y; // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -6147,8 +6147,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -6559,8 +6559,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -6593,8 +6593,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; @@ -6603,8 +6603,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -6638,8 +6638,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -6856,8 +6856,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { */ // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -6890,16 +6890,16 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; v11 = v_1011.y; // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -6939,8 +6939,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -7357,8 +7357,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -7391,8 +7391,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; @@ -7401,8 +7401,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -7440,8 +7440,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -7661,8 +7661,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { */ // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -7695,16 +7695,16 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; v11 = v_1011.y; // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -7738,8 +7738,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -8162,8 +8162,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -8200,8 +8200,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; @@ -8210,8 +8210,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -8249,8 +8249,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -8463,8 +8463,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { */ // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -8497,16 +8497,16 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; v11 = v_1011.y; // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -8540,8 +8540,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -8944,8 +8944,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -8982,8 +8982,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; @@ -8992,8 +8992,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // a = a + b v_23.x = v2; v_23.y = v3; - v_1011.x = v10; - v_1011.y = v11; + + v_23 = v_23 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_23.x + v_1011.x < v_23.x); v2 = v_23.x; v3 = v_23.y; @@ -9027,8 +9027,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_1819.x = v18; v_1819.y = v19; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_1819; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x; @@ -9237,8 +9237,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { */ // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -9277,16 +9277,16 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 24) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x >> 24u) | (xor.y << 8u), (xor.y >> 24u) | (xor.x << 8u)); v10 = v_1011.x; v11 = v_1011.y; // a = a + b - v_1011.x = v10; - v_1011.y = v11; + + v_01 = v_01 + v_1011 + select(vec2(0u), vec2(0u, 1u), v_01.x + v_1011.x < v_01.x); v1 = v_01.y; @@ -9320,8 +9320,8 @@ fn main(@builtin(global_invocation_id) id: vec3) { // b = rotr64(b ^ c, 63) v_2021.x = v20; v_2021.y = v21; - v_1011.x = v10; - v_1011.y = v11; + + xor = v_1011 ^ v_2021; v_1011 = vec2((xor.x << 1u) | (xor.y >> 31u), (xor.y << 1u) | (xor.x >> 31u)); v10 = v_1011.x;