From 013f71e0640d10e3e691730201f2daa36f49693e Mon Sep 17 00:00:00 2001 From: truelossless Date: Wed, 27 Jul 2022 14:20:22 +0100 Subject: [PATCH] improve windows builds - add required nvcuda.dll for those who don't have it - lower CUDA (therefore nvidia driver) requirements - untrack PTX I am aware of an issue with ANSI escape sequences showing in windows terminals. This seems related to https://github.com/yaahc/color-eyre/issues/80 and the owo_colors crate. Not sure how to fix that. Maybe switching to anyhow and using crossterm instead of owo_colors would work, but we would lose the colorful error reports. --- .github/workflows/ci.yml | 16 +- .gitignore | 1 + resources/module.ptx | 24649 ------------------------------------- 3 files changed, 12 insertions(+), 24654 deletions(-) delete mode 100644 resources/module.ptx diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 95fb496..61d8107 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -11,7 +11,7 @@ jobs: run: docker build -t rust-cuda . - name: Start Docker - run: docker run -t -d -v $PWD:/root/rust-cuda --name builder rust-cuda + run: docker run -t -d -v $PWD:/root/rust-cuda --name builder rust-cuda - name: Build executable run: docker exec -w /root/rust-cuda/cli builder cargo build --release @@ -37,7 +37,7 @@ jobs: - name: Install CUDA uses: Jimver/cuda-toolkit@v0.2.8 with: - cuda: '11.7.0' + cuda: "11.2.2" - name: Build executable run: | @@ -53,11 +53,17 @@ jobs: cd ../cli cargo test --release --no-fail-fast + - name: Zip with DLL + run: | + cd cli/target/release/ + cp C:\\Windows\\System32\\nvcuda.dll . 
+ 7z a cugparck-cli.zip nvcuda.dll cugparck-cli.exe + - name: Upload artifact uses: actions/upload-artifact@v3 with: name: cug-windows - path: cli/target/release/cugparck-cli.exe + path: cli/target/release/cugparck-cli.zip upload: needs: [build_windows, build_linux] @@ -105,6 +111,6 @@ jobs: GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} with: upload_url: ${{ steps.create_release.outputs.upload_url }} - asset_path: cugparck-cli.exe - asset_name: cug-windows-${{ steps.commit.outputs.hash }}.exe + asset_path: cugparck-cli.zip + asset_name: cug-windows-${{ steps.commit.outputs.hash }}.zip asset_content_type: application/zip diff --git a/.gitignore b/.gitignore index f0b7f6b..9816695 100644 --- a/.gitignore +++ b/.gitignore @@ -1,6 +1,7 @@ .vscode/ .devcontainer/ +resources/module.ptx # Generated by Cargo # will have compiled files and executables diff --git a/resources/module.ptx b/resources/module.ptx deleted file mode 100644 index 8b35d30..0000000 --- a/resources/module.ptx +++ /dev/null @@ -1,24649 +0,0 @@ -// -// Generated by NVIDIA NVVM Compiler -// -// Compiler Build ID: CL-30521435 -// Cuda compilation tools, release 11.4, V11.4.152 -// Based on NVVM 7.0.1 -// - -.version 7.4 -.target sm_61 -.address_size 64 - - // .globl chains_kernel -.func _ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E -( - .param .b64 _ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E_param_0, - .param .b32 _ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E_param_1, - .param .align 16 .b8 _ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E_param_2[16] -) -; -.func _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE -( - .param .b64 _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE_param_0, - .param .b64 _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE_param_1, - .param .b64 _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE_param_2 -) -; -.func _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E -() -.noreturn ; -.func 
_ZN4core5slice5index26slice_start_index_len_fail17h31c4387487c2b57aE -() -.noreturn ; -.func _ZN4core6result13unwrap_failed17h995d1a0127e5a880E -() -.noreturn ; -.global .align 1 .b8 private$6[84] = {47, 114, 111, 111, 116, 47, 46, 99, 97, 114, 103, 111, 47, 114, 101, 103, 105, 115, 116, 114, 121, 47, 115, 114, 99, 47, 103, 105, 116, 104, 117, 98, 46, 99, 111, 109, 45, 49, 101, 99, 99, 54, 50, 57, 57, 100, 98, 57, 101, 99, 56, 50, 51, 47, 98, 108, 111, 99, 107, 45, 98, 117, 102, 102, 101, 114, 45, 48, 46, 49, 48, 46, 50, 47, 115, 114, 99, 47, 108, 105, 98, 46, 114, 115}; -.global .align 8 .u8 private$8[24] = {0XFF(generic(private$6)), 0xFF00(generic(private$6)), 0xFF0000(generic(private$6)), 0xFF000000(generic(private$6)), 0xFF00000000(generic(private$6)), 0xFF0000000000(generic(private$6)), 0xFF000000000000(generic(private$6)), 0xFF00000000000000(generic(private$6)), 84, 0, 0, 0, 0, 0, 0, 0, 132, 0, 0, 0, 37, 0, 0, 0}; -.global .align 8 .u8 private$l[24] = {0XFF(generic(private$6)), 0xFF00(generic(private$6)), 0xFF0000(generic(private$6)), 0xFF000000(generic(private$6)), 0xFF00000000(generic(private$6)), 0xFF0000000000(generic(private$6)), 0xFF000000000000(generic(private$6)), 0xFF00000000000000(generic(private$6)), 84, 0, 0, 0, 0, 0, 0, 0, 31, 1, 0, 0, 30, 0, 0, 0}; -.global .align 8 .u8 private$j[24] = {0XFF(generic(private$6)), 0xFF00(generic(private$6)), 0xFF0000(generic(private$6)), 0xFF000000(generic(private$6)), 0xFF00000000(generic(private$6)), 0xFF0000000000(generic(private$6)), 0xFF000000000000(generic(private$6)), 0xFF00000000000000(generic(private$6)), 84, 0, 0, 0, 0, 0, 0, 0, 28, 1, 0, 0, 24, 0, 0, 0}; -.global .align 1 .b8 private$P[75] = {47, 114, 111, 111, 116, 47, 46, 99, 97, 114, 103, 111, 47, 114, 101, 103, 105, 115, 116, 114, 121, 47, 115, 114, 99, 47, 103, 105, 116, 104, 117, 98, 46, 99, 111, 109, 45, 49, 101, 99, 99, 54, 50, 57, 57, 100, 98, 57, 101, 99, 56, 50, 51, 47, 109, 100, 52, 45, 48, 46, 49, 48, 46, 49, 47, 115, 114, 99, 47, 108, 105, 
98, 46, 114, 115}; -.global .align 8 .u8 private$Q[24] = {0XFF(generic(private$P)), 0xFF00(generic(private$P)), 0xFF0000(generic(private$P)), 0xFF000000(generic(private$P)), 0xFF00000000(generic(private$P)), 0xFF0000000000(generic(private$P)), 0xFF000000000000(generic(private$P)), 0xFF00000000000000(generic(private$P)), 75, 0, 0, 0, 0, 0, 0, 0, 91, 0, 0, 0, 19, 0, 0, 0}; -.global .align 1 .b8 private$R[76] = {47, 114, 111, 111, 116, 47, 46, 99, 97, 114, 103, 111, 47, 114, 101, 103, 105, 115, 116, 114, 121, 47, 115, 114, 99, 47, 103, 105, 116, 104, 117, 98, 46, 99, 111, 109, 45, 49, 101, 99, 99, 54, 50, 57, 57, 100, 98, 57, 101, 99, 56, 50, 51, 47, 109, 100, 45, 53, 45, 48, 46, 49, 48, 46, 49, 47, 115, 114, 99, 47, 108, 105, 98, 46, 114, 115}; -.global .align 8 .u8 private$S[24] = {0XFF(generic(private$R)), 0xFF00(generic(private$R)), 0xFF0000(generic(private$R)), 0xFF000000(generic(private$R)), 0xFF00000000(generic(private$R)), 0xFF0000000000(generic(private$R)), 0xFF000000000000(generic(private$R)), 0xFF00000000000000(generic(private$R)), 76, 0, 0, 0, 0, 0, 0, 0, 94, 0, 0, 0, 19, 0, 0, 0}; -.global .align 1 .b8 private$T[77] = {47, 114, 111, 111, 116, 47, 46, 99, 97, 114, 103, 111, 47, 114, 101, 103, 105, 115, 116, 114, 121, 47, 115, 114, 99, 47, 103, 105, 116, 104, 117, 98, 46, 99, 111, 109, 45, 49, 101, 99, 99, 54, 50, 57, 57, 100, 98, 57, 101, 99, 56, 50, 51, 47, 115, 104, 97, 45, 49, 45, 48, 46, 49, 48, 46, 48, 47, 115, 114, 99, 47, 108, 105, 98, 46, 114, 115}; -.global .align 8 .u8 private$U[24] = {0XFF(generic(private$T)), 0xFF00(generic(private$T)), 0xFF0000(generic(private$T)), 0xFF000000(generic(private$T)), 0xFF00000000(generic(private$T)), 0xFF0000000000(generic(private$T)), 0xFF000000000000(generic(private$T)), 0xFF00000000000000(generic(private$T)), 77, 0, 0, 0, 0, 0, 0, 0, 105, 0, 0, 0, 19, 0, 0, 0}; -.global .align 1 .b8 private$14[81] = {47, 114, 111, 111, 116, 47, 46, 99, 97, 114, 103, 111, 47, 114, 101, 103, 105, 115, 116, 114, 121, 47, 115, 114, 
99, 47, 103, 105, 116, 104, 117, 98, 46, 99, 111, 109, 45, 49, 101, 99, 99, 54, 50, 57, 57, 100, 98, 57, 101, 99, 56, 50, 51, 47, 115, 104, 97, 50, 45, 48, 46, 49, 48, 46, 50, 47, 115, 114, 99, 47, 99, 111, 114, 101, 95, 97, 112, 105, 46, 114, 115}; -.global .align 8 .u8 private$15[24] = {0XFF(generic(private$14)), 0xFF00(generic(private$14)), 0xFF0000(generic(private$14)), 0xFF000000(generic(private$14)), 0xFF00000000(generic(private$14)), 0xFF0000000000(generic(private$14)), 0xFF000000000000(generic(private$14)), 0xFF00000000000000(generic(private$14)), 81, 0, 0, 0, 0, 0, 0, 0, 66, 0, 0, 0, 19, 0, 0, 0}; -.global .align 1 .b8 private$0[95] = {47, 114, 111, 111, 116, 47, 46, 99, 97, 114, 103, 111, 47, 114, 101, 103, 105, 115, 116, 114, 121, 47, 115, 114, 99, 47, 103, 105, 116, 104, 117, 98, 46, 99, 111, 109, 45, 49, 101, 99, 99, 54, 50, 57, 57, 100, 98, 57, 101, 99, 56, 50, 51, 47, 100, 105, 103, 101, 115, 116, 45, 48, 46, 49, 48, 46, 51, 47, 115, 114, 99, 47, 99, 111, 114, 101, 95, 97, 112, 105, 47, 99, 116, 95, 118, 97, 114, 105, 97, 98, 108, 101, 46, 114, 115}; -.global .align 8 .u8 private$5[24] = {0XFF(generic(private$0)), 0xFF00(generic(private$0)), 0xFF0000(generic(private$0)), 0xFF000000(generic(private$0)), 0xFF00000000(generic(private$0)), 0xFF0000000000(generic(private$0)), 0xFF000000000000(generic(private$0)), 0xFF00000000000000(generic(private$0)), 95, 0, 0, 0, 0, 0, 0, 0, 117, 0, 0, 0, 36, 0, 0, 0}; -.global .align 1 .b8 private$L[78] = {47, 114, 111, 111, 116, 47, 46, 99, 97, 114, 103, 111, 47, 114, 101, 103, 105, 115, 116, 114, 121, 47, 115, 114, 99, 47, 103, 105, 116, 104, 117, 98, 46, 99, 111, 109, 45, 49, 101, 99, 99, 54, 50, 57, 57, 100, 98, 57, 101, 99, 56, 50, 51, 47, 115, 104, 97, 51, 45, 48, 46, 49, 48, 46, 49, 47, 115, 114, 99, 47, 115, 116, 97, 116, 101, 46, 114, 115}; -.global .align 8 .u8 private$O[24] = {0XFF(generic(private$L)), 0xFF00(generic(private$L)), 0xFF0000(generic(private$L)), 0xFF000000(generic(private$L)), 
0xFF00000000(generic(private$L)), 0xFF0000000000(generic(private$L)), 0xFF000000000000(generic(private$L)), 0xFF00000000000000(generic(private$L)), 78, 0, 0, 0, 0, 0, 0, 0, 25, 0, 0, 0, 15, 0, 0, 0}; -.global .align 1 .b8 private$029[83] = {47, 114, 111, 111, 116, 47, 46, 99, 97, 114, 103, 111, 47, 114, 101, 103, 105, 115, 116, 114, 121, 47, 115, 114, 99, 47, 103, 105, 116, 104, 117, 98, 46, 99, 111, 109, 45, 49, 101, 99, 99, 54, 50, 57, 57, 100, 98, 57, 101, 99, 56, 50, 51, 47, 116, 105, 110, 121, 118, 101, 99, 45, 49, 46, 54, 46, 48, 47, 115, 114, 99, 47, 97, 114, 114, 97, 121, 118, 101, 99, 46, 114, 115}; -.global .align 8 .u8 private$1[24] = {0XFF(generic(private$029)), 0xFF00(generic(private$029)), 0xFF0000(generic(private$029)), 0xFF000000(generic(private$029)), 0xFF00000000(generic(private$029)), 0xFF0000000000(generic(private$029)), 0xFF000000000000(generic(private$029)), 0xFF00000000000000(generic(private$029)), 83, 0, 0, 0, 0, 0, 0, 0, 37, 5, 0, 0, 26, 0, 0, 0}; -.global .align 8 .b8 private$9214[192] = {1, 0, 0, 0, 0, 0, 0, 0, 130, 128, 0, 0, 0, 0, 0, 0, 138, 128, 0, 0, 0, 0, 0, 128, 0, 128, 0, 128, 0, 0, 0, 128, 139, 128, 0, 0, 0, 0, 0, 0, 1, 0, 0, 128, 0, 0, 0, 0, 129, 128, 0, 128, 0, 0, 0, 128, 9, 128, 0, 0, 0, 0, 0, 128, 138, 0, 0, 0, 0, 0, 0, 0, 136, 0, 0, 0, 0, 0, 0, 0, 9, 128, 0, 128, 0, 0, 0, 0, 10, 0, 0, 128, 0, 0, 0, 0, 139, 128, 0, 128, 0, 0, 0, 0, 139, 0, 0, 0, 0, 0, 0, 128, 137, 128, 0, 0, 0, 0, 0, 128, 3, 128, 0, 0, 0, 0, 0, 128, 2, 128, 0, 0, 0, 0, 0, 128, 128, 0, 0, 0, 0, 0, 0, 128, 10, 128, 0, 0, 0, 0, 0, 0, 10, 0, 0, 128, 0, 0, 0, 128, 129, 128, 0, 128, 0, 0, 0, 128, 128, 128, 0, 0, 0, 0, 0, 128, 1, 0, 0, 128, 0, 0, 0, 0, 8, 128, 0, 128, 0, 0, 0, 128}; -.global .align 8 .b8 private$i465[32] = {0, 0, 0, 0, 0, 0, 0, 0, 4, 0, 0, 0, 0, 0, 0, 0, 8, 0, 0, 0, 0, 0, 0, 0, 12, 0, 0, 0, 0, 0, 0, 0}; -.global .align 8 .b8 private$r469[32] = {0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 3, 0, 0, 0, 0, 0, 0, 0}; - 
-.visible .entry chains_kernel( - .param .u64 chains_kernel_param_0, - .param .u64 chains_kernel_param_1, - .param .u64 chains_kernel_param_2, - .param .u64 chains_kernel_param_3, - .param .align 8 .b8 chains_kernel_param_4[272] -) -{ - .local .align 16 .b8 __local_depot0[368]; - .reg .b64 %SP; - .reg .b64 %SPL; - .reg .pred %p<83>; - .reg .b16 %rs<208>; - .reg .b32 %r<125>; - .reg .b64 %rd<359>; - - - mov.u64 %SPL, __local_depot0; - cvta.local.u64 %SP, %SPL; - ld.param.u64 %rd57, [chains_kernel_param_0]; - ld.param.u64 %rd143, [chains_kernel_param_1]; - ld.param.u64 %rd144, [chains_kernel_param_2]; - ld.param.u64 %rd145, [chains_kernel_param_3]; - mov.u64 %rd146, chains_kernel_param_4; - add.u64 %rd147, %SP, 0; - add.u64 %rd1, %SPL, 0; - add.u64 %rd2, %SPL, 88; - ld.param.v4.u16 {%rs21, %rs22, %rs23, %rs24}, [%rd146]; - st.local.v4.u16 [%rd2], {%rs21, %rs22, %rs23, %rs24}; - ld.param.v4.u16 {%rs11, %rs26, %rs27, %rs28}, [%rd146+8]; - st.local.v4.u16 [%rd2+8], {%rs11, %rs26, %rs27, %rs28}; - ld.param.u64 %rd149, [%rd146+16]; - add.s64 %rd4, %rd2, 16; - st.local.u64 [%rd2+16], %rd149; - ld.param.u64 %rd150, [%rd146+24]; - st.local.u64 [%rd2+24], %rd150; - ld.param.u64 %rd151, [%rd146+32]; - st.local.u64 [%rd2+32], %rd151; - ld.param.u64 %rd152, [%rd146+40]; - st.local.u64 [%rd2+40], %rd152; - ld.param.u64 %rd153, [%rd146+48]; - st.local.u64 [%rd2+48], %rd153; - ld.param.u64 %rd154, [%rd146+56]; - st.local.u64 [%rd2+56], %rd154; - ld.param.u64 %rd155, [%rd146+64]; - st.local.u64 [%rd2+64], %rd155; - ld.param.u64 %rd156, [%rd146+72]; - st.local.u64 [%rd2+72], %rd156; - ld.param.u64 %rd157, [%rd146+80]; - st.local.u64 [%rd2+80], %rd157; - ld.param.u64 %rd158, [%rd146+88]; - st.local.u64 [%rd2+88], %rd158; - ld.param.u64 %rd159, [%rd146+96]; - st.local.u64 [%rd2+96], %rd159; - ld.param.u16 %rs6, [%rd146+104]; - st.local.u16 [%rd2+104], %rs6; - ld.param.v2.u8 {%rs32, %rs33}, [%rd146+106]; - add.s64 %rd5, %rd2, 106; - st.local.v2.u8 [%rd2+106], {%rs32, %rs33}; - 
ld.param.u32 %r22, [%rd146+108]; - st.local.u32 [%rd2+108], %r22; - ld.param.v4.u16 {%rs36, %rs37, %rs38, %rs39}, [%rd146+112]; - st.local.v4.u16 [%rd2+112], {%rs36, %rs37, %rs38, %rs39}; - ld.param.v4.u16 {%rs44, %rs45, %rs46, %rs47}, [%rd146+120]; - st.local.v4.u16 [%rd2+120], {%rs44, %rs45, %rs46, %rs47}; - ld.param.v4.u16 {%rs52, %rs53, %rs54, %rs55}, [%rd146+128]; - st.local.v4.u16 [%rd2+128], {%rs52, %rs53, %rs54, %rs55}; - ld.param.v4.u16 {%rs60, %rs61, %rs62, %rs63}, [%rd146+136]; - st.local.v4.u16 [%rd2+136], {%rs60, %rs61, %rs62, %rs63}; - ld.param.u64 %rd160, [%rd146+144]; - st.local.u64 [%rd2+144], %rd160; - ld.param.v4.u16 {%rs68, %rs69, %rs70, %rs71}, [%rd146+152]; - st.local.v4.u16 [%rd2+152], {%rs68, %rs69, %rs70, %rs71}; - ld.param.v4.u16 {%rs76, %rs77, %rs78, %rs79}, [%rd146+160]; - st.local.v4.u16 [%rd2+160], {%rs76, %rs77, %rs78, %rs79}; - ld.param.v4.u16 {%rs84, %rs85, %rs86, %rs87}, [%rd146+168]; - st.local.v4.u16 [%rd2+168], {%rs84, %rs85, %rs86, %rs87}; - ld.param.v4.u16 {%rs92, %rs93, %rs94, %rs95}, [%rd146+176]; - st.local.v4.u16 [%rd2+176], {%rs92, %rs93, %rs94, %rs95}; - ld.param.v4.u16 {%rs100, %rs101, %rs102, %rs103}, [%rd146+184]; - st.local.v4.u16 [%rd2+184], {%rs100, %rs101, %rs102, %rs103}; - ld.param.v4.u16 {%rs108, %rs109, %rs110, %rs111}, [%rd146+192]; - st.local.v4.u16 [%rd2+192], {%rs108, %rs109, %rs110, %rs111}; - ld.param.v4.u16 {%rs116, %rs117, %rs118, %rs119}, [%rd146+200]; - st.local.v4.u16 [%rd2+200], {%rs116, %rs117, %rs118, %rs119}; - ld.param.u64 %rd161, [%rd146+208]; - st.local.u64 [%rd2+208], %rd161; - ld.param.v4.u16 {%rs124, %rs125, %rs126, %rs127}, [%rd146+216]; - st.local.v4.u16 [%rd2+216], {%rs124, %rs125, %rs126, %rs127}; - ld.param.v4.u16 {%rs132, %rs133, %rs134, %rs135}, [%rd146+224]; - st.local.v4.u16 [%rd2+224], {%rs132, %rs133, %rs134, %rs135}; - ld.param.v4.u16 {%rs140, %rs141, %rs142, %rs143}, [%rd146+232]; - st.local.v4.u16 [%rd2+232], {%rs140, %rs141, %rs142, %rs143}; - ld.param.u64 %rd162, 
[%rd146+240]; - st.local.u64 [%rd2+240], %rd162; - ld.param.v4.u16 {%rs148, %rs149, %rs150, %rs151}, [%rd146+248]; - st.local.v4.u16 [%rd2+248], {%rs148, %rs149, %rs150, %rs151}; - ld.param.u64 %rd163, [%rd146+256]; - st.local.u64 [%rd2+256], %rd163; - ld.param.u64 %rd164, [%rd146+264]; - st.local.u64 [%rd2+264], %rd164; - mov.u32 %r23, %ntid.x; - mov.u32 %r24, %ctaid.x; - mov.u32 %r25, %tid.x; - mad.lo.s32 %r26, %r23, %r24, %r25; - cvt.u64.u32 %rd6, %r26; - setp.ge.u64 %p5, %rd6, %rd145; - @%p5 bra $L__BB0_139; - - cvta.to.global.u64 %rd165, %rd144; - shl.b64 %rd166, %rd6, 4; - add.s64 %rd167, %rd165, %rd166; - add.s64 %rd7, %rd167, 8; - ld.global.u64 %rd8, [%rd167+8]; - mov.u32 %r120, 0; - st.local.u32 [%rd1+8], %r120; - mov.b64 %rd168, {%r120, %r120}; - st.local.u64 [%rd1], %rd168; - setp.gt.u16 %p6, %rs11, 11; - @%p6 bra $L__BB0_149; - - add.u64 %rd170, %SP, 16; - add.u64 %rd9, %SPL, 16; - cvt.u64.u16 %rd10, %rs11; - cvt.u32.u16 %r28, %rs11; - mul.wide.u32 %rd171, %r28, 8; - add.s64 %rd172, %rd2, %rd171; - add.s64 %rd312, %rd172, 16; - mov.u64 %rd314, 0; - mov.pred %p7, -1; - mov.pred %p9, 0; - -$L__BB0_3: - setp.eq.s64 %p8, %rd4, %rd312; - mov.pred %p81, %p7; - @%p8 bra $L__BB0_5; - - add.s64 %rd15, %rd312, -8; - ld.local.u64 %rd174, [%rd312+-8]; - setp.lt.u64 %p10, %rd8, %rd174; - selp.u64 %rd175, 1, 0, %p10; - add.s64 %rd314, %rd314, %rd175; - mov.u64 %rd312, %rd15; - mov.pred %p81, %p9; - @%p10 bra $L__BB0_3; - -$L__BB0_5: - @%p81 bra $L__BB0_148; - - not.b64 %rd176, %rd314; - add.s64 %rd18, %rd10, %rd176; - setp.lt.u64 %p2, %rd18, %rd10; - @%p2 bra $L__BB0_8; - bra.uni $L__BB0_7; - -$L__BB0_8: - shl.b64 %rd179, %rd18, 3; - add.s64 %rd180, %rd2, %rd179; - ld.local.u64 %rd181, [%rd180+16]; - mov.u64 %rd344, 0; - sub.s64 %rd20, %rd8, %rd181; - setp.eq.s64 %p11, %rd18, 0; - mov.u64 %rd345, %rd344; - mov.u32 %r121, %r120; - mov.u32 %r122, %r120; - @%p11 bra $L__BB0_55; - - cvt.u64.u16 %rd21, %rs6; - setp.eq.s16 %p12, %rs6, 0; - @%p12 bra $L__BB0_53; - - 
setp.gt.u16 %p13, %rs6, 128; - @%p13 bra $L__BB0_52; - - and.b64 %rd182, %rd20, -4294967296; - setp.eq.s64 %p14, %rd182, 0; - @%p14 bra $L__BB0_13; - - div.u64 %rd315, %rd20, %rd21; - bra.uni $L__BB0_14; - -$L__BB0_13: - cvt.u32.u64 %r32, %rd21; - cvt.u32.u64 %r33, %rd20; - div.u32 %r34, %r33, %r32; - cvt.u64.u32 %rd315, %r34; - -$L__BB0_14: - mul.lo.s64 %rd183, %rd315, %rd21; - sub.s64 %rd184, %rd20, %rd183; - add.s64 %rd185, %rd2, %rd184; - ld.local.u8 %rs157, [%rd185+106]; - add.s64 %rd25, %rd1, 2; - st.local.u8 [%rd1+2], %rs157; - setp.lt.u64 %p15, %rd18, 2; - mov.u16 %rs203, 1; - @%p15 bra $L__BB0_54; - - and.b64 %rd188, %rd315, -4294967296; - setp.eq.s64 %p16, %rd188, 0; - @%p16 bra $L__BB0_17; - - div.u64 %rd316, %rd315, %rd21; - bra.uni $L__BB0_18; - -$L__BB0_17: - cvt.u32.u64 %r35, %rd21; - cvt.u32.u64 %r36, %rd315; - div.u32 %r37, %r36, %r35; - cvt.u64.u32 %rd316, %r37; - -$L__BB0_18: - mul.lo.s64 %rd189, %rd316, %rd21; - sub.s64 %rd190, %rd315, %rd189; - add.s64 %rd191, %rd2, %rd190; - ld.local.u8 %rs159, [%rd191+106]; - st.local.u8 [%rd25+1], %rs159; - setp.eq.s64 %p17, %rd18, 2; - mov.u16 %rs203, 2; - @%p17 bra $L__BB0_54; - - and.b64 %rd192, %rd316, -4294967296; - setp.eq.s64 %p18, %rd192, 0; - @%p18 bra $L__BB0_21; - - div.u64 %rd317, %rd316, %rd21; - bra.uni $L__BB0_22; - -$L__BB0_21: - cvt.u32.u64 %r38, %rd21; - cvt.u32.u64 %r39, %rd316; - div.u32 %r40, %r39, %r38; - cvt.u64.u32 %rd317, %r40; - -$L__BB0_22: - mul.lo.s64 %rd193, %rd317, %rd21; - sub.s64 %rd194, %rd316, %rd193; - add.s64 %rd195, %rd2, %rd194; - ld.local.u8 %rs161, [%rd195+106]; - or.b64 %rd197, %rd147, 4; - cvta.to.local.u64 %rd198, %rd197; - st.local.u8 [%rd198], %rs161; - setp.lt.u64 %p19, %rd18, 4; - mov.u16 %rs203, 3; - @%p19 bra $L__BB0_54; - - and.b64 %rd199, %rd317, -4294967296; - setp.eq.s64 %p20, %rd199, 0; - @%p20 bra $L__BB0_25; - - div.u64 %rd318, %rd317, %rd21; - bra.uni $L__BB0_26; - -$L__BB0_25: - cvt.u32.u64 %r41, %rd21; - cvt.u32.u64 %r42, %rd317; - div.u32 %r43, 
%r42, %r41; - cvt.u64.u32 %rd318, %r43; - -$L__BB0_26: - mul.lo.s64 %rd200, %rd318, %rd21; - sub.s64 %rd201, %rd317, %rd200; - add.s64 %rd202, %rd2, %rd201; - ld.local.u8 %rs163, [%rd202+106]; - st.local.u8 [%rd25+3], %rs163; - setp.eq.s64 %p21, %rd18, 4; - mov.u16 %rs203, 4; - @%p21 bra $L__BB0_54; - - and.b64 %rd203, %rd318, -4294967296; - setp.eq.s64 %p22, %rd203, 0; - @%p22 bra $L__BB0_29; - - div.u64 %rd319, %rd318, %rd21; - bra.uni $L__BB0_30; - -$L__BB0_29: - cvt.u32.u64 %r44, %rd21; - cvt.u32.u64 %r45, %rd318; - div.u32 %r46, %r45, %r44; - cvt.u64.u32 %rd319, %r46; - -$L__BB0_30: - mul.lo.s64 %rd204, %rd319, %rd21; - sub.s64 %rd205, %rd318, %rd204; - add.s64 %rd206, %rd2, %rd205; - ld.local.u8 %rs165, [%rd206+106]; - st.local.u8 [%rd25+4], %rs165; - setp.lt.u64 %p23, %rd18, 6; - mov.u16 %rs203, 5; - @%p23 bra $L__BB0_54; - - and.b64 %rd207, %rd319, -4294967296; - setp.eq.s64 %p24, %rd207, 0; - @%p24 bra $L__BB0_33; - - div.u64 %rd320, %rd319, %rd21; - bra.uni $L__BB0_34; - -$L__BB0_33: - cvt.u32.u64 %r47, %rd21; - cvt.u32.u64 %r48, %rd319; - div.u32 %r49, %r48, %r47; - cvt.u64.u32 %rd320, %r49; - -$L__BB0_34: - mul.lo.s64 %rd208, %rd320, %rd21; - sub.s64 %rd209, %rd319, %rd208; - add.s64 %rd210, %rd2, %rd209; - ld.local.u8 %rs167, [%rd210+106]; - st.local.u8 [%rd25+5], %rs167; - setp.eq.s64 %p25, %rd18, 6; - mov.u16 %rs203, 6; - @%p25 bra $L__BB0_54; - - and.b64 %rd211, %rd320, -4294967296; - setp.eq.s64 %p26, %rd211, 0; - @%p26 bra $L__BB0_37; - - div.u64 %rd321, %rd320, %rd21; - bra.uni $L__BB0_38; - -$L__BB0_37: - cvt.u32.u64 %r50, %rd21; - cvt.u32.u64 %r51, %rd320; - div.u32 %r52, %r51, %r50; - cvt.u64.u32 %rd321, %r52; - -$L__BB0_38: - mul.lo.s64 %rd212, %rd321, %rd21; - sub.s64 %rd213, %rd320, %rd212; - add.s64 %rd214, %rd2, %rd213; - ld.local.u8 %rs169, [%rd214+106]; - or.b64 %rd216, %rd147, 8; - cvta.to.local.u64 %rd217, %rd216; - st.local.u8 [%rd217], %rs169; - setp.lt.u64 %p27, %rd18, 8; - mov.u16 %rs203, 7; - @%p27 bra $L__BB0_54; - - and.b64 
%rd218, %rd321, -4294967296; - setp.eq.s64 %p28, %rd218, 0; - @%p28 bra $L__BB0_41; - - div.u64 %rd322, %rd321, %rd21; - bra.uni $L__BB0_42; - -$L__BB0_41: - cvt.u32.u64 %r53, %rd21; - cvt.u32.u64 %r54, %rd321; - div.u32 %r55, %r54, %r53; - cvt.u64.u32 %rd322, %r55; - -$L__BB0_42: - mul.lo.s64 %rd219, %rd322, %rd21; - sub.s64 %rd220, %rd321, %rd219; - add.s64 %rd221, %rd2, %rd220; - ld.local.u8 %rs171, [%rd221+106]; - st.local.u8 [%rd25+7], %rs171; - setp.eq.s64 %p29, %rd18, 8; - mov.u16 %rs203, 8; - @%p29 bra $L__BB0_54; - - and.b64 %rd222, %rd322, -4294967296; - setp.eq.s64 %p30, %rd222, 0; - @%p30 bra $L__BB0_45; - - div.u64 %rd323, %rd322, %rd21; - bra.uni $L__BB0_46; - -$L__BB0_45: - cvt.u32.u64 %r56, %rd21; - cvt.u32.u64 %r57, %rd322; - div.u32 %r58, %r57, %r56; - cvt.u64.u32 %rd323, %r58; - -$L__BB0_46: - mul.lo.s64 %rd223, %rd323, %rd21; - sub.s64 %rd224, %rd322, %rd223; - add.s64 %rd225, %rd2, %rd224; - ld.local.u8 %rs173, [%rd225+106]; - st.local.u8 [%rd25+8], %rs173; - setp.lt.u64 %p31, %rd18, 10; - mov.u16 %rs203, 9; - @%p31 bra $L__BB0_54; - - and.b64 %rd226, %rd323, -4294967296; - setp.eq.s64 %p32, %rd226, 0; - @%p32 bra $L__BB0_49; - - rem.u64 %rd324, %rd323, %rd21; - bra.uni $L__BB0_50; - -$L__BB0_49: - cvt.u32.u64 %r59, %rd21; - cvt.u32.u64 %r60, %rd323; - rem.u32 %r61, %r60, %r59; - cvt.u64.u32 %rd324, %r61; - -$L__BB0_50: - add.s64 %rd227, %rd2, %rd324; - ld.local.u8 %rs175, [%rd227+106]; - st.local.u8 [%rd25+9], %rs175; - setp.eq.s64 %p33, %rd18, 10; - mov.u16 %rs203, 10; - @%p33 bra $L__BB0_54; - bra.uni $L__BB0_51; - -$L__BB0_54: - st.local.u16 [%rd1], %rs203; - ld.local.v4.u32 {%r120, %r121, %r122, %r65}, [%rd1]; - mov.b64 %rd345, {%r122, %r65}; - mov.b64 %rd344, {%r120, %r121}; - -$L__BB0_55: - setp.ge.u64 %p34, %rd57, %rd143; - @%p34 bra $L__BB0_118; - - mov.u32 %r73, 0; - mov.pred %p40, -1; - mov.pred %p42, 0; - bra.uni $L__BB0_57; - -$L__BB0_142: - ld.local.u8 %rs21, [%rd2]; - -$L__BB0_57: - cvt.u32.u16 %r67, %rs21; - { // callseq 1, 0 - 
.reg .b32 temp_param_reg; - .param .b64 param0; - st.param.b64 [param0+0], %rd170; - .param .b32 param1; - st.param.b32 [param1+0], %r67; - .param .align 16 .b8 param2[16]; - st.param.v2.b32 [param2+0], {%r120, %r121}; - st.param.b32 [param2+8], %r122; - call.uni - _ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E, - ( - param0, - param1, - param2 - ); - } // callseq 1 - ld.local.u16 %rs10, [%rd9]; - setp.gt.u16 %p35, %rs10, 64; - @%p35 bra $L__BB0_147; - - setp.lt.u16 %p36, %rs10, 8; - @%p36 bra $L__BB0_146; - - ld.local.u64 %rd59, [%rd2+264]; - setp.eq.s64 %p37, %rd59, 0; - @%p37 bra $L__BB0_145; - - ld.local.u8 %rd231, [%rd2+248]; - mul.lo.s64 %rd232, %rd57, %rd231; - ld.local.u16 %rs176, [%rd9+8]; - ld.local.u16 %rs177, [%rd9+6]; - mov.b32 %r68, {%rs177, %rs176}; - ld.local.u16 %rs178, [%rd9+4]; - ld.local.u16 %rs179, [%rd9+2]; - mov.b32 %r69, {%rs179, %rs178}; - mov.b64 %rd233, {%r69, %r68}; - add.s64 %rd60, %rd232, %rd233; - or.b64 %rd234, %rd60, %rd59; - and.b64 %rd235, %rd234, -4294967296; - setp.eq.s64 %p38, %rd235, 0; - @%p38 bra $L__BB0_62; - - rem.u64 %rd328, %rd60, %rd59; - bra.uni $L__BB0_63; - -$L__BB0_62: - cvt.u32.u64 %r70, %rd59; - cvt.u32.u64 %r71, %rd60; - rem.u32 %r72, %r71, %r70; - cvt.u64.u32 %rd328, %r72; - -$L__BB0_63: - st.local.u32 [%rd1+8], %r73; - mov.b64 %rd236, {%r73, %r73}; - st.local.u64 [%rd1], %rd236; - ld.local.u16 %rs11, [%rd2+8]; - setp.gt.u16 %p39, %rs11, 11; - @%p39 bra $L__BB0_144; - - cvt.u64.u16 %rd64, %rs11; - cvt.u32.u16 %r74, %rs11; - mul.wide.u32 %rd238, %r74, 8; - add.s64 %rd239, %rd2, %rd238; - add.s64 %rd329, %rd239, 16; - mov.u64 %rd331, 0; - -$L__BB0_65: - setp.eq.s64 %p41, %rd4, %rd329; - mov.pred %p82, %p40; - @%p41 bra $L__BB0_67; - - add.s64 %rd68, %rd329, -8; - ld.local.u64 %rd240, [%rd329+-8]; - setp.lt.u64 %p43, %rd328, %rd240; - selp.u64 %rd241, 1, 0, %p43; - add.s64 %rd331, %rd331, %rd241; - mov.u64 %rd329, %rd68; - mov.pred %p82, %p42; - @%p43 bra $L__BB0_65; - -$L__BB0_67: - @%p82 bra $L__BB0_143; 
- - not.b64 %rd242, %rd331; - add.s64 %rd71, %rd64, %rd242; - setp.lt.u64 %p4, %rd71, %rd64; - @%p4 bra $L__BB0_70; - bra.uni $L__BB0_69; - -$L__BB0_70: - shl.b64 %rd245, %rd71, 3; - add.s64 %rd246, %rd2, %rd245; - ld.local.u64 %rd247, [%rd246+16]; - mov.u64 %rd344, 0; - sub.s64 %rd73, %rd328, %rd247; - setp.eq.s64 %p44, %rd71, 0; - mov.u64 %rd345, %rd344; - mov.u32 %r120, %r73; - mov.u32 %r121, %r73; - mov.u32 %r122, %r73; - @%p44 bra $L__BB0_117; - - ld.local.u16 %rs12, [%rd2+104]; - cvt.u64.u16 %rd74, %rs12; - setp.eq.s16 %p45, %rs12, 0; - @%p45 bra $L__BB0_115; - - setp.gt.u16 %p46, %rs12, 128; - @%p46 bra $L__BB0_114; - - and.b64 %rd248, %rd73, -4294967296; - setp.eq.s64 %p47, %rd248, 0; - @%p47 bra $L__BB0_75; - - div.u64 %rd332, %rd73, %rd74; - bra.uni $L__BB0_76; - -$L__BB0_75: - cvt.u32.u64 %r78, %rd74; - cvt.u32.u64 %r79, %rd73; - div.u32 %r80, %r79, %r78; - cvt.u64.u32 %rd332, %r80; - -$L__BB0_76: - mul.lo.s64 %rd249, %rd332, %rd74; - sub.s64 %rd250, %rd73, %rd249; - add.s64 %rd251, %rd2, %rd250; - ld.local.u8 %rs181, [%rd251+106]; - add.s64 %rd78, %rd1, 2; - st.local.u8 [%rd1+2], %rs181; - setp.lt.u64 %p48, %rd71, 2; - mov.u16 %rs205, 1; - @%p48 bra $L__BB0_116; - - and.b64 %rd254, %rd332, -4294967296; - setp.eq.s64 %p49, %rd254, 0; - @%p49 bra $L__BB0_79; - - div.u64 %rd333, %rd332, %rd74; - bra.uni $L__BB0_80; - -$L__BB0_79: - cvt.u32.u64 %r81, %rd74; - cvt.u32.u64 %r82, %rd332; - div.u32 %r83, %r82, %r81; - cvt.u64.u32 %rd333, %r83; - -$L__BB0_80: - mul.lo.s64 %rd255, %rd333, %rd74; - sub.s64 %rd256, %rd332, %rd255; - add.s64 %rd257, %rd2, %rd256; - ld.local.u8 %rs183, [%rd257+106]; - st.local.u8 [%rd78+1], %rs183; - setp.eq.s64 %p50, %rd71, 2; - mov.u16 %rs205, 2; - @%p50 bra $L__BB0_116; - - and.b64 %rd258, %rd333, -4294967296; - setp.eq.s64 %p51, %rd258, 0; - @%p51 bra $L__BB0_83; - - div.u64 %rd334, %rd333, %rd74; - bra.uni $L__BB0_84; - -$L__BB0_83: - cvt.u32.u64 %r84, %rd74; - cvt.u32.u64 %r85, %rd333; - div.u32 %r86, %r85, %r84; - cvt.u64.u32 
%rd334, %r86; - -$L__BB0_84: - mul.lo.s64 %rd259, %rd334, %rd74; - sub.s64 %rd260, %rd333, %rd259; - add.s64 %rd261, %rd2, %rd260; - ld.local.u8 %rs185, [%rd261+106]; - or.b64 %rd263, %rd147, 4; - cvta.to.local.u64 %rd264, %rd263; - st.local.u8 [%rd264], %rs185; - setp.lt.u64 %p52, %rd71, 4; - mov.u16 %rs205, 3; - @%p52 bra $L__BB0_116; - - and.b64 %rd265, %rd334, -4294967296; - setp.eq.s64 %p53, %rd265, 0; - @%p53 bra $L__BB0_87; - - div.u64 %rd335, %rd334, %rd74; - bra.uni $L__BB0_88; - -$L__BB0_87: - cvt.u32.u64 %r87, %rd74; - cvt.u32.u64 %r88, %rd334; - div.u32 %r89, %r88, %r87; - cvt.u64.u32 %rd335, %r89; - -$L__BB0_88: - mul.lo.s64 %rd266, %rd335, %rd74; - sub.s64 %rd267, %rd334, %rd266; - add.s64 %rd268, %rd2, %rd267; - ld.local.u8 %rs187, [%rd268+106]; - st.local.u8 [%rd78+3], %rs187; - setp.eq.s64 %p54, %rd71, 4; - mov.u16 %rs205, 4; - @%p54 bra $L__BB0_116; - - and.b64 %rd269, %rd335, -4294967296; - setp.eq.s64 %p55, %rd269, 0; - @%p55 bra $L__BB0_91; - - div.u64 %rd336, %rd335, %rd74; - bra.uni $L__BB0_92; - -$L__BB0_91: - cvt.u32.u64 %r90, %rd74; - cvt.u32.u64 %r91, %rd335; - div.u32 %r92, %r91, %r90; - cvt.u64.u32 %rd336, %r92; - -$L__BB0_92: - mul.lo.s64 %rd270, %rd336, %rd74; - sub.s64 %rd271, %rd335, %rd270; - add.s64 %rd272, %rd2, %rd271; - ld.local.u8 %rs189, [%rd272+106]; - st.local.u8 [%rd78+4], %rs189; - setp.lt.u64 %p56, %rd71, 6; - mov.u16 %rs205, 5; - @%p56 bra $L__BB0_116; - - and.b64 %rd273, %rd336, -4294967296; - setp.eq.s64 %p57, %rd273, 0; - @%p57 bra $L__BB0_95; - - div.u64 %rd337, %rd336, %rd74; - bra.uni $L__BB0_96; - -$L__BB0_95: - cvt.u32.u64 %r93, %rd74; - cvt.u32.u64 %r94, %rd336; - div.u32 %r95, %r94, %r93; - cvt.u64.u32 %rd337, %r95; - -$L__BB0_96: - mul.lo.s64 %rd274, %rd337, %rd74; - sub.s64 %rd275, %rd336, %rd274; - add.s64 %rd276, %rd2, %rd275; - ld.local.u8 %rs191, [%rd276+106]; - st.local.u8 [%rd78+5], %rs191; - setp.eq.s64 %p58, %rd71, 6; - mov.u16 %rs205, 6; - @%p58 bra $L__BB0_116; - - and.b64 %rd277, %rd337, 
-4294967296; - setp.eq.s64 %p59, %rd277, 0; - @%p59 bra $L__BB0_99; - - div.u64 %rd338, %rd337, %rd74; - bra.uni $L__BB0_100; - -$L__BB0_99: - cvt.u32.u64 %r96, %rd74; - cvt.u32.u64 %r97, %rd337; - div.u32 %r98, %r97, %r96; - cvt.u64.u32 %rd338, %r98; - -$L__BB0_100: - mul.lo.s64 %rd278, %rd338, %rd74; - sub.s64 %rd279, %rd337, %rd278; - add.s64 %rd280, %rd2, %rd279; - ld.local.u8 %rs193, [%rd280+106]; - or.b64 %rd282, %rd147, 8; - cvta.to.local.u64 %rd283, %rd282; - st.local.u8 [%rd283], %rs193; - setp.lt.u64 %p60, %rd71, 8; - mov.u16 %rs205, 7; - @%p60 bra $L__BB0_116; - - and.b64 %rd284, %rd338, -4294967296; - setp.eq.s64 %p61, %rd284, 0; - @%p61 bra $L__BB0_103; - - div.u64 %rd339, %rd338, %rd74; - bra.uni $L__BB0_104; - -$L__BB0_103: - cvt.u32.u64 %r99, %rd74; - cvt.u32.u64 %r100, %rd338; - div.u32 %r101, %r100, %r99; - cvt.u64.u32 %rd339, %r101; - -$L__BB0_104: - mul.lo.s64 %rd285, %rd339, %rd74; - sub.s64 %rd286, %rd338, %rd285; - add.s64 %rd287, %rd2, %rd286; - ld.local.u8 %rs195, [%rd287+106]; - st.local.u8 [%rd78+7], %rs195; - setp.eq.s64 %p62, %rd71, 8; - mov.u16 %rs205, 8; - @%p62 bra $L__BB0_116; - - and.b64 %rd288, %rd339, -4294967296; - setp.eq.s64 %p63, %rd288, 0; - @%p63 bra $L__BB0_107; - - div.u64 %rd340, %rd339, %rd74; - bra.uni $L__BB0_108; - -$L__BB0_107: - cvt.u32.u64 %r102, %rd74; - cvt.u32.u64 %r103, %rd339; - div.u32 %r104, %r103, %r102; - cvt.u64.u32 %rd340, %r104; - -$L__BB0_108: - mul.lo.s64 %rd289, %rd340, %rd74; - sub.s64 %rd290, %rd339, %rd289; - add.s64 %rd291, %rd2, %rd290; - ld.local.u8 %rs197, [%rd291+106]; - st.local.u8 [%rd78+8], %rs197; - setp.lt.u64 %p64, %rd71, 10; - mov.u16 %rs205, 9; - @%p64 bra $L__BB0_116; - - and.b64 %rd292, %rd340, -4294967296; - setp.eq.s64 %p65, %rd292, 0; - @%p65 bra $L__BB0_111; - - rem.u64 %rd341, %rd340, %rd74; - bra.uni $L__BB0_112; - -$L__BB0_111: - cvt.u32.u64 %r105, %rd74; - cvt.u32.u64 %r106, %rd340; - rem.u32 %r107, %r106, %r105; - cvt.u64.u32 %rd341, %r107; - -$L__BB0_112: - add.s64 
%rd293, %rd2, %rd341; - ld.local.u8 %rs199, [%rd293+106]; - st.local.u8 [%rd78+9], %rs199; - setp.eq.s64 %p66, %rd71, 10; - mov.u16 %rs205, 10; - @%p66 bra $L__BB0_116; - bra.uni $L__BB0_113; - -$L__BB0_116: - st.local.u16 [%rd1], %rs205; - ld.local.v4.u32 {%r120, %r121, %r122, %r111}, [%rd1]; - mov.b64 %rd345, {%r122, %r111}; - mov.b64 %rd344, {%r120, %r121}; - -$L__BB0_117: - add.s64 %rd57, %rd57, 1; - setp.lt.u64 %p67, %rd57, %rd143; - @%p67 bra $L__BB0_142; - -$L__BB0_118: - st.local.u32 [%rd9+8], %rd345; - st.local.u64 [%rd9], %rd344; - mov.b32 {%rs15, %rs200}, %r120; - cvt.u64.u16 %rd112, %rs15; - setp.gt.u16 %p68, %rs11, 11; - @%p68 bra $L__BB0_141; - - setp.gt.u16 %p69, %rs11, %rs15; - @%p69 bra $L__BB0_121; - bra.uni $L__BB0_120; - -$L__BB0_121: - shl.b64 %rd299, %rd112, 3; - add.s64 %rd300, %rd2, %rd299; - ld.local.u64 %rd349, [%rd300+16]; - setp.gt.u16 %p70, %rs15, 10; - @%p70 bra $L__BB0_140; - - add.s64 %rd301, %rd9, %rd112; - add.s64 %rd114, %rd301, 2; - setp.eq.s16 %p71, %rs15, 0; - @%p71 bra $L__BB0_138; - - ld.local.u16 %rs16, [%rd2+104]; - cvt.u64.u16 %rd115, %rs16; - setp.gt.u16 %p72, %rs16, 128; - @%p72 bra $L__BB0_137; - - setp.eq.s16 %p73, %rs16, 0; - @%p73 bra $L__BB0_129; - - add.s64 %rd347, %rd9, 2; - add.s64 %rd303, %rd2, %rd115; - add.s64 %rd117, %rd303, 106; - shr.u64 %rd304, %rd344, 16; - mov.u64 %rd302, 0; - cvt.u16.u64 %rs207, %rd304; - mov.u64 %rd346, %rd302; - mov.u64 %rd348, %rd347; - bra.uni $L__BB0_126; - -$L__BB0_136: - ld.local.u8 %rs207, [%rd348]; - mov.u64 %rd346, %rd124; - -$L__BB0_126: - add.s64 %rd347, %rd347, 1; - add.s64 %rd348, %rd348, 1; - add.s64 %rd124, %rd346, 1; - mov.u64 %rd350, %rd5; - mov.u64 %rd351, %rd5; - mov.u64 %rd352, %rd302; - -$L__BB0_127: - ld.local.u8 %rs201, [%rd351]; - and.b16 %rs202, %rs207, 255; - setp.eq.s16 %p74, %rs201, %rs202; - @%p74 bra $L__BB0_130; - - add.s64 %rd350, %rd350, 1; - add.s64 %rd351, %rd351, 1; - add.s64 %rd352, %rd352, 1; - setp.eq.s64 %p75, %rd350, %rd117; - @%p75 bra 
$L__BB0_129; - bra.uni $L__BB0_127; - -$L__BB0_130: - cvt.u32.u64 %r124, %rd346; - mov.u64 %rd355, 1; - setp.eq.s32 %p76, %r124, 0; - @%p76 bra $L__BB0_135; - - setp.eq.s32 %p77, %r124, 1; - mov.u64 %rd356, %rd115; - @%p77 bra $L__BB0_134; - - mov.u64 %rd355, 1; - mov.u64 %rd356, %rd115; - -$L__BB0_133: - and.b32 %r113, %r124, 1; - setp.eq.b32 %p78, %r113, 1; - selp.b64 %rd309, %rd356, 1, %p78; - mul.lo.s64 %rd355, %rd309, %rd355; - shr.u32 %r21, %r124, 1; - mul.lo.s64 %rd356, %rd356, %rd356; - setp.gt.u32 %p79, %r124, 3; - mov.u32 %r124, %r21; - @%p79 bra $L__BB0_133; - -$L__BB0_134: - mul.lo.s64 %rd355, %rd356, %rd355; - -$L__BB0_135: - and.b64 %rd310, %rd352, 255; - mul.lo.s64 %rd311, %rd355, %rd310; - add.s64 %rd349, %rd311, %rd349; - setp.eq.s64 %p80, %rd347, %rd114; - @%p80 bra $L__BB0_138; - bra.uni $L__BB0_136; - -$L__BB0_138: - st.global.u64 [%rd7], %rd349; - -$L__BB0_139: - ret; - -$L__BB0_129: - trap; - -$L__BB0_147: - { // callseq 8, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 8 - -$L__BB0_146: - { // callseq 7, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 7 - -$L__BB0_145: - trap; - -$L__BB0_144: - { // callseq 6, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 6 - -$L__BB0_143: - trap; - -$L__BB0_69: - trap; - -$L__BB0_115: - trap; - -$L__BB0_114: - { // callseq 2, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 2 - -$L__BB0_149: - { // callseq 9, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 9 - -$L__BB0_148: - trap; - -$L__BB0_7: - trap; - -$L__BB0_113: - trap; - -$L__BB0_141: - { // callseq 5, 0 - .reg .b32 
temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 5 - -$L__BB0_120: - trap; - -$L__BB0_140: - { // callseq 4, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 4 - -$L__BB0_53: - trap; - -$L__BB0_52: - { // callseq 0, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 0 - -$L__BB0_137: - { // callseq 3, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 3 - -$L__BB0_51: - trap; - -} -.func _ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E( - .param .b64 _ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E_param_0, - .param .b32 _ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E_param_1, - .param .align 16 .b8 _ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E_param_2[16] -) -{ - .local .align 16 .b8 __local_depot1[592]; - .reg .b64 %SP; - .reg .b64 %SPL; - .reg .pred %p<403>; - .reg .b16 %rs<4357>; - .reg .b32 %r<9183>; - .reg .b64 %rd<4282>; - - - mov.u64 %SPL, __local_depot1; - cvta.local.u64 %SP, %SPL; - ld.param.v2.u32 {%r303, %r304}, [_ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E_param_2]; - ld.param.u32 %r302, [_ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E_param_2+8]; - ld.param.u64 %rd967, [_ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E_param_0]; - ld.param.u8 %rs1381, [_ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E_param_1]; - cvta.to.local.u64 %rd12, %rd967; - add.u64 %rd968, %SP, 0; - add.u64 %rd1, %SPL, 0; - add.u64 %rd978, %SP, 576; - add.u64 %rd979, %SPL, 576; - st.local.u32 [%rd979+8], %r302; - ld.param.u64 %rd980, [_ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E_param_2]; - st.local.u64 [%rd979], %rd980; - mov.b32 {%rs1, %rs1382}, %r303; - cvt.u64.u16 %rd11, %rs1; - 
shr.u64 %rd981, %rd980, 16; - cvt.u16.u64 %rs2, %rd981; - and.b16 %rs1380, %rs1381, 15; - setp.gt.s16 %p1, %rs1380, 5; - @%p1 bra $L__BB1_17; - - setp.gt.s16 %p9, %rs1380, 2; - @%p9 bra $L__BB1_9; - bra.uni $L__BB1_2; - -$L__BB1_9: - setp.eq.s16 %p10, %rs1380, 3; - @%p10 bra $L__BB1_250; - - setp.eq.s16 %p11, %rs1380, 4; - @%p11 bra $L__BB1_228; - - setp.eq.s16 %p12, %rs1380, 5; - @%p12 bra $L__BB1_12; - bra.uni $L__BB1_470; - -$L__BB1_12: - setp.gt.u16 %p142, %rs1, 10; - add.u64 %rd2190, %SP, 352; - add.u64 %rd680, %SPL, 352; - mov.u16 %rs2623, 0; - st.local.v4.u16 [%rd680], {%rs2623, %rs2623, %rs2623, %rs2623}; - add.s64 %rd2191, %rd2190, 8; - cvta.to.local.u64 %rd681, %rd2191; - st.local.v4.u16 [%rd681], {%rs2623, %rs2623, %rs2623, %rs2623}; - add.s64 %rd2192, %rd2190, 16; - cvta.to.local.u64 %rd682, %rd2192; - st.local.v4.u16 [%rd682], {%rs2623, %rs2623, %rs2623, %rs2623}; - add.s64 %rd2193, %rd2190, 24; - cvta.to.local.u64 %rd683, %rd2193; - st.local.v4.u16 [%rd683], {%rs2623, %rs2623, %rs2623, %rs2623}; - add.s64 %rd2194, %rd2190, 32; - cvta.to.local.u64 %rd684, %rd2194; - st.local.v4.u16 [%rd684], {%rs2623, %rs2623, %rs2623, %rs2623}; - add.s64 %rd2195, %rd2190, 40; - cvta.to.local.u64 %rd685, %rd2195; - st.local.v4.u16 [%rd685], {%rs2623, %rs2623, %rs2623, %rs2623}; - add.s64 %rd2196, %rd2190, 48; - cvta.to.local.u64 %rd686, %rd2196; - st.local.v4.u16 [%rd686], {%rs2623, %rs2623, %rs2623, %rs2623}; - add.s64 %rd2197, %rd2190, 56; - cvta.to.local.u64 %rd687, %rd2197; - st.local.v4.u16 [%rd687], {%rs2623, %rs2623, %rs2623, %rs2623}; - add.s64 %rd688, %rd2190, 64; - cvta.to.local.u64 %rd689, %rd688; - st.local.u8 [%rd689], %rs2623; - @%p142 bra $L__BB1_227; - - cvta.to.local.u64 %rd690, %rd978; - shr.u64 %rd691, %rd11, 1; - setp.eq.s64 %p143, %rd691, 0; - @%p143 bra $L__BB1_211; - - mov.u64 %rd4218, 1; - mov.u64 %rd4216, %rd690; - mov.u64 %rd4217, %rd680; - bra.uni $L__BB1_15; - -$L__BB1_16: - ld.local.u16 %rs2, [%rd4216+4]; - add.s64 %rd4218, %rd4218, 1; - 
add.s64 %rd4217, %rd4217, 2; - add.s64 %rd4216, %rd4216, 2; - -$L__BB1_15: - st.local.u16 [%rd4217], %rs2; - setp.ge.u64 %p144, %rd4218, %rd691; - @%p144 bra $L__BB1_211; - bra.uni $L__BB1_16; - -$L__BB1_211: - and.b64 %rd699, %rd11, 1; - setp.eq.s64 %p145, %rd699, 0; - @%p145 bra $L__BB1_214; - - and.b64 %rd2202, %rd11, 65534; - cvta.to.local.u64 %rd2204, %rd2190; - add.s64 %rd700, %rd2204, %rd2202; - add.s64 %rd2205, %rd690, %rd2202; - add.s64 %rd701, %rd2205, 2; - mov.u64 %rd4219, 0; - -$L__BB1_213: - add.s64 %rd2206, %rd701, %rd4219; - ld.local.u8 %rs2624, [%rd2206]; - add.s64 %rd2207, %rd700, %rd4219; - st.local.u8 [%rd2207], %rs2624; - add.s64 %rd4219, %rd4219, 1; - setp.lt.u64 %p146, %rd4219, %rd699; - @%p146 bra $L__BB1_213; - -$L__BB1_214: - mov.u64 %rd2208, 0; - st.local.u8 [%rd689], %rs1; - ld.local.v4.u16 {%rs2625, %rs2626, %rs2627, %rs2628}, [%rd680]; - ld.local.v4.u16 {%rs2633, %rs2634, %rs2635, %rs2636}, [%rd681]; - ld.local.v4.u16 {%rs2641, %rs2642, %rs2643, %rs2644}, [%rd682]; - ld.local.v4.u16 {%rs2649, %rs2650, %rs2651, %rs2652}, [%rd683]; - ld.local.v4.u16 {%rs2657, %rs2658, %rs2659, %rs2660}, [%rd684]; - ld.local.v4.u16 {%rs2665, %rs2666, %rs2667, %rs2668}, [%rd685]; - ld.local.v4.u16 {%rs2673, %rs2674, %rs2675, %rs2676}, [%rd686]; - mov.u32 %r647, 0; - shr.u16 %rs2679, %rs2676, 8; - ld.local.v4.u16 {%rs2680, %rs2681, %rs2682, %rs2683}, [%rd687]; - ld.local.v4.u16 {%rs2688, %rs2689, %rs2690, %rs2691}, [%rd689]; - and.b16 %rs2695, %rs2688, 255; - st.local.u64 [%rd1], %rd2208; - mov.u32 %r648, -1150833019; - mov.u32 %r649, 1779033703; - st.local.v2.u32 [%rd1+8], {%r649, %r648}; - mov.u32 %r650, -1521486534; - mov.u32 %r651, 1013904242; - st.local.v2.u32 [%rd1+16], {%r651, %r650}; - mov.u32 %r652, -1694144372; - mov.u32 %r653, 1359893119; - st.local.v2.u32 [%rd1+24], {%r653, %r652}; - mov.u32 %r654, 1541459225; - mov.u32 %r655, 528734635; - st.local.v2.u32 [%rd1+32], {%r655, %r654}; - st.local.v4.u16 [%rd1+40], {%rs2625, %rs2626, %rs2627, 
%rs2628}; - st.local.v4.u16 [%rd1+48], {%rs2633, %rs2634, %rs2635, %rs2636}; - st.local.v4.u16 [%rd1+56], {%rs2641, %rs2642, %rs2643, %rs2644}; - st.local.v4.u16 [%rd1+64], {%rs2649, %rs2650, %rs2651, %rs2652}; - st.local.v4.u16 [%rd1+72], {%rs2657, %rs2658, %rs2659, %rs2660}; - st.local.v4.u16 [%rd1+80], {%rs2665, %rs2666, %rs2667, %rs2668}; - st.local.v2.u16 [%rd1+88], {%rs2673, %rs2674}; - st.local.u16 [%rd1+92], %rs2675; - st.local.u8 [%rd1+94], %rs2676; - st.local.u8 [%rd1+95], %rs2679; - st.local.v4.u16 [%rd1+96], {%rs2680, %rs2681, %rs2682, %rs2683}; - st.local.v4.u16 [%rd1+104], {%rs2688, %rs2689, %rs2690, %rs2691}; - cvt.u64.u16 %rd2210, %rs2688; - and.b64 %rd705, %rd2210, 255; - cvt.u32.u16 %r656, %rs2688; - and.b32 %r657, %r656, 255; - mul.wide.u32 %rd2211, %r657, 8; - { - .reg .b32 %temp; - mov.b64 {%r658, %temp}, %rd2211; - } - { - .reg .b32 %temp; - mov.b64 {%temp, %r659}, %rd2211; - } - mov.u32 %r660, 291; - prmt.b32 %r661, %r658, %r647, %r660; - prmt.b32 %r662, %r659, %r647, %r660; - mov.b64 %rd706, {%r662, %r661}; - setp.lt.u16 %p147, %rs2695, 64; - @%p147 bra $L__BB1_216; - bra.uni $L__BB1_215; - -$L__BB1_216: - add.s64 %rd2212, %rd1, %rd705; - mov.u16 %rs2698, 128; - st.local.u8 [%rd2212+40], %rs2698; - add.s64 %rd707, %rd705, 1; - setp.eq.s64 %p148, %rd707, 64; - @%p148 bra $L__BB1_223; - - add.s64 %rd2213, %rd1, %rd707; - add.s64 %rd4224, %rd2213, 40; - mov.u16 %rs2699, 3; - sub.s16 %rs2700, %rs2699, %rs2688; - and.b16 %rs535, %rs2700, 3; - setp.eq.s16 %p149, %rs535, 0; - @%p149 bra $L__BB1_220; - - cvt.u64.u16 %rd2214, %rs535; - neg.s64 %rd4220, %rd2214; - mov.u64 %rd4221, %rd4224; - -$L__BB1_219: - .pragma "nounroll"; - add.s64 %rd4224, %rd4221, 1; - st.local.u8 [%rd4221], %rs2623; - add.s64 %rd4220, %rd4220, 1; - setp.ne.s64 %p150, %rd4220, 0; - mov.u64 %rd4221, %rd4224; - @%p150 bra $L__BB1_219; - -$L__BB1_220: - mov.u64 %rd2215, 62; - sub.s64 %rd2216, %rd2215, %rd705; - setp.lt.u64 %p151, %rd2216, 3; - @%p151 bra $L__BB1_223; - - sub.s64 
%rd2217, %rd1, %rd4224; - add.s64 %rd4223, %rd2217, 104; - -$L__BB1_222: - st.local.u8 [%rd4224], %rs2623; - st.local.u8 [%rd4224+1], %rs2623; - st.local.u8 [%rd4224+2], %rs2623; - st.local.u8 [%rd4224+3], %rs2623; - add.s64 %rd4223, %rd4223, -4; - setp.ne.s64 %p152, %rd4223, 0; - add.s64 %rd4224, %rd4224, 4; - @%p152 bra $L__BB1_222; - -$L__BB1_223: - add.s64 %rd721, %rd968, 40; - or.b64 %rd2219, %rd705, 7; - setp.eq.s64 %p153, %rd2219, 63; - add.s64 %rd722, %rd968, 8; - @%p153 bra $L__BB1_225; - bra.uni $L__BB1_224; - -$L__BB1_225: - mov.u64 %rd2221, 1; - { // callseq 25, 0 - .reg .b32 temp_param_reg; - .param .b64 param0; - st.param.b64 [param0+0], %rd722; - .param .b64 param1; - st.param.b64 [param1+0], %rd721; - .param .b64 param2; - st.param.b64 [param2+0], %rd2221; - call.uni - _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE, - ( - param0, - param1, - param2 - ); - } // callseq 25 - add.u64 %rd2222, %SP, 504; - add.u64 %rd2223, %SPL, 504; - st.local.u8 [%rd2223], %rs2623; - st.local.u8 [%rd2223+1], %rs2623; - st.local.u8 [%rd2223+2], %rs2623; - st.local.u8 [%rd2223+3], %rs2623; - st.local.u8 [%rd2223+4], %rs2623; - st.local.u8 [%rd2223+5], %rs2623; - st.local.u8 [%rd2223+6], %rs2623; - st.local.u8 [%rd2223+7], %rs2623; - st.local.u8 [%rd2223+8], %rs2623; - st.local.u8 [%rd2223+9], %rs2623; - st.local.u8 [%rd2223+10], %rs2623; - st.local.u8 [%rd2223+11], %rs2623; - st.local.u8 [%rd2223+12], %rs2623; - st.local.u8 [%rd2223+13], %rs2623; - st.local.u8 [%rd2223+14], %rs2623; - st.local.u8 [%rd2223+15], %rs2623; - st.local.u8 [%rd2223+16], %rs2623; - st.local.u8 [%rd2223+17], %rs2623; - st.local.u8 [%rd2223+18], %rs2623; - st.local.u8 [%rd2223+19], %rs2623; - st.local.u8 [%rd2223+20], %rs2623; - st.local.u8 [%rd2223+21], %rs2623; - st.local.u8 [%rd2223+22], %rs2623; - st.local.u8 [%rd2223+23], %rs2623; - st.local.u8 [%rd2223+24], %rs2623; - st.local.u8 [%rd2223+25], %rs2623; - st.local.u8 [%rd2223+26], %rs2623; - st.local.u8 [%rd2223+27], %rs2623; - st.local.u8 
[%rd2223+28], %rs2623; - st.local.u8 [%rd2223+29], %rs2623; - st.local.u8 [%rd2223+30], %rs2623; - st.local.u8 [%rd2223+31], %rs2623; - st.local.u8 [%rd2223+32], %rs2623; - st.local.u8 [%rd2223+33], %rs2623; - st.local.u8 [%rd2223+34], %rs2623; - st.local.u8 [%rd2223+35], %rs2623; - st.local.u8 [%rd2223+36], %rs2623; - st.local.u8 [%rd2223+37], %rs2623; - st.local.u8 [%rd2223+38], %rs2623; - st.local.u8 [%rd2223+39], %rs2623; - st.local.u8 [%rd2223+40], %rs2623; - st.local.u8 [%rd2223+41], %rs2623; - st.local.u8 [%rd2223+42], %rs2623; - st.local.u8 [%rd2223+43], %rs2623; - st.local.u8 [%rd2223+44], %rs2623; - st.local.u8 [%rd2223+45], %rs2623; - st.local.u8 [%rd2223+46], %rs2623; - st.local.u8 [%rd2223+47], %rs2623; - st.local.u8 [%rd2223+48], %rs2623; - st.local.u8 [%rd2223+49], %rs2623; - st.local.u8 [%rd2223+50], %rs2623; - st.local.u8 [%rd2223+51], %rs2623; - st.local.u8 [%rd2223+52], %rs2623; - st.local.u8 [%rd2223+53], %rs2623; - st.local.u8 [%rd2223+54], %rs2623; - st.local.u8 [%rd2223+55], %rs2623; - shr.u64 %rd2224, %rd706, 56; - st.local.u8 [%rd2223+63], %rd2224; - shr.u64 %rd2225, %rd706, 48; - st.local.u8 [%rd2223+62], %rd2225; - shr.u64 %rd2226, %rd706, 40; - st.local.u8 [%rd2223+61], %rd2226; - shr.u64 %rd2227, %rd706, 32; - st.local.u8 [%rd2223+60], %rd2227; - shr.u64 %rd2228, %rd706, 24; - st.local.u8 [%rd2223+59], %rd2228; - shr.u64 %rd2229, %rd706, 16; - st.local.u8 [%rd2223+58], %rd2229; - shr.u64 %rd2230, %rd706, 8; - st.local.u8 [%rd2223+57], %rd2230; - st.local.u8 [%rd2223+56], %rd706; - { // callseq 26, 0 - .reg .b32 temp_param_reg; - .param .b64 param0; - st.param.b64 [param0+0], %rd722; - .param .b64 param1; - st.param.b64 [param1+0], %rd2222; - .param .b64 param2; - st.param.b64 [param2+0], %rd2221; - call.uni - _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE, - ( - param0, - param1, - param2 - ); - } // callseq 26 - bra.uni $L__BB1_226; - -$L__BB1_17: - setp.gt.s16 %p2, %rs1380, 8; - @%p2 bra $L__BB1_23; - - setp.eq.s16 %p6, %rs1380, 8; 
- @%p6 bra $L__BB1_158; - bra.uni $L__BB1_19; - -$L__BB1_158: - setp.gt.u16 %p105, %rs1, 10; - add.u64 %rd1879, %SP, 352; - add.u64 %rd511, %SPL, 352; - mov.u16 %rs2264, 0; - st.local.v4.u16 [%rd511], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1880, %rd1879, 8; - cvta.to.local.u64 %rd512, %rd1880; - st.local.v4.u16 [%rd512], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1881, %rd1879, 16; - cvta.to.local.u64 %rd513, %rd1881; - st.local.v4.u16 [%rd513], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1882, %rd1879, 24; - cvta.to.local.u64 %rd514, %rd1882; - st.local.v4.u16 [%rd514], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1883, %rd1879, 32; - cvta.to.local.u64 %rd515, %rd1883; - st.local.v4.u16 [%rd515], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1884, %rd1879, 40; - cvta.to.local.u64 %rd516, %rd1884; - st.local.v4.u16 [%rd516], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1885, %rd1879, 48; - cvta.to.local.u64 %rd517, %rd1885; - st.local.v4.u16 [%rd517], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1886, %rd1879, 56; - cvta.to.local.u64 %rd518, %rd1886; - st.local.v4.u16 [%rd518], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1887, %rd1879, 64; - cvta.to.local.u64 %rd519, %rd1887; - st.local.v4.u16 [%rd519], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1888, %rd1879, 72; - cvta.to.local.u64 %rd520, %rd1888; - st.local.v4.u16 [%rd520], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1889, %rd1879, 80; - cvta.to.local.u64 %rd521, %rd1889; - st.local.v4.u16 [%rd521], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1890, %rd1879, 88; - cvta.to.local.u64 %rd522, %rd1890; - st.local.v4.u16 [%rd522], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1891, %rd1879, 96; - cvta.to.local.u64 %rd523, %rd1891; - st.local.v4.u16 [%rd523], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1892, %rd1879, 104; - cvta.to.local.u64 %rd524, %rd1892; - st.local.v4.u16 [%rd524], {%rs2264, %rs2264, %rs2264, %rs2264}; - 
add.s64 %rd1893, %rd1879, 112; - cvta.to.local.u64 %rd525, %rd1893; - st.local.v4.u16 [%rd525], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1894, %rd1879, 120; - cvta.to.local.u64 %rd526, %rd1894; - st.local.v4.u16 [%rd526], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1895, %rd1879, 128; - cvta.to.local.u64 %rd527, %rd1895; - st.local.v4.u16 [%rd527], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd1896, %rd1879, 136; - cvta.to.local.u64 %rd528, %rd1896; - st.local.v4.u16 [%rd528], {%rs2264, %rs2264, %rs2264, %rs2264}; - add.s64 %rd529, %rd1879, 144; - cvta.to.local.u64 %rd530, %rd529; - st.local.u8 [%rd530], %rs2264; - @%p105 bra $L__BB1_206; - - cvta.to.local.u64 %rd531, %rd978; - shr.u64 %rd532, %rd11, 1; - setp.eq.s64 %p106, %rd532, 0; - @%p106 bra $L__BB1_163; - - mov.u64 %rd4173, 1; - mov.u64 %rd4171, %rd531; - mov.u64 %rd4172, %rd511; - bra.uni $L__BB1_161; - -$L__BB1_162: - ld.local.u16 %rs2, [%rd4171+4]; - add.s64 %rd4173, %rd4173, 1; - add.s64 %rd4172, %rd4172, 2; - add.s64 %rd4171, %rd4171, 2; - -$L__BB1_161: - st.local.u16 [%rd4172], %rs2; - setp.ge.u64 %p107, %rd4173, %rd532; - @%p107 bra $L__BB1_163; - bra.uni $L__BB1_162; - -$L__BB1_163: - and.b64 %rd540, %rd11, 1; - setp.eq.s64 %p108, %rd540, 0; - @%p108 bra $L__BB1_166; - - and.b64 %rd1901, %rd11, 65534; - cvta.to.local.u64 %rd1903, %rd1879; - add.s64 %rd541, %rd1903, %rd1901; - add.s64 %rd1904, %rd531, %rd1901; - add.s64 %rd542, %rd1904, 2; - mov.u64 %rd4174, 0; - -$L__BB1_165: - add.s64 %rd1905, %rd542, %rd4174; - ld.local.u8 %rs2265, [%rd1905]; - add.s64 %rd1906, %rd541, %rd4174; - st.local.u8 [%rd1906], %rs2265; - add.s64 %rd4174, %rd4174, 1; - setp.lt.u64 %p109, %rd4174, %rd540; - @%p109 bra $L__BB1_165; - -$L__BB1_166: - mov.u64 %rd1907, 0; - st.local.u8 [%rd530], %rs1; - ld.local.v4.u16 {%rs2266, %rs2267, %rs2268, %rs2269}, [%rd511]; - ld.local.v4.u16 {%rs2274, %rs2275, %rs2276, %rs2277}, [%rd512]; - ld.local.v4.u16 {%rs2282, %rs2283, %rs2284, %rs2285}, [%rd513]; - 
ld.local.v4.u16 {%rs2290, %rs2291, %rs2292, %rs2293}, [%rd514]; - ld.local.v4.u16 {%rs2298, %rs2299, %rs2300, %rs2301}, [%rd515]; - shr.u16 %rs2304, %rs2301, 8; - ld.local.v4.u16 {%rs2305, %rs2306, %rs2307, %rs2308}, [%rd516]; - ld.local.v4.u16 {%rs2313, %rs2314, %rs2315, %rs2316}, [%rd517]; - ld.local.v4.u16 {%rs2321, %rs2322, %rs2323, %rs2324}, [%rd518]; - ld.local.v4.u16 {%rs2329, %rs2330, %rs2331, %rs2332}, [%rd519]; - ld.local.v4.u16 {%rs2337, %rs2338, %rs2339, %rs2340}, [%rd520]; - ld.local.v4.u16 {%rs2345, %rs2346, %rs2347, %rs2348}, [%rd521]; - ld.local.v4.u16 {%rs2353, %rs2354, %rs2355, %rs2356}, [%rd522]; - ld.local.v4.u16 {%rs2361, %rs2362, %rs2363, %rs2364}, [%rd523]; - shr.u16 %rs2367, %rs2364, 8; - ld.local.v4.u16 {%rs2368, %rs2369, %rs2370, %rs2371}, [%rd524]; - ld.local.v4.u16 {%rs2376, %rs2377, %rs2378, %rs2379}, [%rd525]; - ld.local.v4.u16 {%rs2384, %rs2385, %rs2386, %rs2387}, [%rd526]; - ld.local.v4.u16 {%rs2392, %rs2393, %rs2394, %rs2395}, [%rd527]; - ld.local.v4.u16 {%rs2400, %rs2401, %rs2402, %rs2403}, [%rd528]; - ld.local.v4.u16 {%rs2408, %rs2409, %rs2410, %rs2411}, [%rd530]; - and.b16 %rs2415, %rs2408, 255; - st.local.u64 [%rd1], %rd1907; - st.local.u64 [%rd1+8], %rd1907; - st.local.u64 [%rd1+16], %rd1907; - st.local.u64 [%rd1+24], %rd1907; - st.local.u64 [%rd1+32], %rd1907; - st.local.u64 [%rd1+40], %rd1907; - st.local.u64 [%rd1+48], %rd1907; - st.local.u64 [%rd1+56], %rd1907; - st.local.u64 [%rd1+64], %rd1907; - st.local.u64 [%rd1+72], %rd1907; - st.local.u64 [%rd1+80], %rd1907; - st.local.u64 [%rd1+88], %rd1907; - st.local.u64 [%rd1+96], %rd1907; - st.local.u64 [%rd1+104], %rd1907; - st.local.u64 [%rd1+112], %rd1907; - st.local.u64 [%rd1+120], %rd1907; - st.local.u64 [%rd1+128], %rd1907; - st.local.u64 [%rd1+136], %rd1907; - st.local.u64 [%rd1+144], %rd1907; - st.local.u64 [%rd1+152], %rd1907; - st.local.u64 [%rd1+160], %rd1907; - st.local.u64 [%rd1+168], %rd1907; - st.local.u64 [%rd1+176], %rd1907; - st.local.u64 [%rd1+184], %rd1907; - 
st.local.u64 [%rd1+192], %rd1907; - st.local.v4.u16 [%rd1+200], {%rs2266, %rs2267, %rs2268, %rs2269}; - st.local.v4.u16 [%rd1+208], {%rs2274, %rs2275, %rs2276, %rs2277}; - st.local.v4.u16 [%rd1+216], {%rs2282, %rs2283, %rs2284, %rs2285}; - st.local.v4.u16 [%rd1+224], {%rs2290, %rs2291, %rs2292, %rs2293}; - st.local.v2.u16 [%rd1+232], {%rs2298, %rs2299}; - st.local.u16 [%rd1+236], %rs2300; - st.local.u8 [%rd1+238], %rs2301; - st.local.u8 [%rd1+239], %rs2304; - st.local.v4.u16 [%rd1+240], {%rs2305, %rs2306, %rs2307, %rs2308}; - st.local.v4.u16 [%rd1+248], {%rs2313, %rs2314, %rs2315, %rs2316}; - st.local.v4.u16 [%rd1+256], {%rs2321, %rs2322, %rs2323, %rs2324}; - st.local.v4.u16 [%rd1+264], {%rs2329, %rs2330, %rs2331, %rs2332}; - st.local.v4.u16 [%rd1+272], {%rs2337, %rs2338, %rs2339, %rs2340}; - st.local.v4.u16 [%rd1+280], {%rs2345, %rs2346, %rs2347, %rs2348}; - st.local.v4.u16 [%rd1+288], {%rs2353, %rs2354, %rs2355, %rs2356}; - st.local.v2.u16 [%rd1+296], {%rs2361, %rs2362}; - st.local.u16 [%rd1+300], %rs2363; - st.local.u8 [%rd1+302], %rs2364; - st.local.u8 [%rd1+303], %rs2367; - st.local.v4.u16 [%rd1+304], {%rs2368, %rs2369, %rs2370, %rs2371}; - st.local.v4.u16 [%rd1+312], {%rs2376, %rs2377, %rs2378, %rs2379}; - st.local.v4.u16 [%rd1+320], {%rs2384, %rs2385, %rs2386, %rs2387}; - st.local.v4.u16 [%rd1+328], {%rs2392, %rs2393, %rs2394, %rs2395}; - st.local.v4.u16 [%rd1+336], {%rs2400, %rs2401, %rs2402, %rs2403}; - st.local.v4.u16 [%rd1+344], {%rs2408, %rs2409, %rs2410, %rs2411}; - setp.gt.u16 %p110, %rs2415, 144; - @%p110 bra $L__BB1_205; - - setp.eq.s16 %p111, %rs2415, 144; - @%p111 bra $L__BB1_203; - - cvt.u64.u16 %rd1909, %rs2408; - and.b64 %rd546, %rd1909, 255; - add.s64 %rd1910, %rd1, %rd546; - add.s64 %rd547, %rd1910, 200; - neg.s16 %rs2421, %rs2408; - and.b16 %rs369, %rs2421, 7; - setp.eq.s16 %p112, %rs369, 0; - mov.u64 %rd4181, %rd547; - @%p112 bra $L__BB1_171; - - cvt.u64.u16 %rd1911, %rs369; - neg.s64 %rd4175, %rd1911; - mov.u64 %rd4176, %rd547; - 
-$L__BB1_170: - .pragma "nounroll"; - add.s64 %rd4181, %rd4176, 1; - st.local.u8 [%rd4176], %rs2264; - add.s64 %rd4175, %rd4175, 1; - setp.ne.s64 %p113, %rd4175, 0; - mov.u64 %rd4176, %rd4181; - @%p113 bra $L__BB1_170; - -$L__BB1_171: - mov.u64 %rd1912, 143; - sub.s64 %rd1913, %rd1912, %rd546; - setp.lt.u64 %p114, %rd1913, 7; - @%p114 bra $L__BB1_178; - - add.s64 %rd1914, %rd1, 336; - sub.s64 %rd556, %rd1914, %rd4181; - shr.u64 %rd1915, %rd556, 3; - add.s64 %rd1916, %rd1915, 1; - and.b64 %rd557, %rd1916, 3; - setp.eq.s64 %p115, %rd557, 0; - mov.u64 %rd4184, %rd4181; - @%p115 bra $L__BB1_175; - - neg.s64 %rd4178, %rd557; - mov.u64 %rd4180, %rd4181; - -$L__BB1_174: - .pragma "nounroll"; - st.local.u8 [%rd4180], %rs2264; - st.local.u8 [%rd4180+1], %rs2264; - st.local.u8 [%rd4180+2], %rs2264; - st.local.u8 [%rd4180+3], %rs2264; - st.local.u8 [%rd4180+4], %rs2264; - st.local.u8 [%rd4180+5], %rs2264; - st.local.u8 [%rd4180+6], %rs2264; - add.s64 %rd4181, %rd4181, 8; - add.s64 %rd4184, %rd4180, 8; - st.local.u8 [%rd4180+7], %rs2264; - add.s64 %rd4178, %rd4178, 1; - setp.ne.s64 %p116, %rd4178, 0; - mov.u64 %rd4180, %rd4184; - @%p116 bra $L__BB1_174; - -$L__BB1_175: - setp.lt.u64 %p117, %rd556, 24; - @%p117 bra $L__BB1_178; - - sub.s64 %rd1917, %rd1, %rd4181; - add.s64 %rd4183, %rd1917, 344; - -$L__BB1_177: - st.local.u8 [%rd4184], %rs2264; - st.local.u8 [%rd4184+1], %rs2264; - st.local.u8 [%rd4184+2], %rs2264; - st.local.u8 [%rd4184+3], %rs2264; - st.local.u8 [%rd4184+4], %rs2264; - st.local.u8 [%rd4184+5], %rs2264; - st.local.u8 [%rd4184+6], %rs2264; - st.local.u8 [%rd4184+7], %rs2264; - st.local.u8 [%rd4184+8], %rs2264; - st.local.u8 [%rd4184+9], %rs2264; - st.local.u8 [%rd4184+10], %rs2264; - st.local.u8 [%rd4184+11], %rs2264; - st.local.u8 [%rd4184+12], %rs2264; - st.local.u8 [%rd4184+13], %rs2264; - st.local.u8 [%rd4184+14], %rs2264; - st.local.u8 [%rd4184+15], %rs2264; - st.local.u8 [%rd4184+16], %rs2264; - st.local.u8 [%rd4184+17], %rs2264; - st.local.u8 
[%rd4184+18], %rs2264; - st.local.u8 [%rd4184+19], %rs2264; - st.local.u8 [%rd4184+20], %rs2264; - st.local.u8 [%rd4184+21], %rs2264; - st.local.u8 [%rd4184+22], %rs2264; - st.local.u8 [%rd4184+23], %rs2264; - st.local.u8 [%rd4184+24], %rs2264; - st.local.u8 [%rd4184+25], %rs2264; - st.local.u8 [%rd4184+26], %rs2264; - st.local.u8 [%rd4184+27], %rs2264; - st.local.u8 [%rd4184+28], %rs2264; - st.local.u8 [%rd4184+29], %rs2264; - st.local.u8 [%rd4184+30], %rs2264; - st.local.u8 [%rd4184+31], %rs2264; - add.s64 %rd4183, %rd4183, -32; - setp.ne.s64 %p118, %rd4183, 0; - add.s64 %rd4184, %rd4184, 32; - @%p118 bra $L__BB1_177; - -$L__BB1_178: - st.local.u8 [%rd1+344], %rs2264; - setp.gt.u16 %p119, %rs2415, 143; - @%p119 bra $L__BB1_204; - - mov.u16 %rs2427, 6; - st.local.u8 [%rd547], %rs2427; - ld.local.u8 %rs2428, [%rd1+343]; - or.b16 %rs2429, %rs2428, 128; - st.local.u8 [%rd1+343], %rs2429; - ld.local.u64 %rd1918, [%rd1+200]; - shl.b64 %rd1919, %rd1918, 8; - mov.b64 {%r539, %r540}, %rd1919; - shr.u64 %rd1920, %rd1918, 56; - mov.b64 {%r541, %r542}, %rd1920; - mov.b32 {%rs378, %rs2430}, %r541; - mov.b32 {%rs374, %rs376}, %r540; - shr.u16 %rs377, %rs376, 8; - shr.u16 %rs375, %rs374, 8; - mov.b32 {%rs370, %rs372}, %r539; - shr.u16 %rs373, %rs372, 8; - shr.u16 %rs371, %rs370, 8; - mov.pred %p120, 0; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2431, %rs372, 8; - or.b16 %rs2432, %rs371, %rs2431; - shl.b16 %rs2433, %rs374, 8; - or.b16 %rs2434, %rs373, %rs2433; - mov.b32 %r543, {%rs2432, %rs2434}; - shl.b16 %rs2435, %rs376, 8; - or.b16 %rs2436, %rs375, %rs2435; - shl.b16 %rs2437, %rs378, 8; - or.b16 %rs2438, %rs377, %rs2437; - mov.b32 %r544, {%rs2436, %rs2438}; - mov.b64 %rd1921, {%r543, %r544}; - ld.local.u64 %rd1922, [%rd1]; - xor.b64 %rd4215, %rd1922, %rd1921; - st.local.u64 [%rd1], %rd4215; - ld.local.u64 %rd1923, [%rd1+208]; - shl.b64 %rd1924, %rd1923, 8; - mov.b64 {%r545, %r546}, %rd1924; - shr.u64 %rd1925, %rd1923, 56; - mov.b64 {%r547, %r548}, %rd1925; - mov.b32 {%rs387, 
%rs2439}, %r547; - mov.b32 {%rs383, %rs385}, %r546; - shr.u16 %rs386, %rs385, 8; - shr.u16 %rs384, %rs383, 8; - mov.b32 {%rs379, %rs381}, %r545; - shr.u16 %rs382, %rs381, 8; - shr.u16 %rs380, %rs379, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2440, %rs381, 8; - or.b16 %rs2441, %rs380, %rs2440; - shl.b16 %rs2442, %rs383, 8; - or.b16 %rs2443, %rs382, %rs2442; - mov.b32 %r549, {%rs2441, %rs2443}; - shl.b16 %rs2444, %rs385, 8; - or.b16 %rs2445, %rs384, %rs2444; - shl.b16 %rs2446, %rs387, 8; - or.b16 %rs2447, %rs386, %rs2446; - mov.b32 %r550, {%rs2445, %rs2447}; - mov.b64 %rd1926, {%r549, %r550}; - ld.local.u64 %rd1927, [%rd1+8]; - xor.b64 %rd4214, %rd1927, %rd1926; - st.local.u64 [%rd1+8], %rd4214; - ld.local.u64 %rd1928, [%rd1+216]; - shl.b64 %rd1929, %rd1928, 8; - mov.b64 {%r551, %r552}, %rd1929; - shr.u64 %rd1930, %rd1928, 56; - mov.b64 {%r553, %r554}, %rd1930; - mov.b32 {%rs396, %rs2448}, %r553; - mov.b32 {%rs392, %rs394}, %r552; - shr.u16 %rs395, %rs394, 8; - shr.u16 %rs393, %rs392, 8; - mov.b32 {%rs388, %rs390}, %r551; - shr.u16 %rs391, %rs390, 8; - shr.u16 %rs389, %rs388, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2449, %rs390, 8; - or.b16 %rs2450, %rs389, %rs2449; - shl.b16 %rs2451, %rs392, 8; - or.b16 %rs2452, %rs391, %rs2451; - mov.b32 %r555, {%rs2450, %rs2452}; - shl.b16 %rs2453, %rs394, 8; - or.b16 %rs2454, %rs393, %rs2453; - shl.b16 %rs2455, %rs396, 8; - or.b16 %rs2456, %rs395, %rs2455; - mov.b32 %r556, {%rs2454, %rs2456}; - mov.b64 %rd1931, {%r555, %r556}; - ld.local.u64 %rd1932, [%rd1+16]; - xor.b64 %rd4213, %rd1932, %rd1931; - st.local.u64 [%rd1+16], %rd4213; - ld.local.u64 %rd1933, [%rd1+224]; - shl.b64 %rd1934, %rd1933, 8; - mov.b64 {%r557, %r558}, %rd1934; - shr.u64 %rd1935, %rd1933, 56; - mov.b64 {%r559, %r560}, %rd1935; - mov.b32 {%rs405, %rs2457}, %r559; - mov.b32 {%rs401, %rs403}, %r558; - shr.u16 %rs404, %rs403, 8; - shr.u16 %rs402, %rs401, 8; - mov.b32 {%rs397, %rs399}, %r557; - shr.u16 %rs400, %rs399, 8; - shr.u16 %rs398, %rs397, 8; - @%p120 
bra $L__BB1_197; - - shl.b16 %rs2458, %rs399, 8; - or.b16 %rs2459, %rs398, %rs2458; - shl.b16 %rs2460, %rs401, 8; - or.b16 %rs2461, %rs400, %rs2460; - mov.b32 %r561, {%rs2459, %rs2461}; - shl.b16 %rs2462, %rs403, 8; - or.b16 %rs2463, %rs402, %rs2462; - shl.b16 %rs2464, %rs405, 8; - or.b16 %rs2465, %rs404, %rs2464; - mov.b32 %r562, {%rs2463, %rs2465}; - mov.b64 %rd1936, {%r561, %r562}; - ld.local.u64 %rd1937, [%rd1+24]; - xor.b64 %rd4212, %rd1937, %rd1936; - st.local.u64 [%rd1+24], %rd4212; - ld.local.u64 %rd1938, [%rd1+232]; - shl.b64 %rd1939, %rd1938, 8; - mov.b64 {%r563, %r564}, %rd1939; - shr.u64 %rd1940, %rd1938, 56; - mov.b64 {%r565, %r566}, %rd1940; - mov.b32 {%rs414, %rs2466}, %r565; - mov.b32 {%rs410, %rs412}, %r564; - shr.u16 %rs413, %rs412, 8; - shr.u16 %rs411, %rs410, 8; - mov.b32 {%rs406, %rs408}, %r563; - shr.u16 %rs409, %rs408, 8; - shr.u16 %rs407, %rs406, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2467, %rs408, 8; - or.b16 %rs2468, %rs407, %rs2467; - shl.b16 %rs2469, %rs410, 8; - or.b16 %rs2470, %rs409, %rs2469; - mov.b32 %r567, {%rs2468, %rs2470}; - shl.b16 %rs2471, %rs412, 8; - or.b16 %rs2472, %rs411, %rs2471; - shl.b16 %rs2473, %rs414, 8; - or.b16 %rs2474, %rs413, %rs2473; - mov.b32 %r568, {%rs2472, %rs2474}; - mov.b64 %rd1941, {%r567, %r568}; - ld.local.u64 %rd1942, [%rd1+32]; - xor.b64 %rd4186, %rd1942, %rd1941; - st.local.u64 [%rd1+32], %rd4186; - ld.local.u64 %rd1943, [%rd1+240]; - shl.b64 %rd1944, %rd1943, 8; - mov.b64 {%r569, %r570}, %rd1944; - shr.u64 %rd1945, %rd1943, 56; - mov.b64 {%r571, %r572}, %rd1945; - mov.b32 {%rs423, %rs2475}, %r571; - mov.b32 {%rs419, %rs421}, %r570; - shr.u16 %rs422, %rs421, 8; - shr.u16 %rs420, %rs419, 8; - mov.b32 {%rs415, %rs417}, %r569; - shr.u16 %rs418, %rs417, 8; - shr.u16 %rs416, %rs415, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2476, %rs417, 8; - or.b16 %rs2477, %rs416, %rs2476; - shl.b16 %rs2478, %rs419, 8; - or.b16 %rs2479, %rs418, %rs2478; - mov.b32 %r573, {%rs2477, %rs2479}; - shl.b16 %rs2480, 
%rs421, 8; - or.b16 %rs2481, %rs420, %rs2480; - shl.b16 %rs2482, %rs423, 8; - or.b16 %rs2483, %rs422, %rs2482; - mov.b32 %r574, {%rs2481, %rs2483}; - mov.b64 %rd1946, {%r573, %r574}; - ld.local.u64 %rd1947, [%rd1+40]; - xor.b64 %rd4209, %rd1947, %rd1946; - st.local.u64 [%rd1+40], %rd4209; - ld.local.u64 %rd1948, [%rd1+248]; - shl.b64 %rd1949, %rd1948, 8; - mov.b64 {%r575, %r576}, %rd1949; - shr.u64 %rd1950, %rd1948, 56; - mov.b64 {%r577, %r578}, %rd1950; - mov.b32 {%rs432, %rs2484}, %r577; - mov.b32 {%rs428, %rs430}, %r576; - shr.u16 %rs431, %rs430, 8; - shr.u16 %rs429, %rs428, 8; - mov.b32 {%rs424, %rs426}, %r575; - shr.u16 %rs427, %rs426, 8; - shr.u16 %rs425, %rs424, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2485, %rs426, 8; - or.b16 %rs2486, %rs425, %rs2485; - shl.b16 %rs2487, %rs428, 8; - or.b16 %rs2488, %rs427, %rs2487; - mov.b32 %r579, {%rs2486, %rs2488}; - shl.b16 %rs2489, %rs430, 8; - or.b16 %rs2490, %rs429, %rs2489; - shl.b16 %rs2491, %rs432, 8; - or.b16 %rs2492, %rs431, %rs2491; - mov.b32 %r580, {%rs2490, %rs2492}; - mov.b64 %rd1951, {%r579, %r580}; - ld.local.u64 %rd1952, [%rd1+48]; - xor.b64 %rd4205, %rd1952, %rd1951; - st.local.u64 [%rd1+48], %rd4205; - ld.local.u64 %rd1953, [%rd1+256]; - shl.b64 %rd1954, %rd1953, 8; - mov.b64 {%r581, %r582}, %rd1954; - shr.u64 %rd1955, %rd1953, 56; - mov.b64 {%r583, %r584}, %rd1955; - mov.b32 {%rs441, %rs2493}, %r583; - mov.b32 {%rs437, %rs439}, %r582; - shr.u16 %rs440, %rs439, 8; - shr.u16 %rs438, %rs437, 8; - mov.b32 {%rs433, %rs435}, %r581; - shr.u16 %rs436, %rs435, 8; - shr.u16 %rs434, %rs433, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2494, %rs435, 8; - or.b16 %rs2495, %rs434, %rs2494; - shl.b16 %rs2496, %rs437, 8; - or.b16 %rs2497, %rs436, %rs2496; - mov.b32 %r585, {%rs2495, %rs2497}; - shl.b16 %rs2498, %rs439, 8; - or.b16 %rs2499, %rs438, %rs2498; - shl.b16 %rs2500, %rs441, 8; - or.b16 %rs2501, %rs440, %rs2500; - mov.b32 %r586, {%rs2499, %rs2501}; - mov.b64 %rd1956, {%r585, %r586}; - ld.local.u64 %rd1957, 
[%rd1+56]; - xor.b64 %rd4201, %rd1957, %rd1956; - st.local.u64 [%rd1+56], %rd4201; - ld.local.u64 %rd1958, [%rd1+264]; - shl.b64 %rd1959, %rd1958, 8; - mov.b64 {%r587, %r588}, %rd1959; - shr.u64 %rd1960, %rd1958, 56; - mov.b64 {%r589, %r590}, %rd1960; - mov.b32 {%rs450, %rs2502}, %r589; - mov.b32 {%rs446, %rs448}, %r588; - shr.u16 %rs449, %rs448, 8; - shr.u16 %rs447, %rs446, 8; - mov.b32 {%rs442, %rs444}, %r587; - shr.u16 %rs445, %rs444, 8; - shr.u16 %rs443, %rs442, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2503, %rs444, 8; - or.b16 %rs2504, %rs443, %rs2503; - shl.b16 %rs2505, %rs446, 8; - or.b16 %rs2506, %rs445, %rs2505; - mov.b32 %r591, {%rs2504, %rs2506}; - shl.b16 %rs2507, %rs448, 8; - or.b16 %rs2508, %rs447, %rs2507; - shl.b16 %rs2509, %rs450, 8; - or.b16 %rs2510, %rs449, %rs2509; - mov.b32 %r592, {%rs2508, %rs2510}; - mov.b64 %rd1961, {%r591, %r592}; - ld.local.u64 %rd1962, [%rd1+64]; - xor.b64 %rd4197, %rd1962, %rd1961; - st.local.u64 [%rd1+64], %rd4197; - ld.local.u64 %rd1963, [%rd1+272]; - shl.b64 %rd1964, %rd1963, 8; - mov.b64 {%r593, %r594}, %rd1964; - shr.u64 %rd1965, %rd1963, 56; - mov.b64 {%r595, %r596}, %rd1965; - mov.b32 {%rs459, %rs2511}, %r595; - mov.b32 {%rs455, %rs457}, %r594; - shr.u16 %rs458, %rs457, 8; - shr.u16 %rs456, %rs455, 8; - mov.b32 {%rs451, %rs453}, %r593; - shr.u16 %rs454, %rs453, 8; - shr.u16 %rs452, %rs451, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2512, %rs453, 8; - or.b16 %rs2513, %rs452, %rs2512; - shl.b16 %rs2514, %rs455, 8; - or.b16 %rs2515, %rs454, %rs2514; - mov.b32 %r597, {%rs2513, %rs2515}; - shl.b16 %rs2516, %rs457, 8; - or.b16 %rs2517, %rs456, %rs2516; - shl.b16 %rs2518, %rs459, 8; - or.b16 %rs2519, %rs458, %rs2518; - mov.b32 %r598, {%rs2517, %rs2519}; - mov.b64 %rd1966, {%r597, %r598}; - ld.local.u64 %rd1967, [%rd1+72]; - xor.b64 %rd4193, %rd1967, %rd1966; - st.local.u64 [%rd1+72], %rd4193; - ld.local.u64 %rd1968, [%rd1+280]; - shl.b64 %rd1969, %rd1968, 8; - mov.b64 {%r599, %r600}, %rd1969; - shr.u64 %rd1970, 
%rd1968, 56; - mov.b64 {%r601, %r602}, %rd1970; - mov.b32 {%rs468, %rs2520}, %r601; - mov.b32 {%rs464, %rs466}, %r600; - shr.u16 %rs467, %rs466, 8; - shr.u16 %rs465, %rs464, 8; - mov.b32 {%rs460, %rs462}, %r599; - shr.u16 %rs463, %rs462, 8; - shr.u16 %rs461, %rs460, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2521, %rs462, 8; - or.b16 %rs2522, %rs461, %rs2521; - shl.b16 %rs2523, %rs464, 8; - or.b16 %rs2524, %rs463, %rs2523; - mov.b32 %r603, {%rs2522, %rs2524}; - shl.b16 %rs2525, %rs466, 8; - or.b16 %rs2526, %rs465, %rs2525; - shl.b16 %rs2527, %rs468, 8; - or.b16 %rs2528, %rs467, %rs2527; - mov.b32 %r604, {%rs2526, %rs2528}; - mov.b64 %rd1971, {%r603, %r604}; - ld.local.u64 %rd1972, [%rd1+80]; - xor.b64 %rd4208, %rd1972, %rd1971; - st.local.u64 [%rd1+80], %rd4208; - ld.local.u64 %rd1973, [%rd1+288]; - shl.b64 %rd1974, %rd1973, 8; - mov.b64 {%r605, %r606}, %rd1974; - shr.u64 %rd1975, %rd1973, 56; - mov.b64 {%r607, %r608}, %rd1975; - mov.b32 {%rs477, %rs2529}, %r607; - mov.b32 {%rs473, %rs475}, %r606; - shr.u16 %rs476, %rs475, 8; - shr.u16 %rs474, %rs473, 8; - mov.b32 {%rs469, %rs471}, %r605; - shr.u16 %rs472, %rs471, 8; - shr.u16 %rs470, %rs469, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2530, %rs471, 8; - or.b16 %rs2531, %rs470, %rs2530; - shl.b16 %rs2532, %rs473, 8; - or.b16 %rs2533, %rs472, %rs2532; - mov.b32 %r609, {%rs2531, %rs2533}; - shl.b16 %rs2534, %rs475, 8; - or.b16 %rs2535, %rs474, %rs2534; - shl.b16 %rs2536, %rs477, 8; - or.b16 %rs2537, %rs476, %rs2536; - mov.b32 %r610, {%rs2535, %rs2537}; - mov.b64 %rd1976, {%r609, %r610}; - ld.local.u64 %rd1977, [%rd1+88]; - xor.b64 %rd4204, %rd1977, %rd1976; - st.local.u64 [%rd1+88], %rd4204; - ld.local.u64 %rd1978, [%rd1+296]; - shl.b64 %rd1979, %rd1978, 8; - mov.b64 {%r611, %r612}, %rd1979; - shr.u64 %rd1980, %rd1978, 56; - mov.b64 {%r613, %r614}, %rd1980; - mov.b32 {%rs486, %rs2538}, %r613; - mov.b32 {%rs482, %rs484}, %r612; - shr.u16 %rs485, %rs484, 8; - shr.u16 %rs483, %rs482, 8; - mov.b32 {%rs478, %rs480}, 
%r611; - shr.u16 %rs481, %rs480, 8; - shr.u16 %rs479, %rs478, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2539, %rs480, 8; - or.b16 %rs2540, %rs479, %rs2539; - shl.b16 %rs2541, %rs482, 8; - or.b16 %rs2542, %rs481, %rs2541; - mov.b32 %r615, {%rs2540, %rs2542}; - shl.b16 %rs2543, %rs484, 8; - or.b16 %rs2544, %rs483, %rs2543; - shl.b16 %rs2545, %rs486, 8; - or.b16 %rs2546, %rs485, %rs2545; - mov.b32 %r616, {%rs2544, %rs2546}; - mov.b64 %rd1981, {%r615, %r616}; - ld.local.u64 %rd1982, [%rd1+96]; - xor.b64 %rd4200, %rd1982, %rd1981; - st.local.u64 [%rd1+96], %rd4200; - ld.local.u64 %rd1983, [%rd1+304]; - shl.b64 %rd1984, %rd1983, 8; - mov.b64 {%r617, %r618}, %rd1984; - shr.u64 %rd1985, %rd1983, 56; - mov.b64 {%r619, %r620}, %rd1985; - mov.b32 {%rs495, %rs2547}, %r619; - mov.b32 {%rs491, %rs493}, %r618; - shr.u16 %rs494, %rs493, 8; - shr.u16 %rs492, %rs491, 8; - mov.b32 {%rs487, %rs489}, %r617; - shr.u16 %rs490, %rs489, 8; - shr.u16 %rs488, %rs487, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2548, %rs489, 8; - or.b16 %rs2549, %rs488, %rs2548; - shl.b16 %rs2550, %rs491, 8; - or.b16 %rs2551, %rs490, %rs2550; - mov.b32 %r621, {%rs2549, %rs2551}; - shl.b16 %rs2552, %rs493, 8; - or.b16 %rs2553, %rs492, %rs2552; - shl.b16 %rs2554, %rs495, 8; - or.b16 %rs2555, %rs494, %rs2554; - mov.b32 %r622, {%rs2553, %rs2555}; - mov.b64 %rd1986, {%r621, %r622}; - ld.local.u64 %rd1987, [%rd1+104]; - xor.b64 %rd4196, %rd1987, %rd1986; - st.local.u64 [%rd1+104], %rd4196; - ld.local.u64 %rd1988, [%rd1+312]; - shl.b64 %rd1989, %rd1988, 8; - mov.b64 {%r623, %r624}, %rd1989; - shr.u64 %rd1990, %rd1988, 56; - mov.b64 {%r625, %r626}, %rd1990; - mov.b32 {%rs504, %rs2556}, %r625; - mov.b32 {%rs500, %rs502}, %r624; - shr.u16 %rs503, %rs502, 8; - shr.u16 %rs501, %rs500, 8; - mov.b32 {%rs496, %rs498}, %r623; - shr.u16 %rs499, %rs498, 8; - shr.u16 %rs497, %rs496, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2557, %rs498, 8; - or.b16 %rs2558, %rs497, %rs2557; - shl.b16 %rs2559, %rs500, 8; - or.b16 %rs2560, 
%rs499, %rs2559; - mov.b32 %r627, {%rs2558, %rs2560}; - shl.b16 %rs2561, %rs502, 8; - or.b16 %rs2562, %rs501, %rs2561; - shl.b16 %rs2563, %rs504, 8; - or.b16 %rs2564, %rs503, %rs2563; - mov.b32 %r628, {%rs2562, %rs2564}; - mov.b64 %rd1991, {%r627, %r628}; - ld.local.u64 %rd1992, [%rd1+112]; - xor.b64 %rd4192, %rd1992, %rd1991; - st.local.u64 [%rd1+112], %rd4192; - ld.local.u64 %rd1993, [%rd1+320]; - shl.b64 %rd1994, %rd1993, 8; - mov.b64 {%r629, %r630}, %rd1994; - shr.u64 %rd1995, %rd1993, 56; - mov.b64 {%r631, %r632}, %rd1995; - mov.b32 {%rs513, %rs2565}, %r631; - mov.b32 {%rs509, %rs511}, %r630; - shr.u16 %rs512, %rs511, 8; - shr.u16 %rs510, %rs509, 8; - mov.b32 {%rs505, %rs507}, %r629; - shr.u16 %rs508, %rs507, 8; - shr.u16 %rs506, %rs505, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2566, %rs507, 8; - or.b16 %rs2567, %rs506, %rs2566; - shl.b16 %rs2568, %rs509, 8; - or.b16 %rs2569, %rs508, %rs2568; - mov.b32 %r633, {%rs2567, %rs2569}; - shl.b16 %rs2570, %rs511, 8; - or.b16 %rs2571, %rs510, %rs2570; - shl.b16 %rs2572, %rs513, 8; - or.b16 %rs2573, %rs512, %rs2572; - mov.b32 %r634, {%rs2571, %rs2573}; - mov.b64 %rd1996, {%r633, %r634}; - ld.local.u64 %rd1997, [%rd1+120]; - xor.b64 %rd4207, %rd1997, %rd1996; - st.local.u64 [%rd1+120], %rd4207; - ld.local.u64 %rd1998, [%rd1+328]; - shl.b64 %rd1999, %rd1998, 8; - mov.b64 {%r635, %r636}, %rd1999; - shr.u64 %rd2000, %rd1998, 56; - mov.b64 {%r637, %r638}, %rd2000; - mov.b32 {%rs522, %rs2574}, %r637; - mov.b32 {%rs518, %rs520}, %r636; - shr.u16 %rs521, %rs520, 8; - shr.u16 %rs519, %rs518, 8; - mov.b32 {%rs514, %rs516}, %r635; - shr.u16 %rs517, %rs516, 8; - shr.u16 %rs515, %rs514, 8; - @%p120 bra $L__BB1_197; - - shl.b16 %rs2575, %rs516, 8; - or.b16 %rs2576, %rs515, %rs2575; - shl.b16 %rs2577, %rs518, 8; - or.b16 %rs2578, %rs517, %rs2577; - mov.b32 %r639, {%rs2576, %rs2578}; - shl.b16 %rs2579, %rs520, 8; - or.b16 %rs2580, %rs519, %rs2579; - shl.b16 %rs2581, %rs522, 8; - or.b16 %rs2582, %rs521, %rs2581; - mov.b32 %r640, 
{%rs2580, %rs2582}; - mov.b64 %rd2001, {%r639, %r640}; - ld.local.u64 %rd2002, [%rd1+128]; - xor.b64 %rd4203, %rd2002, %rd2001; - st.local.u64 [%rd1+128], %rd4203; - ld.local.u64 %rd2003, [%rd1+336]; - shl.b64 %rd2004, %rd2003, 8; - mov.b64 {%r641, %r642}, %rd2004; - shr.u64 %rd2005, %rd2003, 56; - mov.b64 {%r643, %r644}, %rd2005; - mov.b32 {%rs531, %rs2583}, %r643; - mov.b32 {%rs527, %rs529}, %r642; - shr.u16 %rs530, %rs529, 8; - shr.u16 %rs528, %rs527, 8; - mov.b32 {%rs523, %rs525}, %r641; - shr.u16 %rs526, %rs525, 8; - shr.u16 %rs524, %rs523, 8; - mov.pred %p137, -1; - @%p137 bra $L__BB1_198; - bra.uni $L__BB1_197; - -$L__BB1_198: - shl.b16 %rs2584, %rs525, 8; - or.b16 %rs2585, %rs524, %rs2584; - shl.b16 %rs2586, %rs527, 8; - or.b16 %rs2587, %rs526, %rs2586; - mov.b32 %r645, {%rs2585, %rs2587}; - shl.b16 %rs2588, %rs529, 8; - or.b16 %rs2589, %rs528, %rs2588; - shl.b16 %rs2590, %rs531, 8; - or.b16 %rs2591, %rs530, %rs2590; - mov.b32 %r646, {%rs2589, %rs2591}; - mov.b64 %rd2006, {%r645, %r646}; - ld.local.u64 %rd2007, [%rd1+136]; - xor.b64 %rd4199, %rd2007, %rd2006; - st.local.u64 [%rd1+136], %rd4199; - @%p120 bra $L__BB1_202; - - add.s64 %rd2011, %rd968, 40; - cvta.to.local.u64 %rd591, %rd2011; - add.s64 %rd2012, %rd968, 80; - cvta.to.local.u64 %rd592, %rd2012; - add.s64 %rd2013, %rd968, 120; - cvta.to.local.u64 %rd593, %rd2013; - add.s64 %rd2014, %rd968, 160; - cvta.to.local.u64 %rd594, %rd2014; - add.s64 %rd2015, %rd968, 8; - cvta.to.local.u64 %rd595, %rd2015; - add.s64 %rd2016, %rd968, 48; - cvta.to.local.u64 %rd596, %rd2016; - add.s64 %rd2017, %rd968, 88; - cvta.to.local.u64 %rd597, %rd2017; - add.s64 %rd2018, %rd968, 128; - cvta.to.local.u64 %rd598, %rd2018; - add.s64 %rd2019, %rd968, 168; - cvta.to.local.u64 %rd599, %rd2019; - add.s64 %rd2020, %rd968, 16; - cvta.to.local.u64 %rd600, %rd2020; - add.s64 %rd2021, %rd968, 56; - cvta.to.local.u64 %rd601, %rd2021; - add.s64 %rd2022, %rd968, 96; - cvta.to.local.u64 %rd602, %rd2022; - add.s64 %rd2023, %rd968, 136; 
- cvta.to.local.u64 %rd603, %rd2023; - add.s64 %rd2024, %rd968, 176; - cvta.to.local.u64 %rd604, %rd2024; - add.s64 %rd2025, %rd968, 24; - cvta.to.local.u64 %rd605, %rd2025; - add.s64 %rd2026, %rd968, 64; - cvta.to.local.u64 %rd606, %rd2026; - add.s64 %rd2027, %rd968, 104; - cvta.to.local.u64 %rd607, %rd2027; - add.s64 %rd2028, %rd968, 144; - cvta.to.local.u64 %rd608, %rd2028; - add.s64 %rd2029, %rd968, 184; - cvta.to.local.u64 %rd609, %rd2029; - add.s64 %rd2030, %rd968, 32; - cvta.to.local.u64 %rd610, %rd2030; - add.s64 %rd2031, %rd968, 72; - cvta.to.local.u64 %rd611, %rd2031; - add.s64 %rd2032, %rd968, 112; - cvta.to.local.u64 %rd612, %rd2032; - add.s64 %rd2033, %rd968, 152; - cvta.to.local.u64 %rd613, %rd2033; - add.s64 %rd2034, %rd968, 192; - mov.u64 %rd4185, 192; - cvta.to.local.u64 %rd614, %rd2034; - ld.local.u64 %rd4206, [%rd594]; - ld.local.u64 %rd4202, [%rd599]; - ld.local.u64 %rd4198, [%rd604]; - ld.local.u64 %rd4195, [%rd608]; - ld.local.u64 %rd4194, [%rd609]; - ld.local.u64 %rd4191, [%rd613]; - ld.local.u64 %rd4190, [%rd614]; - mov.u64 %rd4211, private$9214; - -$L__BB1_200: - add.s64 %rd649, %rd4211, 8; - xor.b64 %rd2035, %rd4207, %rd4206; - xor.b64 %rd2036, %rd2035, %rd4208; - xor.b64 %rd2037, %rd2036, %rd4209; - xor.b64 %rd2038, %rd2037, %rd4215; - xor.b64 %rd2039, %rd4202, %rd4214; - xor.b64 %rd2040, %rd2039, %rd4203; - xor.b64 %rd2041, %rd2040, %rd4204; - xor.b64 %rd2042, %rd2041, %rd4205; - xor.b64 %rd2043, %rd4198, %rd4213; - xor.b64 %rd2044, %rd2043, %rd4199; - xor.b64 %rd2045, %rd2044, %rd4200; - xor.b64 %rd2046, %rd2045, %rd4201; - xor.b64 %rd2047, %rd4194, %rd4212; - xor.b64 %rd2048, %rd2047, %rd4195; - xor.b64 %rd2049, %rd2048, %rd4196; - xor.b64 %rd2050, %rd2049, %rd4197; - xor.b64 %rd2051, %rd4190, %rd4186; - xor.b64 %rd2052, %rd2051, %rd4191; - xor.b64 %rd2053, %rd2052, %rd4192; - xor.b64 %rd2054, %rd2053, %rd4193; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2042, 1; - shr.b64 %rhs, %rd2042, 63; - add.u64 %rd2055, %lhs, 
%rhs; - } - xor.b64 %rd2056, %rd2055, %rd2054; - xor.b64 %rd2057, %rd4215, %rd2056; - xor.b64 %rd2058, %rd2056, %rd4209; - xor.b64 %rd2059, %rd2056, %rd4208; - xor.b64 %rd2060, %rd2056, %rd4207; - xor.b64 %rd2061, %rd2056, %rd4206; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2046, 1; - shr.b64 %rhs, %rd2046, 63; - add.u64 %rd2062, %lhs, %rhs; - } - xor.b64 %rd2063, %rd2038, %rd2062; - xor.b64 %rd2064, %rd2063, %rd4214; - xor.b64 %rd2065, %rd2063, %rd4205; - xor.b64 %rd2066, %rd2063, %rd4204; - xor.b64 %rd2067, %rd2063, %rd4203; - xor.b64 %rd2068, %rd2063, %rd4202; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2050, 1; - shr.b64 %rhs, %rd2050, 63; - add.u64 %rd2069, %lhs, %rhs; - } - xor.b64 %rd2070, %rd2042, %rd2069; - xor.b64 %rd2071, %rd2070, %rd4213; - xor.b64 %rd2072, %rd2070, %rd4201; - xor.b64 %rd2073, %rd2070, %rd4200; - xor.b64 %rd2074, %rd2070, %rd4199; - xor.b64 %rd2075, %rd2070, %rd4198; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2054, 1; - shr.b64 %rhs, %rd2054, 63; - add.u64 %rd2076, %lhs, %rhs; - } - xor.b64 %rd2077, %rd2046, %rd2076; - xor.b64 %rd2078, %rd2077, %rd4212; - xor.b64 %rd2079, %rd2077, %rd4197; - xor.b64 %rd2080, %rd2077, %rd4196; - xor.b64 %rd2081, %rd2077, %rd4195; - xor.b64 %rd2082, %rd2077, %rd4194; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2038, 1; - shr.b64 %rhs, %rd2038, 63; - add.u64 %rd2083, %lhs, %rhs; - } - xor.b64 %rd2084, %rd2083, %rd2050; - xor.b64 %rd2085, %rd2084, %rd4186; - xor.b64 %rd2086, %rd2084, %rd4193; - xor.b64 %rd2087, %rd2084, %rd4192; - xor.b64 %rd2088, %rd2084, %rd4191; - xor.b64 %rd2089, %rd2084, %rd4190; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2064, 1; - shr.b64 %rhs, %rd2064, 63; - add.u64 %rd2090, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2059, 3; - shr.b64 %rhs, %rd2059, 61; - add.u64 %rd2091, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2072, 6; - shr.b64 %rhs, 
%rd2072, 58; - add.u64 %rd2092, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2066, 10; - shr.b64 %rhs, %rd2066, 54; - add.u64 %rd2093, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2074, 15; - shr.b64 %rhs, %rd2074, 49; - add.u64 %rd2094, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2081, 21; - shr.b64 %rhs, %rd2081, 43; - add.u64 %rd2095, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2078, 28; - shr.b64 %rhs, %rd2078, 36; - add.u64 %rd2096, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2058, 36; - shr.b64 %rhs, %rd2058, 28; - add.u64 %rd2097, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2067, 45; - shr.b64 %rhs, %rd2067, 19; - add.u64 %rd2098, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2079, 55; - shr.b64 %rhs, %rd2079, 9; - add.u64 %rd2099, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2068, 2; - shr.b64 %rhs, %rd2068, 62; - add.u64 %rd2100, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2089, 14; - shr.b64 %rhs, %rd2089, 50; - add.u64 %rd2101, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2085, 27; - shr.b64 %rhs, %rd2085, 37; - add.u64 %rd2102, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2060, 41; - shr.b64 %rhs, %rd2060, 23; - add.u64 %rd2103, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2082, 56; - shr.b64 %rhs, %rd2082, 8; - add.u64 %rd2104, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2088, 8; - shr.b64 %rhs, %rd2088, 56; - add.u64 %rd2105, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2080, 25; - shr.b64 %rhs, %rd2080, 39; - add.u64 %rd2106, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2073, 43; - shr.b64 %rhs, %rd2073, 
21; - add.u64 %rd2107, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2071, 62; - shr.b64 %rhs, %rd2071, 2; - add.u64 %rd2108, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2061, 18; - shr.b64 %rhs, %rd2061, 46; - add.u64 %rd2109, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2087, 39; - shr.b64 %rhs, %rd2087, 25; - add.u64 %rd2110, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2075, 61; - shr.b64 %rhs, %rd2075, 3; - add.u64 %rd2111, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2086, 20; - shr.b64 %rhs, %rd2086, 44; - add.u64 %rd2112, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd2065, 44; - shr.b64 %rhs, %rd2065, 20; - add.u64 %rd2113, %lhs, %rhs; - } - not.b64 %rd2114, %rd2113; - and.b64 %rd2115, %rd2107, %rd2114; - not.b64 %rd2116, %rd2107; - and.b64 %rd2117, %rd2095, %rd2116; - xor.b64 %rd4214, %rd2113, %rd2117; - not.b64 %rd2118, %rd2095; - and.b64 %rd2119, %rd2101, %rd2118; - xor.b64 %rd4213, %rd2119, %rd2107; - not.b64 %rd2120, %rd2101; - and.b64 %rd2121, %rd2057, %rd2120; - xor.b64 %rd4212, %rd2121, %rd2095; - not.b64 %rd2122, %rd2057; - and.b64 %rd2123, %rd2113, %rd2122; - xor.b64 %rd4186, %rd2123, %rd2101; - not.b64 %rd2124, %rd2112; - and.b64 %rd2125, %rd2091, %rd2124; - xor.b64 %rd4209, %rd2125, %rd2096; - not.b64 %rd2126, %rd2091; - and.b64 %rd2127, %rd2098, %rd2126; - xor.b64 %rd4205, %rd2127, %rd2112; - not.b64 %rd2128, %rd2098; - and.b64 %rd2129, %rd2111, %rd2128; - xor.b64 %rd4201, %rd2129, %rd2091; - not.b64 %rd2130, %rd2111; - and.b64 %rd2131, %rd2096, %rd2130; - xor.b64 %rd4197, %rd2098, %rd2131; - not.b64 %rd2132, %rd2096; - and.b64 %rd2133, %rd2112, %rd2132; - xor.b64 %rd4193, %rd2133, %rd2111; - not.b64 %rd2134, %rd2092; - and.b64 %rd2135, %rd2106, %rd2134; - xor.b64 %rd4208, %rd2090, %rd2135; - not.b64 %rd2136, %rd2106; - and.b64 %rd2137, %rd2105, %rd2136; - xor.b64 
%rd4204, %rd2137, %rd2092; - not.b64 %rd2138, %rd2105; - and.b64 %rd2139, %rd2109, %rd2138; - xor.b64 %rd4200, %rd2139, %rd2106; - not.b64 %rd2140, %rd2109; - and.b64 %rd2141, %rd2090, %rd2140; - xor.b64 %rd4196, %rd2141, %rd2105; - not.b64 %rd2142, %rd2090; - and.b64 %rd2143, %rd2092, %rd2142; - xor.b64 %rd4192, %rd2143, %rd2109; - not.b64 %rd2144, %rd2097; - and.b64 %rd2145, %rd2093, %rd2144; - xor.b64 %rd4207, %rd2145, %rd2102; - not.b64 %rd2146, %rd2093; - and.b64 %rd2147, %rd2094, %rd2146; - xor.b64 %rd4203, %rd2147, %rd2097; - not.b64 %rd2148, %rd2094; - and.b64 %rd2149, %rd2104, %rd2148; - xor.b64 %rd4199, %rd2093, %rd2149; - not.b64 %rd2150, %rd2104; - and.b64 %rd2151, %rd2102, %rd2150; - xor.b64 %rd4195, %rd2151, %rd2094; - not.b64 %rd2152, %rd2102; - and.b64 %rd2153, %rd2097, %rd2152; - xor.b64 %rd4191, %rd2153, %rd2104; - not.b64 %rd2154, %rd2099; - and.b64 %rd2155, %rd2110, %rd2154; - xor.b64 %rd4206, %rd2155, %rd2108; - not.b64 %rd2156, %rd2110; - and.b64 %rd2157, %rd2103, %rd2156; - xor.b64 %rd4202, %rd2157, %rd2099; - not.b64 %rd2158, %rd2103; - and.b64 %rd2159, %rd2100, %rd2158; - xor.b64 %rd4198, %rd2159, %rd2110; - not.b64 %rd2160, %rd2100; - and.b64 %rd2161, %rd2108, %rd2160; - xor.b64 %rd4194, %rd2161, %rd2103; - not.b64 %rd2162, %rd2108; - and.b64 %rd2163, %rd2099, %rd2162; - xor.b64 %rd4190, %rd2100, %rd2163; - ld.global.nc.u64 %rd2164, [%rd4211]; - xor.b64 %rd2165, %rd2164, %rd2057; - xor.b64 %rd4215, %rd2165, %rd2115; - add.s64 %rd4185, %rd4185, -8; - setp.ne.s64 %p139, %rd4185, 0; - mov.u64 %rd4211, %rd649; - @%p139 bra $L__BB1_200; - - st.local.u64 [%rd599], %rd4202; - st.local.u64 [%rd614], %rd4190; - st.local.u64 [%rd609], %rd4194; - st.local.u64 [%rd600], %rd4213; - st.local.u64 [%rd605], %rd4212; - st.local.u64 [%rd610], %rd4186; - st.local.u64 [%rd591], %rd4209; - st.local.u64 [%rd596], %rd4205; - st.local.u64 [%rd601], %rd4201; - st.local.u64 [%rd606], %rd4197; - st.local.u64 [%rd611], %rd4193; - st.local.u64 [%rd592], %rd4208; - 
st.local.u64 [%rd597], %rd4204; - st.local.u64 [%rd602], %rd4200; - st.local.u64 [%rd607], %rd4196; - st.local.u64 [%rd612], %rd4192; - st.local.u64 [%rd593], %rd4207; - st.local.u64 [%rd598], %rd4203; - st.local.u64 [%rd603], %rd4199; - st.local.u64 [%rd608], %rd4195; - st.local.u64 [%rd613], %rd4191; - st.local.u64 [%rd594], %rd4206; - st.local.u64 [%rd604], %rd4198; - st.local.u64 [%rd595], %rd4214; - st.local.u64 [%rd1], %rd4215; - -$L__BB1_202: - shr.u64 %rd2166, %rd4213, 8; - shr.u64 %rd2167, %rd4213, 16; - shr.u64 %rd2168, %rd4213, 24; - shr.u64 %rd2169, %rd4213, 32; - shr.u64 %rd2170, %rd4213, 40; - shr.u64 %rd2171, %rd4213, 48; - shr.u64 %rd2172, %rd4213, 56; - shr.u64 %rd2173, %rd4212, 8; - shr.u64 %rd2174, %rd4212, 16; - shr.u64 %rd2175, %rd4212, 24; - shr.u64 %rd2176, %rd4215, 8; - shr.u64 %rd2177, %rd4215, 16; - shr.u64 %rd2178, %rd4215, 24; - shr.u64 %rd2179, %rd4215, 32; - shr.u64 %rd2180, %rd4215, 40; - shr.u64 %rd2181, %rd4215, 48; - shr.u64 %rd2182, %rd4215, 56; - shr.u64 %rd2183, %rd4214, 8; - shr.u64 %rd2184, %rd4214, 16; - shr.u64 %rd2185, %rd4214, 24; - shr.u64 %rd2186, %rd4214, 32; - shr.u64 %rd2187, %rd4214, 40; - shr.u64 %rd2188, %rd4214, 48; - shr.u64 %rd2189, %rd4214, 56; - mov.u16 %rs2592, 28; - st.local.u16 [%rd12], %rs2592; - cvt.u16.u64 %rs2593, %rd4215; - cvt.u16.u64 %rs2594, %rd2176; - st.local.v2.u8 [%rd12+2], {%rs2593, %rs2594}; - cvt.u16.u64 %rs2595, %rd2178; - cvt.u16.u64 %rs2596, %rd2177; - st.local.v2.u8 [%rd12+4], {%rs2596, %rs2595}; - cvt.u16.u64 %rs2597, %rd2180; - cvt.u16.u64 %rs2598, %rd2179; - st.local.v2.u8 [%rd12+6], {%rs2598, %rs2597}; - cvt.u16.u64 %rs2599, %rd2182; - cvt.u16.u64 %rs2600, %rd2181; - st.local.v2.u8 [%rd12+8], {%rs2600, %rs2599}; - cvt.u16.u64 %rs2601, %rd4214; - cvt.u16.u64 %rs2602, %rd2183; - st.local.v2.u8 [%rd12+10], {%rs2601, %rs2602}; - cvt.u16.u64 %rs2603, %rd2185; - cvt.u16.u64 %rs2604, %rd2184; - st.local.v2.u8 [%rd12+12], {%rs2604, %rs2603}; - cvt.u16.u64 %rs2605, %rd2187; - cvt.u16.u64 
%rs2606, %rd2186; - st.local.v2.u8 [%rd12+14], {%rs2606, %rs2605}; - cvt.u16.u64 %rs2607, %rd2189; - cvt.u16.u64 %rs2608, %rd2188; - st.local.v2.u8 [%rd12+16], {%rs2608, %rs2607}; - cvt.u16.u64 %rs2609, %rd4213; - cvt.u16.u64 %rs2610, %rd2166; - st.local.v2.u8 [%rd12+18], {%rs2609, %rs2610}; - cvt.u16.u64 %rs2611, %rd2168; - cvt.u16.u64 %rs2612, %rd2167; - st.local.v2.u8 [%rd12+20], {%rs2612, %rs2611}; - cvt.u16.u64 %rs2613, %rd2170; - cvt.u16.u64 %rs2614, %rd2169; - st.local.v2.u8 [%rd12+22], {%rs2614, %rs2613}; - cvt.u16.u64 %rs2615, %rd2172; - cvt.u16.u64 %rs2616, %rd2171; - st.local.v2.u8 [%rd12+24], {%rs2616, %rs2615}; - cvt.u16.u64 %rs2617, %rd4212; - cvt.u16.u64 %rs2618, %rd2173; - st.local.v2.u8 [%rd12+26], {%rs2617, %rs2618}; - cvt.u16.u64 %rs2619, %rd2175; - cvt.u16.u64 %rs2620, %rd2174; - st.local.v2.u8 [%rd12+28], {%rs2620, %rs2619}; - st.local.v2.u8 [%rd12+30], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+32], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+34], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+36], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+38], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+40], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+42], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+44], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+46], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+48], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+50], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+52], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+54], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+56], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+58], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+60], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+62], {%rs2264, %rs2264}; - st.local.v2.u8 [%rd12+64], {%rs2264, %rs2264}; - bra.uni $L__BB1_549; - -$L__BB1_23: - setp.eq.s16 %p3, %rs1380, 9; - @%p3 bra $L__BB1_110; - - setp.eq.s16 %p4, %rs1380, 10; - @%p4 bra $L__BB1_66; - - setp.ne.s16 %p5, %rs1380, 11; - @%p5 bra $L__BB1_470; - - setp.gt.u16 %p15, %rs1, 10; - add.u64 %rd982, 
%SP, 352; - add.u64 %rd13, %SPL, 352; - mov.u16 %rs1383, 0; - st.local.v4.u16 [%rd13], {%rs1383, %rs1383, %rs1383, %rs1383}; - add.s64 %rd983, %rd982, 8; - cvta.to.local.u64 %rd14, %rd983; - st.local.v4.u16 [%rd14], {%rs1383, %rs1383, %rs1383, %rs1383}; - add.s64 %rd984, %rd982, 16; - cvta.to.local.u64 %rd15, %rd984; - st.local.v4.u16 [%rd15], {%rs1383, %rs1383, %rs1383, %rs1383}; - add.s64 %rd985, %rd982, 24; - cvta.to.local.u64 %rd16, %rd985; - st.local.v4.u16 [%rd16], {%rs1383, %rs1383, %rs1383, %rs1383}; - add.s64 %rd986, %rd982, 32; - cvta.to.local.u64 %rd17, %rd986; - st.local.v4.u16 [%rd17], {%rs1383, %rs1383, %rs1383, %rs1383}; - add.s64 %rd987, %rd982, 40; - cvta.to.local.u64 %rd18, %rd987; - st.local.v4.u16 [%rd18], {%rs1383, %rs1383, %rs1383, %rs1383}; - add.s64 %rd988, %rd982, 48; - cvta.to.local.u64 %rd19, %rd988; - st.local.v4.u16 [%rd19], {%rs1383, %rs1383, %rs1383, %rs1383}; - add.s64 %rd989, %rd982, 56; - cvta.to.local.u64 %rd20, %rd989; - st.local.v4.u16 [%rd20], {%rs1383, %rs1383, %rs1383, %rs1383}; - add.s64 %rd990, %rd982, 64; - cvta.to.local.u64 %rd21, %rd990; - st.local.v4.u16 [%rd21], {%rs1383, %rs1383, %rs1383, %rs1383}; - add.s64 %rd22, %rd982, 72; - cvta.to.local.u64 %rd23, %rd22; - st.local.u8 [%rd23], %rs1383; - @%p15 bra $L__BB1_65; - - shr.u64 %rd25, %rd11, 1; - setp.eq.s64 %p16, %rd25, 0; - @%p16 bra $L__BB1_31; - - mov.u64 %rd4032, 1; - mov.u64 %rd4030, %rd979; - mov.u64 %rd4031, %rd13; - bra.uni $L__BB1_29; - -$L__BB1_30: - ld.local.u16 %rs2, [%rd4030+4]; - add.s64 %rd4032, %rd4032, 1; - add.s64 %rd4031, %rd4031, 2; - add.s64 %rd4030, %rd4030, 2; - -$L__BB1_29: - st.local.u16 [%rd4031], %rs2; - setp.ge.u64 %p17, %rd4032, %rd25; - @%p17 bra $L__BB1_31; - bra.uni $L__BB1_30; - -$L__BB1_31: - and.b64 %rd33, %rd11, 1; - setp.eq.s64 %p18, %rd33, 0; - @%p18 bra $L__BB1_34; - - and.b64 %rd995, %rd11, 65534; - cvta.to.local.u64 %rd997, %rd982; - add.s64 %rd34, %rd997, %rd995; - add.s64 %rd998, %rd979, %rd995; - add.s64 %rd35, %rd998, 2; - 
mov.u64 %rd4033, 0; - -$L__BB1_33: - add.s64 %rd999, %rd35, %rd4033; - ld.local.u8 %rs1384, [%rd999]; - add.s64 %rd1000, %rd34, %rd4033; - st.local.u8 [%rd1000], %rs1384; - add.s64 %rd4033, %rd4033, 1; - setp.lt.u64 %p19, %rd4033, %rd33; - @%p19 bra $L__BB1_33; - -$L__BB1_34: - mov.u64 %rd1001, 0; - st.local.u8 [%rd23], %rs1; - ld.local.v4.u16 {%rs1385, %rs1386, %rs1387, %rs1388}, [%rd13]; - ld.local.v4.u16 {%rs1393, %rs1394, %rs1395, %rs1396}, [%rd14]; - ld.local.v4.u16 {%rs1401, %rs1402, %rs1403, %rs1404}, [%rd15]; - ld.local.v4.u16 {%rs1409, %rs1410, %rs1411, %rs1412}, [%rd16]; - ld.local.v4.u16 {%rs1417, %rs1418, %rs1419, %rs1420}, [%rd17]; - shr.u16 %rs1423, %rs1420, 8; - ld.local.v4.u16 {%rs1424, %rs1425, %rs1426, %rs1427}, [%rd18]; - ld.local.v4.u16 {%rs1432, %rs1433, %rs1434, %rs1435}, [%rd19]; - ld.local.v4.u16 {%rs1440, %rs1441, %rs1442, %rs1443}, [%rd20]; - ld.local.v4.u16 {%rs1448, %rs1449, %rs1450, %rs1451}, [%rd21]; - ld.local.v4.u16 {%rs1456, %rs1457, %rs1458, %rs1459}, [%rd23]; - and.b16 %rs1463, %rs1456, 255; - st.local.u64 [%rd1], %rd1001; - st.local.u64 [%rd1+8], %rd1001; - st.local.u64 [%rd1+16], %rd1001; - st.local.u64 [%rd1+24], %rd1001; - st.local.u64 [%rd1+32], %rd1001; - st.local.u64 [%rd1+40], %rd1001; - st.local.u64 [%rd1+48], %rd1001; - st.local.u64 [%rd1+56], %rd1001; - st.local.u64 [%rd1+64], %rd1001; - st.local.u64 [%rd1+72], %rd1001; - st.local.u64 [%rd1+80], %rd1001; - st.local.u64 [%rd1+88], %rd1001; - st.local.u64 [%rd1+96], %rd1001; - st.local.u64 [%rd1+104], %rd1001; - st.local.u64 [%rd1+112], %rd1001; - st.local.u64 [%rd1+120], %rd1001; - st.local.u64 [%rd1+128], %rd1001; - st.local.u64 [%rd1+136], %rd1001; - st.local.u64 [%rd1+144], %rd1001; - st.local.u64 [%rd1+152], %rd1001; - st.local.u64 [%rd1+160], %rd1001; - st.local.u64 [%rd1+168], %rd1001; - st.local.u64 [%rd1+176], %rd1001; - st.local.u64 [%rd1+184], %rd1001; - st.local.u64 [%rd1+192], %rd1001; - st.local.v4.u16 [%rd1+200], {%rs1385, %rs1386, %rs1387, %rs1388}; - 
st.local.v4.u16 [%rd1+208], {%rs1393, %rs1394, %rs1395, %rs1396}; - st.local.v4.u16 [%rd1+216], {%rs1401, %rs1402, %rs1403, %rs1404}; - st.local.v4.u16 [%rd1+224], {%rs1409, %rs1410, %rs1411, %rs1412}; - st.local.v2.u16 [%rd1+232], {%rs1417, %rs1418}; - st.local.u16 [%rd1+236], %rs1419; - st.local.u8 [%rd1+238], %rs1420; - st.local.u8 [%rd1+239], %rs1423; - st.local.v4.u16 [%rd1+240], {%rs1424, %rs1425, %rs1426, %rs1427}; - st.local.v4.u16 [%rd1+248], {%rs1432, %rs1433, %rs1434, %rs1435}; - st.local.v4.u16 [%rd1+256], {%rs1440, %rs1441, %rs1442, %rs1443}; - st.local.v4.u16 [%rd1+264], {%rs1448, %rs1449, %rs1450, %rs1451}; - st.local.v4.u16 [%rd1+272], {%rs1456, %rs1457, %rs1458, %rs1459}; - setp.gt.u16 %p20, %rs1463, 72; - @%p20 bra $L__BB1_64; - - setp.eq.s16 %p21, %rs1463, 72; - @%p21 bra $L__BB1_62; - - cvt.u64.u16 %rd1003, %rs1456; - and.b64 %rd39, %rd1003, 255; - add.s64 %rd1004, %rd1, %rd39; - add.s64 %rd40, %rd1004, 200; - neg.s16 %rs1467, %rs1456; - and.b16 %rs6, %rs1467, 7; - setp.eq.s16 %p22, %rs6, 0; - mov.u64 %rd4040, %rd40; - @%p22 bra $L__BB1_39; - - cvt.u64.u16 %rd1005, %rs6; - neg.s64 %rd4034, %rd1005; - mov.u64 %rd4035, %rd40; - -$L__BB1_38: - .pragma "nounroll"; - add.s64 %rd4040, %rd4035, 1; - st.local.u8 [%rd4035], %rs1383; - add.s64 %rd4034, %rd4034, 1; - setp.ne.s64 %p23, %rd4034, 0; - mov.u64 %rd4035, %rd4040; - @%p23 bra $L__BB1_38; - -$L__BB1_39: - mov.u64 %rd1006, 71; - sub.s64 %rd1007, %rd1006, %rd39; - setp.lt.u64 %p24, %rd1007, 7; - @%p24 bra $L__BB1_46; - - add.s64 %rd1008, %rd1, 264; - sub.s64 %rd49, %rd1008, %rd4040; - shr.u64 %rd1009, %rd49, 3; - add.s64 %rd1010, %rd1009, 1; - and.b64 %rd50, %rd1010, 3; - setp.eq.s64 %p25, %rd50, 0; - mov.u64 %rd4043, %rd4040; - @%p25 bra $L__BB1_43; - - neg.s64 %rd4037, %rd50; - mov.u64 %rd4039, %rd4040; - -$L__BB1_42: - .pragma "nounroll"; - st.local.u8 [%rd4039], %rs1383; - st.local.u8 [%rd4039+1], %rs1383; - st.local.u8 [%rd4039+2], %rs1383; - st.local.u8 [%rd4039+3], %rs1383; - st.local.u8 
[%rd4039+4], %rs1383; - st.local.u8 [%rd4039+5], %rs1383; - st.local.u8 [%rd4039+6], %rs1383; - add.s64 %rd4040, %rd4040, 8; - add.s64 %rd4043, %rd4039, 8; - st.local.u8 [%rd4039+7], %rs1383; - add.s64 %rd4037, %rd4037, 1; - setp.ne.s64 %p26, %rd4037, 0; - mov.u64 %rd4039, %rd4043; - @%p26 bra $L__BB1_42; - -$L__BB1_43: - setp.lt.u64 %p27, %rd49, 24; - @%p27 bra $L__BB1_46; - - sub.s64 %rd1011, %rd1, %rd4040; - add.s64 %rd4042, %rd1011, 272; - -$L__BB1_45: - st.local.u8 [%rd4043], %rs1383; - st.local.u8 [%rd4043+1], %rs1383; - st.local.u8 [%rd4043+2], %rs1383; - st.local.u8 [%rd4043+3], %rs1383; - st.local.u8 [%rd4043+4], %rs1383; - st.local.u8 [%rd4043+5], %rs1383; - st.local.u8 [%rd4043+6], %rs1383; - st.local.u8 [%rd4043+7], %rs1383; - st.local.u8 [%rd4043+8], %rs1383; - st.local.u8 [%rd4043+9], %rs1383; - st.local.u8 [%rd4043+10], %rs1383; - st.local.u8 [%rd4043+11], %rs1383; - st.local.u8 [%rd4043+12], %rs1383; - st.local.u8 [%rd4043+13], %rs1383; - st.local.u8 [%rd4043+14], %rs1383; - st.local.u8 [%rd4043+15], %rs1383; - st.local.u8 [%rd4043+16], %rs1383; - st.local.u8 [%rd4043+17], %rs1383; - st.local.u8 [%rd4043+18], %rs1383; - st.local.u8 [%rd4043+19], %rs1383; - st.local.u8 [%rd4043+20], %rs1383; - st.local.u8 [%rd4043+21], %rs1383; - st.local.u8 [%rd4043+22], %rs1383; - st.local.u8 [%rd4043+23], %rs1383; - st.local.u8 [%rd4043+24], %rs1383; - st.local.u8 [%rd4043+25], %rs1383; - st.local.u8 [%rd4043+26], %rs1383; - st.local.u8 [%rd4043+27], %rs1383; - st.local.u8 [%rd4043+28], %rs1383; - st.local.u8 [%rd4043+29], %rs1383; - st.local.u8 [%rd4043+30], %rs1383; - st.local.u8 [%rd4043+31], %rs1383; - add.s64 %rd4042, %rd4042, -32; - setp.ne.s64 %p28, %rd4042, 0; - add.s64 %rd4043, %rd4043, 32; - @%p28 bra $L__BB1_45; - -$L__BB1_46: - st.local.u8 [%rd1+272], %rs1383; - setp.gt.u16 %p29, %rs1463, 71; - @%p29 bra $L__BB1_63; - - mov.u16 %rs1473, 6; - st.local.u8 [%rd40], %rs1473; - ld.local.u8 %rs1474, [%rd1+271]; - or.b16 %rs1475, %rs1474, 128; - st.local.u8 
[%rd1+271], %rs1475; - ld.local.u64 %rd1012, [%rd1+200]; - shl.b64 %rd1013, %rd1012, 8; - mov.b64 {%r305, %r306}, %rd1013; - shr.u64 %rd1014, %rd1012, 56; - mov.b64 {%r307, %r308}, %rd1014; - mov.b32 {%rs15, %rs1476}, %r307; - mov.b32 {%rs11, %rs13}, %r306; - shr.u16 %rs14, %rs13, 8; - shr.u16 %rs12, %rs11, 8; - mov.b32 {%rs7, %rs9}, %r305; - shr.u16 %rs10, %rs9, 8; - shr.u16 %rs8, %rs7, 8; - mov.pred %p30, 0; - @%p30 bra $L__BB1_56; - - shl.b16 %rs1477, %rs9, 8; - or.b16 %rs1478, %rs8, %rs1477; - shl.b16 %rs1479, %rs11, 8; - or.b16 %rs1480, %rs10, %rs1479; - mov.b32 %r309, {%rs1478, %rs1480}; - shl.b16 %rs1481, %rs13, 8; - or.b16 %rs1482, %rs12, %rs1481; - shl.b16 %rs1483, %rs15, 8; - or.b16 %rs1484, %rs14, %rs1483; - mov.b32 %r310, {%rs1482, %rs1484}; - mov.b64 %rd1015, {%r309, %r310}; - ld.local.u64 %rd1016, [%rd1]; - xor.b64 %rd4078, %rd1016, %rd1015; - st.local.u64 [%rd1], %rd4078; - ld.local.u64 %rd1017, [%rd1+208]; - shl.b64 %rd1018, %rd1017, 8; - mov.b64 {%r311, %r312}, %rd1018; - shr.u64 %rd1019, %rd1017, 56; - mov.b64 {%r313, %r314}, %rd1019; - mov.b32 {%rs24, %rs1485}, %r313; - mov.b32 {%rs20, %rs22}, %r312; - shr.u16 %rs23, %rs22, 8; - shr.u16 %rs21, %rs20, 8; - mov.b32 {%rs16, %rs18}, %r311; - shr.u16 %rs19, %rs18, 8; - shr.u16 %rs17, %rs16, 8; - @%p30 bra $L__BB1_56; - - shl.b16 %rs1486, %rs18, 8; - or.b16 %rs1487, %rs17, %rs1486; - shl.b16 %rs1488, %rs20, 8; - or.b16 %rs1489, %rs19, %rs1488; - mov.b32 %r315, {%rs1487, %rs1489}; - shl.b16 %rs1490, %rs22, 8; - or.b16 %rs1491, %rs21, %rs1490; - shl.b16 %rs1492, %rs24, 8; - or.b16 %rs1493, %rs23, %rs1492; - mov.b32 %r316, {%rs1491, %rs1493}; - mov.b64 %rd1020, {%r315, %r316}; - ld.local.u64 %rd1021, [%rd1+8]; - xor.b64 %rd4077, %rd1021, %rd1020; - st.local.u64 [%rd1+8], %rd4077; - ld.local.u64 %rd1022, [%rd1+216]; - shl.b64 %rd1023, %rd1022, 8; - mov.b64 {%r317, %r318}, %rd1023; - shr.u64 %rd1024, %rd1022, 56; - mov.b64 {%r319, %r320}, %rd1024; - mov.b32 {%rs33, %rs1494}, %r319; - mov.b32 {%rs29, %rs31}, 
%r318; - shr.u16 %rs32, %rs31, 8; - shr.u16 %rs30, %rs29, 8; - mov.b32 {%rs25, %rs27}, %r317; - shr.u16 %rs28, %rs27, 8; - shr.u16 %rs26, %rs25, 8; - @%p30 bra $L__BB1_56; - - shl.b16 %rs1495, %rs27, 8; - or.b16 %rs1496, %rs26, %rs1495; - shl.b16 %rs1497, %rs29, 8; - or.b16 %rs1498, %rs28, %rs1497; - mov.b32 %r321, {%rs1496, %rs1498}; - shl.b16 %rs1499, %rs31, 8; - or.b16 %rs1500, %rs30, %rs1499; - shl.b16 %rs1501, %rs33, 8; - or.b16 %rs1502, %rs32, %rs1501; - mov.b32 %r322, {%rs1500, %rs1502}; - mov.b64 %rd1025, {%r321, %r322}; - ld.local.u64 %rd1026, [%rd1+16]; - xor.b64 %rd4076, %rd1026, %rd1025; - st.local.u64 [%rd1+16], %rd4076; - ld.local.u64 %rd1027, [%rd1+224]; - shl.b64 %rd1028, %rd1027, 8; - mov.b64 {%r323, %r324}, %rd1028; - shr.u64 %rd1029, %rd1027, 56; - mov.b64 {%r325, %r326}, %rd1029; - mov.b32 {%rs42, %rs1503}, %r325; - mov.b32 {%rs38, %rs40}, %r324; - shr.u16 %rs41, %rs40, 8; - shr.u16 %rs39, %rs38, 8; - mov.b32 {%rs34, %rs36}, %r323; - shr.u16 %rs37, %rs36, 8; - shr.u16 %rs35, %rs34, 8; - @%p30 bra $L__BB1_56; - - shl.b16 %rs1504, %rs36, 8; - or.b16 %rs1505, %rs35, %rs1504; - shl.b16 %rs1506, %rs38, 8; - or.b16 %rs1507, %rs37, %rs1506; - mov.b32 %r327, {%rs1505, %rs1507}; - shl.b16 %rs1508, %rs40, 8; - or.b16 %rs1509, %rs39, %rs1508; - shl.b16 %rs1510, %rs42, 8; - or.b16 %rs1511, %rs41, %rs1510; - mov.b32 %r328, {%rs1509, %rs1511}; - mov.b64 %rd1030, {%r327, %r328}; - ld.local.u64 %rd1031, [%rd1+24]; - xor.b64 %rd4075, %rd1031, %rd1030; - st.local.u64 [%rd1+24], %rd4075; - ld.local.u64 %rd1032, [%rd1+232]; - shl.b64 %rd1033, %rd1032, 8; - mov.b64 {%r329, %r330}, %rd1033; - shr.u64 %rd1034, %rd1032, 56; - mov.b64 {%r331, %r332}, %rd1034; - mov.b32 {%rs51, %rs1512}, %r331; - mov.b32 {%rs47, %rs49}, %r330; - shr.u16 %rs50, %rs49, 8; - shr.u16 %rs48, %rs47, 8; - mov.b32 {%rs43, %rs45}, %r329; - shr.u16 %rs46, %rs45, 8; - shr.u16 %rs44, %rs43, 8; - @%p30 bra $L__BB1_56; - - shl.b16 %rs1513, %rs45, 8; - or.b16 %rs1514, %rs44, %rs1513; - shl.b16 %rs1515, 
%rs47, 8; - or.b16 %rs1516, %rs46, %rs1515; - mov.b32 %r333, {%rs1514, %rs1516}; - shl.b16 %rs1517, %rs49, 8; - or.b16 %rs1518, %rs48, %rs1517; - shl.b16 %rs1519, %rs51, 8; - or.b16 %rs1520, %rs50, %rs1519; - mov.b32 %r334, {%rs1518, %rs1520}; - mov.b64 %rd1035, {%r333, %r334}; - ld.local.u64 %rd1036, [%rd1+32]; - xor.b64 %rd4074, %rd1036, %rd1035; - st.local.u64 [%rd1+32], %rd4074; - ld.local.u64 %rd1037, [%rd1+240]; - shl.b64 %rd1038, %rd1037, 8; - mov.b64 {%r335, %r336}, %rd1038; - shr.u64 %rd1039, %rd1037, 56; - mov.b64 {%r337, %r338}, %rd1039; - mov.b32 {%rs60, %rs1521}, %r337; - mov.b32 {%rs56, %rs58}, %r336; - shr.u16 %rs59, %rs58, 8; - shr.u16 %rs57, %rs56, 8; - mov.b32 {%rs52, %rs54}, %r335; - shr.u16 %rs55, %rs54, 8; - shr.u16 %rs53, %rs52, 8; - @%p30 bra $L__BB1_56; - - shl.b16 %rs1522, %rs54, 8; - or.b16 %rs1523, %rs53, %rs1522; - shl.b16 %rs1524, %rs56, 8; - or.b16 %rs1525, %rs55, %rs1524; - mov.b32 %r339, {%rs1523, %rs1525}; - shl.b16 %rs1526, %rs58, 8; - or.b16 %rs1527, %rs57, %rs1526; - shl.b16 %rs1528, %rs60, 8; - or.b16 %rs1529, %rs59, %rs1528; - mov.b32 %r340, {%rs1527, %rs1529}; - mov.b64 %rd1040, {%r339, %r340}; - ld.local.u64 %rd1041, [%rd1+40]; - xor.b64 %rd4073, %rd1041, %rd1040; - st.local.u64 [%rd1+40], %rd4073; - ld.local.u64 %rd1042, [%rd1+248]; - shl.b64 %rd1043, %rd1042, 8; - mov.b64 {%r341, %r342}, %rd1043; - shr.u64 %rd1044, %rd1042, 56; - mov.b64 {%r343, %r344}, %rd1044; - mov.b32 {%rs69, %rs1530}, %r343; - mov.b32 {%rs65, %rs67}, %r342; - shr.u16 %rs68, %rs67, 8; - shr.u16 %rs66, %rs65, 8; - mov.b32 {%rs61, %rs63}, %r341; - shr.u16 %rs64, %rs63, 8; - shr.u16 %rs62, %rs61, 8; - @%p30 bra $L__BB1_56; - - shl.b16 %rs1531, %rs63, 8; - or.b16 %rs1532, %rs62, %rs1531; - shl.b16 %rs1533, %rs65, 8; - or.b16 %rs1534, %rs64, %rs1533; - mov.b32 %r345, {%rs1532, %rs1534}; - shl.b16 %rs1535, %rs67, 8; - or.b16 %rs1536, %rs66, %rs1535; - shl.b16 %rs1537, %rs69, 8; - or.b16 %rs1538, %rs68, %rs1537; - mov.b32 %r346, {%rs1536, %rs1538}; - mov.b64 
%rd1045, {%r345, %r346}; - ld.local.u64 %rd1046, [%rd1+48]; - xor.b64 %rd4072, %rd1046, %rd1045; - st.local.u64 [%rd1+48], %rd4072; - ld.local.u64 %rd1047, [%rd1+256]; - shl.b64 %rd1048, %rd1047, 8; - mov.b64 {%r347, %r348}, %rd1048; - shr.u64 %rd1049, %rd1047, 56; - mov.b64 {%r349, %r350}, %rd1049; - mov.b32 {%rs78, %rs1539}, %r349; - mov.b32 {%rs74, %rs76}, %r348; - shr.u16 %rs77, %rs76, 8; - shr.u16 %rs75, %rs74, 8; - mov.b32 {%rs70, %rs72}, %r347; - shr.u16 %rs73, %rs72, 8; - shr.u16 %rs71, %rs70, 8; - @%p30 bra $L__BB1_56; - - shl.b16 %rs1540, %rs72, 8; - or.b16 %rs1541, %rs71, %rs1540; - shl.b16 %rs1542, %rs74, 8; - or.b16 %rs1543, %rs73, %rs1542; - mov.b32 %r351, {%rs1541, %rs1543}; - shl.b16 %rs1544, %rs76, 8; - or.b16 %rs1545, %rs75, %rs1544; - shl.b16 %rs1546, %rs78, 8; - or.b16 %rs1547, %rs77, %rs1546; - mov.b32 %r352, {%rs1545, %rs1547}; - mov.b64 %rd1050, {%r351, %r352}; - ld.local.u64 %rd1051, [%rd1+56]; - xor.b64 %rd4071, %rd1051, %rd1050; - st.local.u64 [%rd1+56], %rd4071; - ld.local.u64 %rd1052, [%rd1+264]; - shl.b64 %rd1053, %rd1052, 8; - mov.b64 {%r353, %r354}, %rd1053; - shr.u64 %rd1054, %rd1052, 56; - mov.b64 {%r355, %r356}, %rd1054; - mov.b32 {%rs87, %rs1548}, %r355; - mov.b32 {%rs83, %rs85}, %r354; - shr.u16 %rs86, %rs85, 8; - shr.u16 %rs84, %rs83, 8; - mov.b32 {%rs79, %rs81}, %r353; - shr.u16 %rs82, %rs81, 8; - shr.u16 %rs80, %rs79, 8; - mov.pred %p38, -1; - @%p38 bra $L__BB1_57; - bra.uni $L__BB1_56; - -$L__BB1_57: - shl.b16 %rs1549, %rs81, 8; - or.b16 %rs1550, %rs80, %rs1549; - shl.b16 %rs1551, %rs83, 8; - or.b16 %rs1552, %rs82, %rs1551; - mov.b32 %r357, {%rs1550, %rs1552}; - shl.b16 %rs1553, %rs85, 8; - or.b16 %rs1554, %rs84, %rs1553; - shl.b16 %rs1555, %rs87, 8; - or.b16 %rs1556, %rs86, %rs1555; - mov.b32 %r358, {%rs1554, %rs1556}; - mov.b64 %rd1055, {%r357, %r358}; - ld.local.u64 %rd1056, [%rd1+64]; - xor.b64 %rd4056, %rd1056, %rd1055; - st.local.u64 [%rd1+64], %rd4056; - @%p30 bra $L__BB1_61; - - add.s64 %rd1060, %rd968, 40; - 
cvta.to.local.u64 %rd75, %rd1060; - add.s64 %rd1061, %rd968, 80; - cvta.to.local.u64 %rd76, %rd1061; - add.s64 %rd1062, %rd968, 120; - cvta.to.local.u64 %rd77, %rd1062; - add.s64 %rd1063, %rd968, 160; - cvta.to.local.u64 %rd78, %rd1063; - add.s64 %rd1064, %rd968, 8; - cvta.to.local.u64 %rd79, %rd1064; - add.s64 %rd1065, %rd968, 48; - cvta.to.local.u64 %rd80, %rd1065; - add.s64 %rd1066, %rd968, 88; - cvta.to.local.u64 %rd81, %rd1066; - add.s64 %rd1067, %rd968, 128; - cvta.to.local.u64 %rd82, %rd1067; - add.s64 %rd1068, %rd968, 168; - cvta.to.local.u64 %rd83, %rd1068; - add.s64 %rd1069, %rd968, 16; - cvta.to.local.u64 %rd84, %rd1069; - add.s64 %rd1070, %rd968, 56; - cvta.to.local.u64 %rd85, %rd1070; - add.s64 %rd1071, %rd968, 96; - cvta.to.local.u64 %rd86, %rd1071; - add.s64 %rd1072, %rd968, 136; - cvta.to.local.u64 %rd87, %rd1072; - add.s64 %rd1073, %rd968, 176; - cvta.to.local.u64 %rd88, %rd1073; - add.s64 %rd1074, %rd968, 24; - cvta.to.local.u64 %rd89, %rd1074; - add.s64 %rd1075, %rd968, 64; - cvta.to.local.u64 %rd90, %rd1075; - add.s64 %rd1076, %rd968, 104; - cvta.to.local.u64 %rd91, %rd1076; - add.s64 %rd1077, %rd968, 144; - cvta.to.local.u64 %rd92, %rd1077; - add.s64 %rd1078, %rd968, 184; - cvta.to.local.u64 %rd93, %rd1078; - add.s64 %rd1079, %rd968, 32; - cvta.to.local.u64 %rd94, %rd1079; - add.s64 %rd1080, %rd968, 72; - cvta.to.local.u64 %rd95, %rd1080; - add.s64 %rd1081, %rd968, 112; - cvta.to.local.u64 %rd96, %rd1081; - add.s64 %rd1082, %rd968, 152; - cvta.to.local.u64 %rd97, %rd1082; - add.s64 %rd1083, %rd968, 192; - mov.u64 %rd4044, 192; - cvta.to.local.u64 %rd98, %rd1083; - ld.local.u64 %rd4067, [%rd76]; - ld.local.u64 %rd4066, [%rd77]; - ld.local.u64 %rd4065, [%rd78]; - ld.local.u64 %rd4063, [%rd81]; - ld.local.u64 %rd4062, [%rd82]; - ld.local.u64 %rd4061, [%rd83]; - ld.local.u64 %rd4059, [%rd86]; - ld.local.u64 %rd4058, [%rd87]; - ld.local.u64 %rd4057, [%rd88]; - ld.local.u64 %rd4055, [%rd91]; - ld.local.u64 %rd4054, [%rd92]; - ld.local.u64 %rd4053, 
[%rd93]; - ld.local.u64 %rd4052, [%rd95]; - ld.local.u64 %rd4051, [%rd96]; - ld.local.u64 %rd4050, [%rd97]; - ld.local.u64 %rd4049, [%rd98]; - mov.u64 %rd4070, private$9214; - -$L__BB1_59: - add.s64 %rd142, %rd4070, 8; - xor.b64 %rd1084, %rd4066, %rd4065; - xor.b64 %rd1085, %rd1084, %rd4067; - xor.b64 %rd1086, %rd1085, %rd4073; - xor.b64 %rd1087, %rd1086, %rd4078; - xor.b64 %rd1088, %rd4061, %rd4077; - xor.b64 %rd1089, %rd1088, %rd4062; - xor.b64 %rd1090, %rd1089, %rd4063; - xor.b64 %rd1091, %rd1090, %rd4072; - xor.b64 %rd1092, %rd4057, %rd4076; - xor.b64 %rd1093, %rd1092, %rd4058; - xor.b64 %rd1094, %rd1093, %rd4059; - xor.b64 %rd1095, %rd1094, %rd4071; - xor.b64 %rd1096, %rd4053, %rd4075; - xor.b64 %rd1097, %rd1096, %rd4054; - xor.b64 %rd1098, %rd1097, %rd4055; - xor.b64 %rd1099, %rd1098, %rd4056; - xor.b64 %rd1100, %rd4049, %rd4074; - xor.b64 %rd1101, %rd1100, %rd4050; - xor.b64 %rd1102, %rd1101, %rd4051; - xor.b64 %rd1103, %rd1102, %rd4052; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1091, 1; - shr.b64 %rhs, %rd1091, 63; - add.u64 %rd1104, %lhs, %rhs; - } - xor.b64 %rd1105, %rd1104, %rd1103; - xor.b64 %rd1106, %rd4078, %rd1105; - xor.b64 %rd1107, %rd1105, %rd4073; - xor.b64 %rd1108, %rd1105, %rd4067; - xor.b64 %rd1109, %rd1105, %rd4066; - xor.b64 %rd1110, %rd1105, %rd4065; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1095, 1; - shr.b64 %rhs, %rd1095, 63; - add.u64 %rd1111, %lhs, %rhs; - } - xor.b64 %rd1112, %rd1087, %rd1111; - xor.b64 %rd1113, %rd1112, %rd4077; - xor.b64 %rd1114, %rd1112, %rd4072; - xor.b64 %rd1115, %rd1112, %rd4063; - xor.b64 %rd1116, %rd1112, %rd4062; - xor.b64 %rd1117, %rd1112, %rd4061; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1099, 1; - shr.b64 %rhs, %rd1099, 63; - add.u64 %rd1118, %lhs, %rhs; - } - xor.b64 %rd1119, %rd1091, %rd1118; - xor.b64 %rd1120, %rd1119, %rd4076; - xor.b64 %rd1121, %rd1119, %rd4071; - xor.b64 %rd1122, %rd1119, %rd4059; - xor.b64 %rd1123, %rd1119, %rd4058; - xor.b64 
%rd1124, %rd1119, %rd4057; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1103, 1; - shr.b64 %rhs, %rd1103, 63; - add.u64 %rd1125, %lhs, %rhs; - } - xor.b64 %rd1126, %rd1095, %rd1125; - xor.b64 %rd1127, %rd1126, %rd4075; - xor.b64 %rd1128, %rd1126, %rd4056; - xor.b64 %rd1129, %rd1126, %rd4055; - xor.b64 %rd1130, %rd1126, %rd4054; - xor.b64 %rd1131, %rd1126, %rd4053; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1087, 1; - shr.b64 %rhs, %rd1087, 63; - add.u64 %rd1132, %lhs, %rhs; - } - xor.b64 %rd1133, %rd1132, %rd1099; - xor.b64 %rd1134, %rd1133, %rd4074; - xor.b64 %rd1135, %rd1133, %rd4052; - xor.b64 %rd1136, %rd1133, %rd4051; - xor.b64 %rd1137, %rd1133, %rd4050; - xor.b64 %rd1138, %rd1133, %rd4049; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1113, 1; - shr.b64 %rhs, %rd1113, 63; - add.u64 %rd1139, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1108, 3; - shr.b64 %rhs, %rd1108, 61; - add.u64 %rd1140, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1121, 6; - shr.b64 %rhs, %rd1121, 58; - add.u64 %rd1141, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1115, 10; - shr.b64 %rhs, %rd1115, 54; - add.u64 %rd1142, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1123, 15; - shr.b64 %rhs, %rd1123, 49; - add.u64 %rd1143, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1130, 21; - shr.b64 %rhs, %rd1130, 43; - add.u64 %rd1144, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1127, 28; - shr.b64 %rhs, %rd1127, 36; - add.u64 %rd1145, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1107, 36; - shr.b64 %rhs, %rd1107, 28; - add.u64 %rd1146, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1116, 45; - shr.b64 %rhs, %rd1116, 19; - add.u64 %rd1147, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1128, 55; - 
shr.b64 %rhs, %rd1128, 9; - add.u64 %rd1148, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1117, 2; - shr.b64 %rhs, %rd1117, 62; - add.u64 %rd1149, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1138, 14; - shr.b64 %rhs, %rd1138, 50; - add.u64 %rd1150, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1134, 27; - shr.b64 %rhs, %rd1134, 37; - add.u64 %rd1151, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1109, 41; - shr.b64 %rhs, %rd1109, 23; - add.u64 %rd1152, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1131, 56; - shr.b64 %rhs, %rd1131, 8; - add.u64 %rd1153, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1137, 8; - shr.b64 %rhs, %rd1137, 56; - add.u64 %rd1154, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1129, 25; - shr.b64 %rhs, %rd1129, 39; - add.u64 %rd1155, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1122, 43; - shr.b64 %rhs, %rd1122, 21; - add.u64 %rd1156, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1120, 62; - shr.b64 %rhs, %rd1120, 2; - add.u64 %rd1157, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1110, 18; - shr.b64 %rhs, %rd1110, 46; - add.u64 %rd1158, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1136, 39; - shr.b64 %rhs, %rd1136, 25; - add.u64 %rd1159, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1124, 61; - shr.b64 %rhs, %rd1124, 3; - add.u64 %rd1160, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1135, 20; - shr.b64 %rhs, %rd1135, 44; - add.u64 %rd1161, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1114, 44; - shr.b64 %rhs, %rd1114, 20; - add.u64 %rd1162, %lhs, %rhs; - } - not.b64 %rd1163, %rd1162; - and.b64 %rd1164, %rd1156, %rd1163; - not.b64 
%rd1165, %rd1156; - and.b64 %rd1166, %rd1144, %rd1165; - xor.b64 %rd4077, %rd1162, %rd1166; - not.b64 %rd1167, %rd1144; - and.b64 %rd1168, %rd1150, %rd1167; - xor.b64 %rd4076, %rd1168, %rd1156; - not.b64 %rd1169, %rd1150; - and.b64 %rd1170, %rd1106, %rd1169; - xor.b64 %rd4075, %rd1170, %rd1144; - not.b64 %rd1171, %rd1106; - and.b64 %rd1172, %rd1162, %rd1171; - xor.b64 %rd4074, %rd1172, %rd1150; - not.b64 %rd1173, %rd1161; - and.b64 %rd1174, %rd1140, %rd1173; - xor.b64 %rd4073, %rd1174, %rd1145; - not.b64 %rd1175, %rd1140; - and.b64 %rd1176, %rd1147, %rd1175; - xor.b64 %rd4072, %rd1176, %rd1161; - not.b64 %rd1177, %rd1147; - and.b64 %rd1178, %rd1160, %rd1177; - xor.b64 %rd4071, %rd1178, %rd1140; - not.b64 %rd1179, %rd1160; - and.b64 %rd1180, %rd1145, %rd1179; - xor.b64 %rd4056, %rd1147, %rd1180; - not.b64 %rd1181, %rd1145; - and.b64 %rd1182, %rd1161, %rd1181; - xor.b64 %rd4052, %rd1182, %rd1160; - not.b64 %rd1183, %rd1141; - and.b64 %rd1184, %rd1155, %rd1183; - xor.b64 %rd4067, %rd1139, %rd1184; - not.b64 %rd1185, %rd1155; - and.b64 %rd1186, %rd1154, %rd1185; - xor.b64 %rd4063, %rd1186, %rd1141; - not.b64 %rd1187, %rd1154; - and.b64 %rd1188, %rd1158, %rd1187; - xor.b64 %rd4059, %rd1188, %rd1155; - not.b64 %rd1189, %rd1158; - and.b64 %rd1190, %rd1139, %rd1189; - xor.b64 %rd4055, %rd1190, %rd1154; - not.b64 %rd1191, %rd1139; - and.b64 %rd1192, %rd1141, %rd1191; - xor.b64 %rd4051, %rd1192, %rd1158; - not.b64 %rd1193, %rd1146; - and.b64 %rd1194, %rd1142, %rd1193; - xor.b64 %rd4066, %rd1194, %rd1151; - not.b64 %rd1195, %rd1142; - and.b64 %rd1196, %rd1143, %rd1195; - xor.b64 %rd4062, %rd1196, %rd1146; - not.b64 %rd1197, %rd1143; - and.b64 %rd1198, %rd1153, %rd1197; - xor.b64 %rd4058, %rd1142, %rd1198; - not.b64 %rd1199, %rd1153; - and.b64 %rd1200, %rd1151, %rd1199; - xor.b64 %rd4054, %rd1200, %rd1143; - not.b64 %rd1201, %rd1151; - and.b64 %rd1202, %rd1146, %rd1201; - xor.b64 %rd4050, %rd1202, %rd1153; - not.b64 %rd1203, %rd1148; - and.b64 %rd1204, %rd1159, %rd1203; - 
xor.b64 %rd4065, %rd1204, %rd1157; - not.b64 %rd1205, %rd1159; - and.b64 %rd1206, %rd1152, %rd1205; - xor.b64 %rd4061, %rd1206, %rd1148; - not.b64 %rd1207, %rd1152; - and.b64 %rd1208, %rd1149, %rd1207; - xor.b64 %rd4057, %rd1208, %rd1159; - not.b64 %rd1209, %rd1149; - and.b64 %rd1210, %rd1157, %rd1209; - xor.b64 %rd4053, %rd1210, %rd1152; - not.b64 %rd1211, %rd1157; - and.b64 %rd1212, %rd1148, %rd1211; - xor.b64 %rd4049, %rd1149, %rd1212; - ld.global.nc.u64 %rd1213, [%rd4070]; - xor.b64 %rd1214, %rd1213, %rd1106; - xor.b64 %rd4078, %rd1214, %rd1164; - add.s64 %rd4044, %rd4044, -8; - setp.ne.s64 %p40, %rd4044, 0; - mov.u64 %rd4070, %rd142; - @%p40 bra $L__BB1_59; - - st.local.u64 [%rd83], %rd4061; - st.local.u64 [%rd98], %rd4049; - st.local.u64 [%rd93], %rd4053; - st.local.u64 [%rd84], %rd4076; - st.local.u64 [%rd89], %rd4075; - st.local.u64 [%rd94], %rd4074; - st.local.u64 [%rd75], %rd4073; - st.local.u64 [%rd80], %rd4072; - st.local.u64 [%rd85], %rd4071; - st.local.u64 [%rd90], %rd4056; - st.local.u64 [%rd95], %rd4052; - st.local.u64 [%rd76], %rd4067; - st.local.u64 [%rd81], %rd4063; - st.local.u64 [%rd86], %rd4059; - st.local.u64 [%rd91], %rd4055; - st.local.u64 [%rd96], %rd4051; - st.local.u64 [%rd77], %rd4066; - st.local.u64 [%rd82], %rd4062; - st.local.u64 [%rd87], %rd4058; - st.local.u64 [%rd92], %rd4054; - st.local.u64 [%rd97], %rd4050; - st.local.u64 [%rd78], %rd4065; - st.local.u64 [%rd88], %rd4057; - st.local.u64 [%rd79], %rd4077; - st.local.u64 [%rd1], %rd4078; - -$L__BB1_61: - shr.u64 %rd1215, %rd4076, 8; - shr.u64 %rd1216, %rd4076, 16; - shr.u64 %rd1217, %rd4076, 24; - shr.u64 %rd1218, %rd4076, 32; - shr.u64 %rd1219, %rd4076, 40; - shr.u64 %rd1220, %rd4076, 48; - shr.u64 %rd1221, %rd4076, 56; - shr.u64 %rd1222, %rd4075, 8; - shr.u64 %rd1223, %rd4075, 16; - shr.u64 %rd1224, %rd4075, 24; - shr.u64 %rd1225, %rd4075, 32; - shr.u64 %rd1226, %rd4075, 40; - shr.u64 %rd1227, %rd4075, 48; - shr.u64 %rd1228, %rd4075, 56; - shr.u64 %rd1229, %rd4074, 8; - shr.u64 
%rd1230, %rd4074, 16; - shr.u64 %rd1231, %rd4074, 24; - shr.u64 %rd1232, %rd4074, 32; - shr.u64 %rd1233, %rd4074, 40; - shr.u64 %rd1234, %rd4074, 48; - shr.u64 %rd1235, %rd4074, 56; - shr.u64 %rd1236, %rd4073, 8; - shr.u64 %rd1237, %rd4073, 16; - shr.u64 %rd1238, %rd4073, 24; - shr.u64 %rd1239, %rd4073, 32; - shr.u64 %rd1240, %rd4073, 40; - shr.u64 %rd1241, %rd4073, 48; - shr.u64 %rd1242, %rd4073, 56; - shr.u64 %rd1243, %rd4072, 8; - shr.u64 %rd1244, %rd4072, 16; - shr.u64 %rd1245, %rd4072, 24; - shr.u64 %rd1246, %rd4072, 32; - shr.u64 %rd1247, %rd4072, 40; - shr.u64 %rd1248, %rd4072, 48; - shr.u64 %rd1249, %rd4072, 56; - shr.u64 %rd1250, %rd4071, 8; - shr.u64 %rd1251, %rd4071, 16; - shr.u64 %rd1252, %rd4071, 24; - shr.u64 %rd1253, %rd4071, 32; - shr.u64 %rd1254, %rd4071, 40; - shr.u64 %rd1255, %rd4071, 48; - shr.u64 %rd1256, %rd4071, 56; - shr.u64 %rd1257, %rd4078, 8; - shr.u64 %rd1258, %rd4078, 16; - shr.u64 %rd1259, %rd4078, 24; - shr.u64 %rd1260, %rd4078, 32; - shr.u64 %rd1261, %rd4078, 40; - shr.u64 %rd1262, %rd4078, 48; - shr.u64 %rd1263, %rd4078, 56; - shr.u64 %rd1264, %rd4077, 8; - shr.u64 %rd1265, %rd4077, 16; - shr.u64 %rd1266, %rd4077, 24; - shr.u64 %rd1267, %rd4077, 32; - shr.u64 %rd1268, %rd4077, 40; - shr.u64 %rd1269, %rd4077, 48; - shr.u64 %rd1270, %rd4077, 56; - mov.u16 %rs1557, 64; - st.local.u16 [%rd12], %rs1557; - cvt.u16.u64 %rs1558, %rd4078; - cvt.u16.u64 %rs1559, %rd1257; - st.local.v2.u8 [%rd12+2], {%rs1558, %rs1559}; - cvt.u16.u64 %rs1560, %rd1259; - cvt.u16.u64 %rs1561, %rd1258; - st.local.v2.u8 [%rd12+4], {%rs1561, %rs1560}; - cvt.u16.u64 %rs1562, %rd1261; - cvt.u16.u64 %rs1563, %rd1260; - st.local.v2.u8 [%rd12+6], {%rs1563, %rs1562}; - cvt.u16.u64 %rs1564, %rd1263; - cvt.u16.u64 %rs1565, %rd1262; - st.local.v2.u8 [%rd12+8], {%rs1565, %rs1564}; - cvt.u16.u64 %rs1566, %rd4077; - cvt.u16.u64 %rs1567, %rd1264; - st.local.v2.u8 [%rd12+10], {%rs1566, %rs1567}; - cvt.u16.u64 %rs1568, %rd1266; - cvt.u16.u64 %rs1569, %rd1265; - st.local.v2.u8 
[%rd12+12], {%rs1569, %rs1568}; - cvt.u16.u64 %rs1570, %rd1268; - cvt.u16.u64 %rs1571, %rd1267; - st.local.v2.u8 [%rd12+14], {%rs1571, %rs1570}; - cvt.u16.u64 %rs1572, %rd1270; - cvt.u16.u64 %rs1573, %rd1269; - st.local.v2.u8 [%rd12+16], {%rs1573, %rs1572}; - cvt.u16.u64 %rs1574, %rd4076; - cvt.u16.u64 %rs1575, %rd1215; - st.local.v2.u8 [%rd12+18], {%rs1574, %rs1575}; - cvt.u16.u64 %rs1576, %rd1217; - cvt.u16.u64 %rs1577, %rd1216; - st.local.v2.u8 [%rd12+20], {%rs1577, %rs1576}; - cvt.u16.u64 %rs1578, %rd1219; - cvt.u16.u64 %rs1579, %rd1218; - st.local.v2.u8 [%rd12+22], {%rs1579, %rs1578}; - cvt.u16.u64 %rs1580, %rd1221; - cvt.u16.u64 %rs1581, %rd1220; - st.local.v2.u8 [%rd12+24], {%rs1581, %rs1580}; - cvt.u16.u64 %rs1582, %rd4075; - cvt.u16.u64 %rs1583, %rd1222; - st.local.v2.u8 [%rd12+26], {%rs1582, %rs1583}; - cvt.u16.u64 %rs1584, %rd1224; - cvt.u16.u64 %rs1585, %rd1223; - st.local.v2.u8 [%rd12+28], {%rs1585, %rs1584}; - cvt.u16.u64 %rs1586, %rd1226; - cvt.u16.u64 %rs1587, %rd1225; - st.local.v2.u8 [%rd12+30], {%rs1587, %rs1586}; - cvt.u16.u64 %rs1588, %rd1228; - cvt.u16.u64 %rs1589, %rd1227; - st.local.v2.u8 [%rd12+32], {%rs1589, %rs1588}; - cvt.u16.u64 %rs1590, %rd4074; - cvt.u16.u64 %rs1591, %rd1229; - st.local.v2.u8 [%rd12+34], {%rs1590, %rs1591}; - cvt.u16.u64 %rs1592, %rd1231; - cvt.u16.u64 %rs1593, %rd1230; - st.local.v2.u8 [%rd12+36], {%rs1593, %rs1592}; - cvt.u16.u64 %rs1594, %rd1233; - cvt.u16.u64 %rs1595, %rd1232; - st.local.v2.u8 [%rd12+38], {%rs1595, %rs1594}; - cvt.u16.u64 %rs1596, %rd1235; - cvt.u16.u64 %rs1597, %rd1234; - st.local.v2.u8 [%rd12+40], {%rs1597, %rs1596}; - cvt.u16.u64 %rs1598, %rd4073; - cvt.u16.u64 %rs1599, %rd1236; - st.local.v2.u8 [%rd12+42], {%rs1598, %rs1599}; - cvt.u16.u64 %rs1600, %rd1238; - cvt.u16.u64 %rs1601, %rd1237; - st.local.v2.u8 [%rd12+44], {%rs1601, %rs1600}; - cvt.u16.u64 %rs1602, %rd1240; - cvt.u16.u64 %rs1603, %rd1239; - st.local.v2.u8 [%rd12+46], {%rs1603, %rs1602}; - cvt.u16.u64 %rs1604, %rd1242; - cvt.u16.u64 
%rs1605, %rd1241; - st.local.v2.u8 [%rd12+48], {%rs1605, %rs1604}; - cvt.u16.u64 %rs1606, %rd4072; - cvt.u16.u64 %rs1607, %rd1243; - st.local.v2.u8 [%rd12+50], {%rs1606, %rs1607}; - cvt.u16.u64 %rs1608, %rd1245; - cvt.u16.u64 %rs1609, %rd1244; - st.local.v2.u8 [%rd12+52], {%rs1609, %rs1608}; - cvt.u16.u64 %rs1610, %rd1247; - cvt.u16.u64 %rs1611, %rd1246; - st.local.v2.u8 [%rd12+54], {%rs1611, %rs1610}; - cvt.u16.u64 %rs1612, %rd1249; - cvt.u16.u64 %rs1613, %rd1248; - st.local.v2.u8 [%rd12+56], {%rs1613, %rs1612}; - cvt.u16.u64 %rs1614, %rd4071; - cvt.u16.u64 %rs1615, %rd1250; - st.local.v2.u8 [%rd12+58], {%rs1614, %rs1615}; - cvt.u16.u64 %rs1616, %rd1252; - cvt.u16.u64 %rs1617, %rd1251; - st.local.v2.u8 [%rd12+60], {%rs1617, %rs1616}; - cvt.u16.u64 %rs1618, %rd1254; - cvt.u16.u64 %rs1619, %rd1253; - st.local.v2.u8 [%rd12+62], {%rs1619, %rs1618}; - cvt.u16.u64 %rs1620, %rd1256; - cvt.u16.u64 %rs1621, %rd1255; - st.local.v2.u8 [%rd12+64], {%rs1621, %rs1620}; - bra.uni $L__BB1_549; - -$L__BB1_2: - setp.eq.s16 %p13, %rs1380, 1; - @%p13 bra $L__BB1_399; - - setp.eq.s16 %p14, %rs1380, 2; - @%p14 bra $L__BB1_4; - bra.uni $L__BB1_470; - -$L__BB1_4: - setp.gt.u16 %p229, %rs1, 10; - add.u64 %rd3571, %SP, 352; - add.u64 %rd827, %SPL, 352; - mov.u16 %rs3463, 0; - st.local.v4.u16 [%rd827], {%rs3463, %rs3463, %rs3463, %rs3463}; - add.s64 %rd3572, %rd3571, 8; - cvta.to.local.u64 %rd828, %rd3572; - st.local.v4.u16 [%rd828], {%rs3463, %rs3463, %rs3463, %rs3463}; - add.s64 %rd3573, %rd3571, 16; - cvta.to.local.u64 %rd829, %rd3573; - st.local.v4.u16 [%rd829], {%rs3463, %rs3463, %rs3463, %rs3463}; - add.s64 %rd3574, %rd3571, 24; - cvta.to.local.u64 %rd830, %rd3574; - st.local.v4.u16 [%rd830], {%rs3463, %rs3463, %rs3463, %rs3463}; - add.s64 %rd3575, %rd3571, 32; - cvta.to.local.u64 %rd831, %rd3575; - st.local.v4.u16 [%rd831], {%rs3463, %rs3463, %rs3463, %rs3463}; - add.s64 %rd3576, %rd3571, 40; - cvta.to.local.u64 %rd832, %rd3576; - st.local.v4.u16 [%rd832], {%rs3463, %rs3463, %rs3463, 
%rs3463}; - add.s64 %rd3577, %rd3571, 48; - cvta.to.local.u64 %rd833, %rd3577; - st.local.v4.u16 [%rd833], {%rs3463, %rs3463, %rs3463, %rs3463}; - add.s64 %rd3578, %rd3571, 56; - cvta.to.local.u64 %rd834, %rd3578; - st.local.v4.u16 [%rd834], {%rs3463, %rs3463, %rs3463, %rs3463}; - add.s64 %rd835, %rd3571, 64; - cvta.to.local.u64 %rd836, %rd835; - st.local.u8 [%rd836], %rs3463; - @%p229 bra $L__BB1_398; - - cvta.to.local.u64 %rd837, %rd978; - shr.u64 %rd838, %rd11, 1; - setp.eq.s64 %p230, %rd838, 0; - @%p230 bra $L__BB1_327; - - mov.u64 %rd4251, 1; - mov.u64 %rd4249, %rd837; - mov.u64 %rd4250, %rd827; - bra.uni $L__BB1_7; - -$L__BB1_8: - ld.local.u16 %rs2, [%rd4249+4]; - add.s64 %rd4251, %rd4251, 1; - add.s64 %rd4250, %rd4250, 2; - add.s64 %rd4249, %rd4249, 2; - -$L__BB1_7: - st.local.u16 [%rd4250], %rs2; - setp.ge.u64 %p231, %rd4251, %rd838; - @%p231 bra $L__BB1_327; - bra.uni $L__BB1_8; - -$L__BB1_327: - and.b64 %rd846, %rd11, 1; - setp.eq.s64 %p232, %rd846, 0; - @%p232 bra $L__BB1_330; - - and.b64 %rd3583, %rd11, 65534; - cvta.to.local.u64 %rd3585, %rd3571; - add.s64 %rd847, %rd3585, %rd3583; - add.s64 %rd3586, %rd837, %rd3583; - add.s64 %rd848, %rd3586, 2; - mov.u64 %rd4252, 0; - -$L__BB1_329: - add.s64 %rd3587, %rd848, %rd4252; - ld.local.u8 %rs3464, [%rd3587]; - add.s64 %rd3588, %rd847, %rd4252; - st.local.u8 [%rd3588], %rs3464; - add.s64 %rd4252, %rd4252, 1; - setp.lt.u64 %p233, %rd4252, %rd846; - @%p233 bra $L__BB1_329; - -$L__BB1_330: - mov.u64 %rd3589, 0; - st.local.u8 [%rd836], %rs1; - ld.local.v4.u16 {%rs3465, %rs3466, %rs3467, %rs3468}, [%rd827]; - ld.local.v4.u16 {%rs3473, %rs3474, %rs3475, %rs3476}, [%rd828]; - ld.local.v4.u16 {%rs3481, %rs3482, %rs3483, %rs3484}, [%rd829]; - ld.local.v4.u16 {%rs3489, %rs3490, %rs3491, %rs3492}, [%rd830]; - ld.local.v4.u16 {%rs3497, %rs3498, %rs3499, %rs3500}, [%rd831]; - ld.local.v4.u16 {%rs3505, %rs3506, %rs3507, %rs3508}, [%rd832]; - ld.local.v4.u16 {%rs3513, %rs3514, %rs3515, %rs3516}, [%rd833]; - ld.local.v4.u16 
{%rs3521, %rs3522, %rs3523, %rs3524}, [%rd834]; - shr.u16 %rs3527, %rs3522, 8; - ld.local.v4.u16 {%rs3528, %rs3529, %rs3530, %rs3531}, [%rd836]; - and.b16 %rs3532, %rs3528, 255; - shr.u16 %rs3534, %rs3529, 8; - shr.u16 %rs3537, %rs3531, 8; - st.local.u64 [%rd1], %rd3589; - mov.u32 %r9107, -271733879; - mov.u32 %r9108, 1732584193; - st.local.v2.u32 [%rd1+8], {%r9108, %r9107}; - mov.u32 %r9105, 271733878; - mov.u32 %r9106, -1732584194; - st.local.v2.u32 [%rd1+16], {%r9106, %r9105}; - st.local.v4.u16 [%rd1+24], {%rs3465, %rs3466, %rs3467, %rs3468}; - st.local.v4.u16 [%rd1+32], {%rs3473, %rs3474, %rs3475, %rs3476}; - st.local.v4.u16 [%rd1+40], {%rs3481, %rs3482, %rs3483, %rs3484}; - st.local.v4.u16 [%rd1+48], {%rs3489, %rs3490, %rs3491, %rs3492}; - st.local.v4.u16 [%rd1+56], {%rs3497, %rs3498, %rs3499, %rs3500}; - st.local.v4.u16 [%rd1+64], {%rs3505, %rs3506, %rs3507, %rs3508}; - st.local.v4.u16 [%rd1+72], {%rs3513, %rs3514, %rs3515, %rs3516}; - st.local.u16 [%rd1+80], %rs3521; - st.local.u8 [%rd1+82], %rs3522; - st.local.u8 [%rd1+83], %rs3527; - st.local.v2.u16 [%rd1+84], {%rs3523, %rs3524}; - st.local.u16 [%rd1+88], %rs3528; - st.local.u8 [%rd1+90], %rs3529; - st.local.u8 [%rd1+91], %rs3534; - st.local.u16 [%rd1+92], %rs3530; - st.local.u8 [%rd1+94], %rs3531; - st.local.u8 [%rd1+95], %rs3537; - cvt.u64.u16 %rd3591, %rs3528; - and.b64 %rd852, %rd3591, 255; - cvt.u32.u16 %r5357, %rs3528; - and.b32 %r5358, %r5357, 255; - mul.wide.u32 %rd853, %r5358, 8; - setp.lt.u16 %p234, %rs3532, 64; - @%p234 bra $L__BB1_332; - bra.uni $L__BB1_331; - -$L__BB1_332: - add.s64 %rd3592, %rd1, %rd852; - add.s64 %rd854, %rd1, 88; - mov.u16 %rs3540, 128; - st.local.u8 [%rd3592+24], %rs3540; - add.s64 %rd855, %rd852, 1; - setp.eq.s64 %p235, %rd855, 64; - @%p235 bra $L__BB1_339; - - add.s64 %rd3593, %rd1, %rd855; - add.s64 %rd4257, %rd3593, 24; - mov.u16 %rs3541, 3; - sub.s16 %rs3542, %rs3541, %rs3528; - and.b16 %rs787, %rs3542, 3; - setp.eq.s16 %p236, %rs787, 0; - @%p236 bra $L__BB1_336; - - 
cvt.u64.u16 %rd3594, %rs787; - neg.s64 %rd4253, %rd3594; - mov.u64 %rd4254, %rd4257; - -$L__BB1_335: - .pragma "nounroll"; - add.s64 %rd4257, %rd4254, 1; - st.local.u8 [%rd4254], %rs3463; - add.s64 %rd4253, %rd4253, 1; - setp.ne.s64 %p237, %rd4253, 0; - mov.u64 %rd4254, %rd4257; - @%p237 bra $L__BB1_335; - -$L__BB1_336: - mov.u64 %rd3595, 62; - sub.s64 %rd3596, %rd3595, %rd852; - setp.lt.u64 %p238, %rd3596, 3; - @%p238 bra $L__BB1_339; - - sub.s64 %rd4256, %rd854, %rd4257; - -$L__BB1_338: - st.local.u8 [%rd4257], %rs3463; - st.local.u8 [%rd4257+1], %rs3463; - st.local.u8 [%rd4257+2], %rs3463; - st.local.u8 [%rd4257+3], %rs3463; - add.s64 %rd4256, %rd4256, -4; - setp.ne.s64 %p239, %rd4256, 0; - add.s64 %rd4257, %rd4257, 4; - @%p239 bra $L__BB1_338; - -$L__BB1_339: - or.b64 %rd3597, %rd852, 7; - setp.eq.s64 %p240, %rd3597, 63; - add.s64 %rd4258, %rd1, 24; - @%p240 bra $L__BB1_359; - bra.uni $L__BB1_340; - -$L__BB1_359: - mov.u32 %r9108, 1732584193; - mov.u32 %r9107, -271733879; - mov.u32 %r9106, -1732584194; - mov.u32 %r9105, 271733878; - mov.pred %p258, 0; - mov.pred %p273, -1; - mov.u64 %rd4261, %rd4258; - -$L__BB1_360: - ld.local.u32 %rd3631, [%rd4261]; - shl.b64 %rd3632, %rd3631, 8; - mov.b64 {%r5939, %r5940}, %rd3632; - mov.b32 {%rs872, %rs3625}, %r5940; - mov.b32 {%rs868, %rs870}, %r5939; - shr.u16 %rs871, %rs870, 8; - shr.u16 %rs869, %rs868, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3633, [%rd4261+4]; - shl.b64 %rd3634, %rd3633, 8; - mov.b64 {%r5941, %r5942}, %rd3634; - mov.b32 {%rs877, %rs3626}, %r5942; - mov.b32 {%rs873, %rs875}, %r5941; - shr.u16 %rs876, %rs875, 8; - shr.u16 %rs874, %rs873, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3635, [%rd4261+8]; - shl.b64 %rd3636, %rd3635, 8; - mov.b64 {%r5943, %r5944}, %rd3636; - mov.b32 {%rs882, %rs3627}, %r5944; - mov.b32 {%rs878, %rs880}, %r5943; - shr.u16 %rs881, %rs880, 8; - shr.u16 %rs879, %rs878, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3637, [%rd4261+12]; - shl.b64 %rd3638, %rd3637, 8; - 
mov.b64 {%r5945, %r5946}, %rd3638; - mov.b32 {%rs887, %rs3628}, %r5946; - mov.b32 {%rs883, %rs885}, %r5945; - shr.u16 %rs886, %rs885, 8; - shr.u16 %rs884, %rs883, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3639, [%rd4261+16]; - shl.b64 %rd3640, %rd3639, 8; - mov.b64 {%r5947, %r5948}, %rd3640; - mov.b32 {%rs892, %rs3629}, %r5948; - mov.b32 {%rs888, %rs890}, %r5947; - shr.u16 %rs891, %rs890, 8; - shr.u16 %rs889, %rs888, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3641, [%rd4261+20]; - shl.b64 %rd3642, %rd3641, 8; - mov.b64 {%r5949, %r5950}, %rd3642; - mov.b32 {%rs897, %rs3630}, %r5950; - mov.b32 {%rs893, %rs895}, %r5949; - shr.u16 %rs896, %rs895, 8; - shr.u16 %rs894, %rs893, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3643, [%rd4261+24]; - shl.b64 %rd3644, %rd3643, 8; - mov.b64 {%r5951, %r5952}, %rd3644; - mov.b32 {%rs902, %rs3631}, %r5952; - mov.b32 {%rs898, %rs900}, %r5951; - shr.u16 %rs901, %rs900, 8; - shr.u16 %rs899, %rs898, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3645, [%rd4261+28]; - shl.b64 %rd3646, %rd3645, 8; - mov.b64 {%r5953, %r5954}, %rd3646; - mov.b32 {%rs907, %rs3632}, %r5954; - mov.b32 {%rs903, %rs905}, %r5953; - shr.u16 %rs906, %rs905, 8; - shr.u16 %rs904, %rs903, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3647, [%rd4261+32]; - shl.b64 %rd3648, %rd3647, 8; - mov.b64 {%r5955, %r5956}, %rd3648; - mov.b32 {%rs912, %rs3633}, %r5956; - mov.b32 {%rs908, %rs910}, %r5955; - shr.u16 %rs911, %rs910, 8; - shr.u16 %rs909, %rs908, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3649, [%rd4261+36]; - shl.b64 %rd3650, %rd3649, 8; - mov.b64 {%r5957, %r5958}, %rd3650; - mov.b32 {%rs917, %rs3634}, %r5958; - mov.b32 {%rs913, %rs915}, %r5957; - shr.u16 %rs916, %rs915, 8; - shr.u16 %rs914, %rs913, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3651, [%rd4261+40]; - shl.b64 %rd3652, %rd3651, 8; - mov.b64 {%r5959, %r5960}, %rd3652; - mov.b32 {%rs922, %rs3635}, %r5960; - mov.b32 {%rs918, %rs920}, %r5959; - shr.u16 %rs921, %rs920, 8; - 
shr.u16 %rs919, %rs918, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3653, [%rd4261+44]; - shl.b64 %rd3654, %rd3653, 8; - mov.b64 {%r5961, %r5962}, %rd3654; - mov.b32 {%rs927, %rs3636}, %r5962; - mov.b32 {%rs923, %rs925}, %r5961; - shr.u16 %rs926, %rs925, 8; - shr.u16 %rs924, %rs923, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3655, [%rd4261+48]; - shl.b64 %rd3656, %rd3655, 8; - mov.b64 {%r5963, %r5964}, %rd3656; - mov.b32 {%rs932, %rs3637}, %r5964; - mov.b32 {%rs928, %rs930}, %r5963; - shr.u16 %rs931, %rs930, 8; - shr.u16 %rs929, %rs928, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3657, [%rd4261+52]; - shl.b64 %rd3658, %rd3657, 8; - mov.b64 {%r5965, %r5966}, %rd3658; - mov.b32 {%rs937, %rs3638}, %r5966; - mov.b32 {%rs933, %rs935}, %r5965; - shr.u16 %rs936, %rs935, 8; - shr.u16 %rs934, %rs933, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3659, [%rd4261+56]; - shl.b64 %rd3660, %rd3659, 8; - mov.b64 {%r5967, %r5968}, %rd3660; - mov.b32 {%rs942, %rs3639}, %r5968; - mov.b32 {%rs938, %rs940}, %r5967; - shr.u16 %rs941, %rs940, 8; - shr.u16 %rs939, %rs938, 8; - @%p258 bra $L__BB1_376; - - ld.local.u32 %rd3661, [%rd4261+60]; - shl.b64 %rd3662, %rd3661, 8; - mov.b64 {%r5969, %r5970}, %rd3662; - mov.b32 {%rs947, %rs3640}, %r5970; - mov.b32 {%rs943, %rs945}, %r5969; - shr.u16 %rs946, %rs945, 8; - shr.u16 %rs944, %rs943, 8; - @%p273 bra $L__BB1_377; - bra.uni $L__BB1_376; - -$L__BB1_377: - add.s64 %rd4258, %rd4258, 64; - shl.b16 %rs3641, %rs940, 8; - or.b16 %rs3642, %rs939, %rs3641; - shl.b16 %rs3643, %rs942, 8; - or.b16 %rs3644, %rs941, %rs3643; - shl.b16 %rs3645, %rs945, 8; - or.b16 %rs3646, %rs944, %rs3645; - shl.b16 %rs3647, %rs947, 8; - or.b16 %rs3648, %rs946, %rs3647; - mov.b32 %r5971, {%rs3646, %rs3648}; - not.b32 %r5972, %r9107; - and.b32 %r5973, %r9105, %r5972; - and.b32 %r5974, %r9106, %r9107; - or.b32 %r5975, %r5973, %r5974; - add.s32 %r5976, %r9108, %r5975; - shl.b16 %rs3649, %rs870, 8; - or.b16 %rs3650, %rs869, %rs3649; - shl.b16 %rs3651, %rs872, 
8; - or.b16 %rs3652, %rs871, %rs3651; - mov.b32 %r5977, {%rs3650, %rs3652}; - add.s32 %r5978, %r5976, %r5977; - add.s32 %r5979, %r5978, -680876936; - shf.l.wrap.b32 %r5980, %r5979, %r5979, 7; - add.s32 %r5981, %r5980, %r9107; - and.b32 %r5982, %r5981, %r9107; - not.b32 %r5983, %r5981; - and.b32 %r5984, %r9106, %r5983; - or.b32 %r5985, %r5984, %r5982; - shl.b16 %rs3653, %rs875, 8; - or.b16 %rs3654, %rs874, %rs3653; - shl.b16 %rs3655, %rs877, 8; - or.b16 %rs3656, %rs876, %rs3655; - mov.b32 %r5986, {%rs3654, %rs3656}; - add.s32 %r5987, %r9105, %r5986; - add.s32 %r5988, %r5987, %r5985; - add.s32 %r5989, %r5988, -389564586; - shf.l.wrap.b32 %r5990, %r5989, %r5989, 12; - add.s32 %r5991, %r5990, %r5981; - and.b32 %r5992, %r5991, %r5981; - not.b32 %r5993, %r5991; - and.b32 %r5994, %r9107, %r5993; - or.b32 %r5995, %r5994, %r5992; - shl.b16 %rs3657, %rs880, 8; - or.b16 %rs3658, %rs879, %rs3657; - shl.b16 %rs3659, %rs882, 8; - or.b16 %rs3660, %rs881, %rs3659; - mov.b32 %r5996, {%rs3658, %rs3660}; - add.s32 %r5997, %r9106, %r5996; - add.s32 %r5998, %r5997, %r5995; - add.s32 %r5999, %r5998, 606105819; - shf.l.wrap.b32 %r6000, %r5999, %r5999, 17; - add.s32 %r6001, %r6000, %r5991; - and.b32 %r6002, %r6001, %r5991; - not.b32 %r6003, %r6001; - and.b32 %r6004, %r5981, %r6003; - or.b32 %r6005, %r6004, %r6002; - shl.b16 %rs3661, %rs885, 8; - or.b16 %rs3662, %rs884, %rs3661; - shl.b16 %rs3663, %rs887, 8; - or.b16 %rs3664, %rs886, %rs3663; - mov.b32 %r6006, {%rs3662, %rs3664}; - add.s32 %r6007, %r9107, %r6006; - add.s32 %r6008, %r6007, %r6005; - add.s32 %r6009, %r6008, -1044525330; - shf.l.wrap.b32 %r6010, %r6009, %r6009, 22; - add.s32 %r6011, %r6010, %r6001; - and.b32 %r6012, %r6011, %r6001; - not.b32 %r6013, %r6011; - and.b32 %r6014, %r5991, %r6013; - or.b32 %r6015, %r6014, %r6012; - shl.b16 %rs3665, %rs890, 8; - or.b16 %rs3666, %rs889, %rs3665; - shl.b16 %rs3667, %rs892, 8; - or.b16 %rs3668, %rs891, %rs3667; - mov.b32 %r6016, {%rs3666, %rs3668}; - add.s32 %r6017, %r5981, %r6016; - 
add.s32 %r6018, %r6017, %r6015; - add.s32 %r6019, %r6018, -176418897; - shf.l.wrap.b32 %r6020, %r6019, %r6019, 7; - add.s32 %r6021, %r6020, %r6011; - and.b32 %r6022, %r6021, %r6011; - not.b32 %r6023, %r6021; - and.b32 %r6024, %r6001, %r6023; - or.b32 %r6025, %r6024, %r6022; - shl.b16 %rs3669, %rs895, 8; - or.b16 %rs3670, %rs894, %rs3669; - shl.b16 %rs3671, %rs897, 8; - or.b16 %rs3672, %rs896, %rs3671; - mov.b32 %r6026, {%rs3670, %rs3672}; - add.s32 %r6027, %r6026, %r5991; - add.s32 %r6028, %r6027, %r6025; - add.s32 %r6029, %r6028, 1200080426; - shf.l.wrap.b32 %r6030, %r6029, %r6029, 12; - add.s32 %r6031, %r6030, %r6021; - and.b32 %r6032, %r6031, %r6021; - not.b32 %r6033, %r6031; - and.b32 %r6034, %r6011, %r6033; - or.b32 %r6035, %r6034, %r6032; - shl.b16 %rs3673, %rs900, 8; - or.b16 %rs3674, %rs899, %rs3673; - shl.b16 %rs3675, %rs902, 8; - or.b16 %rs3676, %rs901, %rs3675; - mov.b32 %r6036, {%rs3674, %rs3676}; - add.s32 %r6037, %r6036, %r6001; - add.s32 %r6038, %r6037, %r6035; - add.s32 %r6039, %r6038, -1473231341; - shf.l.wrap.b32 %r6040, %r6039, %r6039, 17; - add.s32 %r6041, %r6040, %r6031; - and.b32 %r6042, %r6041, %r6031; - not.b32 %r6043, %r6041; - and.b32 %r6044, %r6021, %r6043; - or.b32 %r6045, %r6044, %r6042; - shl.b16 %rs3677, %rs905, 8; - or.b16 %rs3678, %rs904, %rs3677; - shl.b16 %rs3679, %rs907, 8; - or.b16 %rs3680, %rs906, %rs3679; - mov.b32 %r6046, {%rs3678, %rs3680}; - add.s32 %r6047, %r6046, %r6011; - add.s32 %r6048, %r6047, %r6045; - add.s32 %r6049, %r6048, -45705983; - shf.l.wrap.b32 %r6050, %r6049, %r6049, 22; - add.s32 %r6051, %r6050, %r6041; - and.b32 %r6052, %r6051, %r6041; - not.b32 %r6053, %r6051; - and.b32 %r6054, %r6031, %r6053; - or.b32 %r6055, %r6054, %r6052; - shl.b16 %rs3681, %rs910, 8; - or.b16 %rs3682, %rs909, %rs3681; - shl.b16 %rs3683, %rs912, 8; - or.b16 %rs3684, %rs911, %rs3683; - mov.b32 %r6056, {%rs3682, %rs3684}; - add.s32 %r6057, %r6056, %r6021; - add.s32 %r6058, %r6057, %r6055; - add.s32 %r6059, %r6058, 1770035416; - 
shf.l.wrap.b32 %r6060, %r6059, %r6059, 7; - add.s32 %r6061, %r6060, %r6051; - and.b32 %r6062, %r6061, %r6051; - not.b32 %r6063, %r6061; - and.b32 %r6064, %r6041, %r6063; - or.b32 %r6065, %r6064, %r6062; - shl.b16 %rs3685, %rs915, 8; - or.b16 %rs3686, %rs914, %rs3685; - shl.b16 %rs3687, %rs917, 8; - or.b16 %rs3688, %rs916, %rs3687; - mov.b32 %r6066, {%rs3686, %rs3688}; - add.s32 %r6067, %r6066, %r6031; - add.s32 %r6068, %r6067, %r6065; - add.s32 %r6069, %r6068, -1958414417; - shf.l.wrap.b32 %r6070, %r6069, %r6069, 12; - add.s32 %r6071, %r6070, %r6061; - and.b32 %r6072, %r6071, %r6061; - not.b32 %r6073, %r6071; - and.b32 %r6074, %r6051, %r6073; - or.b32 %r6075, %r6074, %r6072; - shl.b16 %rs3689, %rs920, 8; - or.b16 %rs3690, %rs919, %rs3689; - shl.b16 %rs3691, %rs922, 8; - or.b16 %rs3692, %rs921, %rs3691; - mov.b32 %r6076, {%rs3690, %rs3692}; - add.s32 %r6077, %r6076, %r6041; - add.s32 %r6078, %r6077, %r6075; - add.s32 %r6079, %r6078, -42063; - shf.l.wrap.b32 %r6080, %r6079, %r6079, 17; - add.s32 %r6081, %r6080, %r6071; - and.b32 %r6082, %r6081, %r6071; - not.b32 %r6083, %r6081; - and.b32 %r6084, %r6061, %r6083; - or.b32 %r6085, %r6084, %r6082; - shl.b16 %rs3693, %rs925, 8; - or.b16 %rs3694, %rs924, %rs3693; - shl.b16 %rs3695, %rs927, 8; - or.b16 %rs3696, %rs926, %rs3695; - mov.b32 %r6086, {%rs3694, %rs3696}; - add.s32 %r6087, %r6086, %r6051; - add.s32 %r6088, %r6087, %r6085; - add.s32 %r6089, %r6088, -1990404162; - shf.l.wrap.b32 %r6090, %r6089, %r6089, 22; - add.s32 %r6091, %r6090, %r6081; - and.b32 %r6092, %r6091, %r6081; - not.b32 %r6093, %r6091; - and.b32 %r6094, %r6071, %r6093; - or.b32 %r6095, %r6094, %r6092; - shl.b16 %rs3697, %rs930, 8; - or.b16 %rs3698, %rs929, %rs3697; - shl.b16 %rs3699, %rs932, 8; - or.b16 %rs3700, %rs931, %rs3699; - mov.b32 %r6096, {%rs3698, %rs3700}; - add.s32 %r6097, %r6096, %r6061; - add.s32 %r6098, %r6097, %r6095; - add.s32 %r6099, %r6098, 1804603682; - shf.l.wrap.b32 %r6100, %r6099, %r6099, 7; - add.s32 %r6101, %r6100, %r6091; - 
and.b32 %r6102, %r6101, %r6091; - not.b32 %r6103, %r6101; - and.b32 %r6104, %r6081, %r6103; - or.b32 %r6105, %r6104, %r6102; - shl.b16 %rs3701, %rs935, 8; - or.b16 %rs3702, %rs934, %rs3701; - shl.b16 %rs3703, %rs937, 8; - or.b16 %rs3704, %rs936, %rs3703; - mov.b32 %r6106, {%rs3702, %rs3704}; - add.s32 %r6107, %r6106, %r6071; - add.s32 %r6108, %r6107, %r6105; - add.s32 %r6109, %r6108, -40341101; - shf.l.wrap.b32 %r6110, %r6109, %r6109, 12; - add.s32 %r6111, %r6110, %r6101; - mov.b32 %r6112, {%rs3642, %rs3644}; - and.b32 %r6113, %r6111, %r6101; - not.b32 %r6114, %r6111; - and.b32 %r6115, %r6091, %r6114; - or.b32 %r6116, %r6115, %r6113; - add.s32 %r6117, %r6112, %r6081; - add.s32 %r6118, %r6117, %r6116; - add.s32 %r6119, %r6118, -1502002290; - shf.l.wrap.b32 %r6120, %r6119, %r6119, 17; - add.s32 %r6121, %r6120, %r6111; - and.b32 %r6122, %r6121, %r6111; - not.b32 %r6123, %r6121; - and.b32 %r6124, %r6101, %r6123; - or.b32 %r6125, %r6124, %r6122; - add.s32 %r6126, %r5971, %r6091; - add.s32 %r6127, %r6126, %r6125; - add.s32 %r6128, %r6127, 1236535329; - shf.l.wrap.b32 %r6129, %r6128, %r6128, 22; - add.s32 %r6130, %r6129, %r6121; - and.b32 %r6131, %r6130, %r6111; - and.b32 %r6132, %r6121, %r6114; - or.b32 %r6133, %r6131, %r6132; - add.s32 %r6134, %r5986, %r6101; - add.s32 %r6135, %r6134, %r6133; - add.s32 %r6136, %r6135, -165796510; - shf.l.wrap.b32 %r6137, %r6136, %r6136, 5; - add.s32 %r6138, %r6137, %r6130; - and.b32 %r6139, %r6138, %r6121; - and.b32 %r6140, %r6130, %r6123; - or.b32 %r6141, %r6139, %r6140; - add.s32 %r6142, %r6036, %r6111; - add.s32 %r6143, %r6142, %r6141; - add.s32 %r6144, %r6143, -1069501632; - shf.l.wrap.b32 %r6145, %r6144, %r6144, 9; - add.s32 %r6146, %r6145, %r6138; - and.b32 %r6147, %r6146, %r6130; - not.b32 %r6148, %r6130; - and.b32 %r6149, %r6138, %r6148; - or.b32 %r6150, %r6147, %r6149; - add.s32 %r6151, %r6086, %r6121; - add.s32 %r6152, %r6151, %r6150; - add.s32 %r6153, %r6152, 643717713; - shf.l.wrap.b32 %r6154, %r6153, %r6153, 14; - add.s32 
%r6155, %r6154, %r6146; - and.b32 %r6156, %r6155, %r6138; - not.b32 %r6157, %r6138; - and.b32 %r6158, %r6146, %r6157; - or.b32 %r6159, %r6156, %r6158; - add.s32 %r6160, %r5977, %r6130; - add.s32 %r6161, %r6160, %r6159; - add.s32 %r6162, %r6161, -373897302; - shf.l.wrap.b32 %r6163, %r6162, %r6162, 20; - add.s32 %r6164, %r6163, %r6155; - and.b32 %r6165, %r6164, %r6146; - not.b32 %r6166, %r6146; - and.b32 %r6167, %r6155, %r6166; - or.b32 %r6168, %r6165, %r6167; - add.s32 %r6169, %r6026, %r6138; - add.s32 %r6170, %r6169, %r6168; - add.s32 %r6171, %r6170, -701558691; - shf.l.wrap.b32 %r6172, %r6171, %r6171, 5; - add.s32 %r6173, %r6172, %r6164; - and.b32 %r6174, %r6173, %r6155; - not.b32 %r6175, %r6155; - and.b32 %r6176, %r6164, %r6175; - or.b32 %r6177, %r6174, %r6176; - add.s32 %r6178, %r6076, %r6146; - add.s32 %r6179, %r6178, %r6177; - add.s32 %r6180, %r6179, 38016083; - shf.l.wrap.b32 %r6181, %r6180, %r6180, 9; - add.s32 %r6182, %r6181, %r6173; - and.b32 %r6183, %r6182, %r6164; - not.b32 %r6184, %r6164; - and.b32 %r6185, %r6173, %r6184; - or.b32 %r6186, %r6183, %r6185; - add.s32 %r6187, %r5971, %r6155; - add.s32 %r6188, %r6187, %r6186; - add.s32 %r6189, %r6188, -660478335; - shf.l.wrap.b32 %r6190, %r6189, %r6189, 14; - add.s32 %r6191, %r6190, %r6182; - and.b32 %r6192, %r6191, %r6173; - not.b32 %r6193, %r6173; - and.b32 %r6194, %r6182, %r6193; - or.b32 %r6195, %r6192, %r6194; - add.s32 %r6196, %r6016, %r6164; - add.s32 %r6197, %r6196, %r6195; - add.s32 %r6198, %r6197, -405537848; - shf.l.wrap.b32 %r6199, %r6198, %r6198, 20; - add.s32 %r6200, %r6199, %r6191; - and.b32 %r6201, %r6200, %r6182; - not.b32 %r6202, %r6182; - and.b32 %r6203, %r6191, %r6202; - or.b32 %r6204, %r6201, %r6203; - add.s32 %r6205, %r6066, %r6173; - add.s32 %r6206, %r6205, %r6204; - add.s32 %r6207, %r6206, 568446438; - shf.l.wrap.b32 %r6208, %r6207, %r6207, 5; - add.s32 %r6209, %r6208, %r6200; - and.b32 %r6210, %r6209, %r6191; - not.b32 %r6211, %r6191; - and.b32 %r6212, %r6200, %r6211; - or.b32 
%r6213, %r6210, %r6212; - add.s32 %r6214, %r6112, %r6182; - add.s32 %r6215, %r6214, %r6213; - add.s32 %r6216, %r6215, -1019803690; - shf.l.wrap.b32 %r6217, %r6216, %r6216, 9; - add.s32 %r6218, %r6217, %r6209; - and.b32 %r6219, %r6218, %r6200; - not.b32 %r6220, %r6200; - and.b32 %r6221, %r6209, %r6220; - or.b32 %r6222, %r6219, %r6221; - add.s32 %r6223, %r6006, %r6191; - add.s32 %r6224, %r6223, %r6222; - add.s32 %r6225, %r6224, -187363961; - shf.l.wrap.b32 %r6226, %r6225, %r6225, 14; - add.s32 %r6227, %r6226, %r6218; - and.b32 %r6228, %r6227, %r6209; - not.b32 %r6229, %r6209; - and.b32 %r6230, %r6218, %r6229; - or.b32 %r6231, %r6228, %r6230; - add.s32 %r6232, %r6056, %r6200; - add.s32 %r6233, %r6232, %r6231; - add.s32 %r6234, %r6233, 1163531501; - shf.l.wrap.b32 %r6235, %r6234, %r6234, 20; - add.s32 %r6236, %r6235, %r6227; - and.b32 %r6237, %r6236, %r6218; - not.b32 %r6238, %r6218; - and.b32 %r6239, %r6227, %r6238; - or.b32 %r6240, %r6237, %r6239; - add.s32 %r6241, %r6106, %r6209; - add.s32 %r6242, %r6241, %r6240; - add.s32 %r6243, %r6242, -1444681467; - shf.l.wrap.b32 %r6244, %r6243, %r6243, 5; - add.s32 %r6245, %r6244, %r6236; - and.b32 %r6246, %r6245, %r6227; - not.b32 %r6247, %r6227; - and.b32 %r6248, %r6236, %r6247; - or.b32 %r6249, %r6246, %r6248; - add.s32 %r6250, %r5996, %r6218; - add.s32 %r6251, %r6250, %r6249; - add.s32 %r6252, %r6251, -51403784; - shf.l.wrap.b32 %r6253, %r6252, %r6252, 9; - add.s32 %r6254, %r6253, %r6245; - and.b32 %r6255, %r6254, %r6236; - not.b32 %r6256, %r6236; - and.b32 %r6257, %r6245, %r6256; - or.b32 %r6258, %r6255, %r6257; - add.s32 %r6259, %r6046, %r6227; - add.s32 %r6260, %r6259, %r6258; - add.s32 %r6261, %r6260, 1735328473; - shf.l.wrap.b32 %r6262, %r6261, %r6261, 14; - add.s32 %r6263, %r6262, %r6254; - and.b32 %r6264, %r6263, %r6245; - not.b32 %r6265, %r6245; - and.b32 %r6266, %r6254, %r6265; - or.b32 %r6267, %r6264, %r6266; - add.s32 %r6268, %r6096, %r6236; - add.s32 %r6269, %r6268, %r6267; - add.s32 %r6270, %r6269, 
-1926607734; - shf.l.wrap.b32 %r6271, %r6270, %r6270, 20; - add.s32 %r6272, %r6271, %r6263; - xor.b32 %r6273, %r6272, %r6263; - xor.b32 %r6274, %r6273, %r6254; - add.s32 %r6275, %r6026, %r6245; - add.s32 %r6276, %r6275, %r6274; - add.s32 %r6277, %r6276, -378558; - shf.l.wrap.b32 %r6278, %r6277, %r6277, 4; - add.s32 %r6279, %r6278, %r6272; - xor.b32 %r6280, %r6279, %r6273; - add.s32 %r6281, %r6056, %r6254; - add.s32 %r6282, %r6281, %r6280; - add.s32 %r6283, %r6282, -2022574463; - shf.l.wrap.b32 %r6284, %r6283, %r6283, 11; - add.s32 %r6285, %r6284, %r6279; - xor.b32 %r6286, %r6285, %r6279; - xor.b32 %r6287, %r6286, %r6272; - add.s32 %r6288, %r6086, %r6263; - add.s32 %r6289, %r6288, %r6287; - add.s32 %r6290, %r6289, 1839030562; - shf.l.wrap.b32 %r6291, %r6290, %r6290, 16; - add.s32 %r6292, %r6291, %r6285; - xor.b32 %r6293, %r6292, %r6286; - add.s32 %r6294, %r6112, %r6272; - add.s32 %r6295, %r6294, %r6293; - add.s32 %r6296, %r6295, -35309556; - shf.l.wrap.b32 %r6297, %r6296, %r6296, 23; - add.s32 %r6298, %r6297, %r6292; - xor.b32 %r6299, %r6292, %r6285; - xor.b32 %r6300, %r6299, %r6298; - add.s32 %r6301, %r5986, %r6279; - add.s32 %r6302, %r6301, %r6300; - add.s32 %r6303, %r6302, -1530992060; - shf.l.wrap.b32 %r6304, %r6303, %r6303, 4; - add.s32 %r6305, %r6304, %r6298; - xor.b32 %r6306, %r6298, %r6292; - xor.b32 %r6307, %r6306, %r6305; - add.s32 %r6308, %r6016, %r6285; - add.s32 %r6309, %r6308, %r6307; - add.s32 %r6310, %r6309, 1272893353; - shf.l.wrap.b32 %r6311, %r6310, %r6310, 11; - add.s32 %r6312, %r6311, %r6305; - xor.b32 %r6313, %r6305, %r6298; - xor.b32 %r6314, %r6313, %r6312; - add.s32 %r6315, %r6046, %r6292; - add.s32 %r6316, %r6315, %r6314; - add.s32 %r6317, %r6316, -155497632; - shf.l.wrap.b32 %r6318, %r6317, %r6317, 16; - add.s32 %r6319, %r6318, %r6312; - xor.b32 %r6320, %r6312, %r6305; - xor.b32 %r6321, %r6320, %r6319; - add.s32 %r6322, %r6076, %r6298; - add.s32 %r6323, %r6322, %r6321; - add.s32 %r6324, %r6323, -1094730640; - shf.l.wrap.b32 %r6325, %r6324, 
%r6324, 23; - add.s32 %r6326, %r6325, %r6319; - xor.b32 %r6327, %r6319, %r6312; - xor.b32 %r6328, %r6327, %r6326; - add.s32 %r6329, %r6106, %r6305; - add.s32 %r6330, %r6329, %r6328; - add.s32 %r6331, %r6330, 681279174; - shf.l.wrap.b32 %r6332, %r6331, %r6331, 4; - add.s32 %r6333, %r6332, %r6326; - xor.b32 %r6334, %r6326, %r6319; - xor.b32 %r6335, %r6334, %r6333; - add.s32 %r6336, %r5977, %r6312; - add.s32 %r6337, %r6336, %r6335; - add.s32 %r6338, %r6337, -358537222; - shf.l.wrap.b32 %r6339, %r6338, %r6338, 11; - add.s32 %r6340, %r6339, %r6333; - xor.b32 %r6341, %r6333, %r6326; - xor.b32 %r6342, %r6341, %r6340; - add.s32 %r6343, %r6006, %r6319; - add.s32 %r6344, %r6343, %r6342; - add.s32 %r6345, %r6344, -722521979; - shf.l.wrap.b32 %r6346, %r6345, %r6345, 16; - add.s32 %r6347, %r6346, %r6340; - xor.b32 %r6348, %r6340, %r6333; - xor.b32 %r6349, %r6348, %r6347; - add.s32 %r6350, %r6036, %r6326; - add.s32 %r6351, %r6350, %r6349; - add.s32 %r6352, %r6351, 76029189; - shf.l.wrap.b32 %r6353, %r6352, %r6352, 23; - add.s32 %r6354, %r6353, %r6347; - xor.b32 %r6355, %r6347, %r6340; - xor.b32 %r6356, %r6355, %r6354; - add.s32 %r6357, %r6066, %r6333; - add.s32 %r6358, %r6357, %r6356; - add.s32 %r6359, %r6358, -640364487; - shf.l.wrap.b32 %r6360, %r6359, %r6359, 4; - add.s32 %r6361, %r6360, %r6354; - xor.b32 %r6362, %r6354, %r6347; - xor.b32 %r6363, %r6362, %r6361; - add.s32 %r6364, %r6096, %r6340; - add.s32 %r6365, %r6364, %r6363; - add.s32 %r6366, %r6365, -421815835; - shf.l.wrap.b32 %r6367, %r6366, %r6366, 11; - add.s32 %r6368, %r6367, %r6361; - xor.b32 %r6369, %r6361, %r6354; - xor.b32 %r6370, %r6369, %r6368; - add.s32 %r6371, %r5971, %r6347; - add.s32 %r6372, %r6371, %r6370; - add.s32 %r6373, %r6372, 530742520; - shf.l.wrap.b32 %r6374, %r6373, %r6373, 16; - add.s32 %r6375, %r6374, %r6368; - xor.b32 %r6376, %r6368, %r6361; - xor.b32 %r6377, %r6376, %r6375; - add.s32 %r6378, %r5996, %r6354; - add.s32 %r6379, %r6378, %r6377; - add.s32 %r6380, %r6379, -995338651; - 
shf.l.wrap.b32 %r6381, %r6380, %r6380, 23; - add.s32 %r6382, %r6381, %r6375; - not.b32 %r6383, %r6368; - or.b32 %r6384, %r6382, %r6383; - xor.b32 %r6385, %r6384, %r6375; - add.s32 %r6386, %r5977, %r6361; - add.s32 %r6387, %r6386, %r6385; - add.s32 %r6388, %r6387, -198630844; - shf.l.wrap.b32 %r6389, %r6388, %r6388, 6; - add.s32 %r6390, %r6389, %r6382; - not.b32 %r6391, %r6375; - or.b32 %r6392, %r6390, %r6391; - xor.b32 %r6393, %r6392, %r6382; - add.s32 %r6394, %r6046, %r6368; - add.s32 %r6395, %r6394, %r6393; - add.s32 %r6396, %r6395, 1126891415; - shf.l.wrap.b32 %r6397, %r6396, %r6396, 10; - add.s32 %r6398, %r6397, %r6390; - not.b32 %r6399, %r6382; - or.b32 %r6400, %r6398, %r6399; - xor.b32 %r6401, %r6400, %r6390; - add.s32 %r6402, %r6112, %r6375; - add.s32 %r6403, %r6402, %r6401; - add.s32 %r6404, %r6403, -1416354905; - shf.l.wrap.b32 %r6405, %r6404, %r6404, 15; - add.s32 %r6406, %r6405, %r6398; - not.b32 %r6407, %r6390; - or.b32 %r6408, %r6406, %r6407; - xor.b32 %r6409, %r6408, %r6398; - add.s32 %r6410, %r6026, %r6382; - add.s32 %r6411, %r6410, %r6409; - add.s32 %r6412, %r6411, -57434055; - shf.l.wrap.b32 %r6413, %r6412, %r6412, 21; - add.s32 %r6414, %r6413, %r6406; - not.b32 %r6415, %r6398; - or.b32 %r6416, %r6414, %r6415; - xor.b32 %r6417, %r6416, %r6406; - add.s32 %r6418, %r6096, %r6390; - add.s32 %r6419, %r6418, %r6417; - add.s32 %r6420, %r6419, 1700485571; - shf.l.wrap.b32 %r6421, %r6420, %r6420, 6; - add.s32 %r6422, %r6421, %r6414; - not.b32 %r6423, %r6406; - or.b32 %r6424, %r6422, %r6423; - xor.b32 %r6425, %r6424, %r6414; - add.s32 %r6426, %r6006, %r6398; - add.s32 %r6427, %r6426, %r6425; - add.s32 %r6428, %r6427, -1894986606; - shf.l.wrap.b32 %r6429, %r6428, %r6428, 10; - add.s32 %r6430, %r6429, %r6422; - not.b32 %r6431, %r6414; - or.b32 %r6432, %r6430, %r6431; - xor.b32 %r6433, %r6432, %r6422; - add.s32 %r6434, %r6076, %r6406; - add.s32 %r6435, %r6434, %r6433; - add.s32 %r6436, %r6435, -1051523; - shf.l.wrap.b32 %r6437, %r6436, %r6436, 15; - add.s32 
%r6438, %r6437, %r6430; - not.b32 %r6439, %r6422; - or.b32 %r6440, %r6438, %r6439; - xor.b32 %r6441, %r6440, %r6430; - add.s32 %r6442, %r5986, %r6414; - add.s32 %r6443, %r6442, %r6441; - add.s32 %r6444, %r6443, -2054922799; - shf.l.wrap.b32 %r6445, %r6444, %r6444, 21; - add.s32 %r6446, %r6445, %r6438; - not.b32 %r6447, %r6430; - or.b32 %r6448, %r6446, %r6447; - xor.b32 %r6449, %r6448, %r6438; - add.s32 %r6450, %r6056, %r6422; - add.s32 %r6451, %r6450, %r6449; - add.s32 %r6452, %r6451, 1873313359; - shf.l.wrap.b32 %r6453, %r6452, %r6452, 6; - add.s32 %r6454, %r6453, %r6446; - not.b32 %r6455, %r6438; - or.b32 %r6456, %r6454, %r6455; - xor.b32 %r6457, %r6456, %r6446; - add.s32 %r6458, %r5971, %r6430; - add.s32 %r6459, %r6458, %r6457; - add.s32 %r6460, %r6459, -30611744; - shf.l.wrap.b32 %r6461, %r6460, %r6460, 10; - add.s32 %r6462, %r6461, %r6454; - not.b32 %r6463, %r6446; - or.b32 %r6464, %r6462, %r6463; - xor.b32 %r6465, %r6464, %r6454; - add.s32 %r6466, %r6036, %r6438; - add.s32 %r6467, %r6466, %r6465; - add.s32 %r6468, %r6467, -1560198380; - shf.l.wrap.b32 %r6469, %r6468, %r6468, 15; - add.s32 %r6470, %r6469, %r6462; - not.b32 %r6471, %r6454; - or.b32 %r6472, %r6470, %r6471; - xor.b32 %r6473, %r6472, %r6462; - add.s32 %r6474, %r6106, %r6446; - add.s32 %r6475, %r6474, %r6473; - add.s32 %r6476, %r6475, 1309151649; - shf.l.wrap.b32 %r6477, %r6476, %r6476, 21; - add.s32 %r6478, %r6477, %r6470; - not.b32 %r6479, %r6462; - or.b32 %r6480, %r6478, %r6479; - xor.b32 %r6481, %r6480, %r6470; - add.s32 %r6482, %r6016, %r6454; - add.s32 %r6483, %r6482, %r6481; - add.s32 %r6484, %r6483, -145523070; - shf.l.wrap.b32 %r6485, %r6484, %r6484, 6; - add.s32 %r6486, %r6485, %r6478; - not.b32 %r6487, %r6470; - or.b32 %r6488, %r6486, %r6487; - xor.b32 %r6489, %r6488, %r6478; - add.s32 %r6490, %r6086, %r6462; - add.s32 %r6491, %r6490, %r6489; - add.s32 %r6492, %r6491, -1120210379; - shf.l.wrap.b32 %r6493, %r6492, %r6492, 10; - add.s32 %r6494, %r6493, %r6486; - not.b32 %r6495, %r6478; - 
or.b32 %r6496, %r6494, %r6495; - xor.b32 %r6497, %r6496, %r6486; - add.s32 %r6498, %r5996, %r6470; - add.s32 %r6499, %r6498, %r6497; - add.s32 %r6500, %r6499, 718787259; - shf.l.wrap.b32 %r6501, %r6500, %r6500, 15; - add.s32 %r6502, %r6501, %r6494; - not.b32 %r6503, %r6486; - or.b32 %r6504, %r6502, %r6503; - xor.b32 %r6505, %r6504, %r6494; - add.s32 %r6506, %r6066, %r6478; - add.s32 %r6507, %r6506, %r6505; - add.s32 %r6508, %r6507, -343485551; - shf.l.wrap.b32 %r6509, %r6508, %r6508, 21; - add.s32 %r9108, %r6486, %r9108; - add.s32 %r6510, %r6502, %r9107; - add.s32 %r9107, %r6510, %r6509; - add.s32 %r9106, %r6502, %r9106; - add.s32 %r9105, %r6494, %r9105; - setp.ne.s64 %p274, %rd4258, %rd854; - add.s64 %rd4261, %rd4261, 64; - @%p274 bra $L__BB1_360; - - cvt.u32.u16 %r9084, %rs3528; - and.b32 %r9083, %r9084, 255; - mul.wide.u32 %rd4027, %r9083, 8; - add.u64 %rd4262, %SPL, 504; - mov.u16 %rs4342, 0; - st.local.u8 [%rd4262], %rs4342; - st.local.u8 [%rd4262+1], %rs4342; - st.local.u8 [%rd4262+2], %rs4342; - st.local.u8 [%rd4262+3], %rs4342; - st.local.u8 [%rd4262+4], %rs4342; - st.local.u8 [%rd4262+5], %rs4342; - st.local.u8 [%rd4262+6], %rs4342; - st.local.u8 [%rd4262+7], %rs4342; - st.local.u8 [%rd4262+8], %rs4342; - st.local.u8 [%rd4262+9], %rs4342; - st.local.u8 [%rd4262+10], %rs4342; - st.local.u8 [%rd4262+11], %rs4342; - st.local.u8 [%rd4262+12], %rs4342; - st.local.u8 [%rd4262+13], %rs4342; - st.local.u8 [%rd4262+14], %rs4342; - st.local.u8 [%rd4262+15], %rs4342; - st.local.u8 [%rd4262+16], %rs4342; - st.local.u8 [%rd4262+17], %rs4342; - st.local.u8 [%rd4262+18], %rs4342; - st.local.u8 [%rd4262+19], %rs4342; - st.local.u8 [%rd4262+20], %rs4342; - st.local.u8 [%rd4262+21], %rs4342; - st.local.u8 [%rd4262+22], %rs4342; - st.local.u8 [%rd4262+23], %rs4342; - st.local.u8 [%rd4262+24], %rs4342; - st.local.u8 [%rd4262+25], %rs4342; - st.local.u8 [%rd4262+26], %rs4342; - st.local.u8 [%rd4262+27], %rs4342; - st.local.u8 [%rd4262+28], %rs4342; - st.local.u8 [%rd4262+29], 
%rs4342; - st.local.u8 [%rd4262+30], %rs4342; - st.local.u8 [%rd4262+31], %rs4342; - st.local.u8 [%rd4262+32], %rs4342; - st.local.u8 [%rd4262+33], %rs4342; - st.local.u8 [%rd4262+34], %rs4342; - st.local.u8 [%rd4262+35], %rs4342; - st.local.u8 [%rd4262+36], %rs4342; - st.local.u8 [%rd4262+37], %rs4342; - st.local.u8 [%rd4262+38], %rs4342; - st.local.u8 [%rd4262+39], %rs4342; - st.local.u8 [%rd4262+40], %rs4342; - st.local.u8 [%rd4262+41], %rs4342; - st.local.u8 [%rd4262+42], %rs4342; - st.local.u8 [%rd4262+43], %rs4342; - st.local.u8 [%rd4262+44], %rs4342; - st.local.u8 [%rd4262+45], %rs4342; - st.local.u8 [%rd4262+46], %rs4342; - st.local.u8 [%rd4262+47], %rs4342; - st.local.u8 [%rd4262+48], %rs4342; - st.local.u8 [%rd4262+49], %rs4342; - st.local.u8 [%rd4262+50], %rs4342; - st.local.u8 [%rd4262+51], %rs4342; - st.local.u8 [%rd4262+52], %rs4342; - st.local.u8 [%rd4262+53], %rs4342; - st.local.u8 [%rd4262+54], %rs4342; - st.local.u8 [%rd4262+55], %rs4342; - shr.u64 %rd3663, %rd4027, 56; - st.local.u8 [%rd4262+63], %rd3663; - shr.u64 %rd3664, %rd4027, 48; - st.local.u8 [%rd4262+62], %rd3664; - shr.u64 %rd3665, %rd4027, 40; - st.local.u8 [%rd4262+61], %rd3665; - shr.u64 %rd3666, %rd4027, 32; - st.local.u8 [%rd4262+60], %rd3666; - shr.u64 %rd3667, %rd4027, 24; - st.local.u8 [%rd4262+59], %rd3667; - shr.u64 %rd3668, %rd4027, 16; - st.local.u8 [%rd4262+58], %rd3668; - shr.u64 %rd3669, %rd4027, 8; - st.local.u8 [%rd4262+57], %rd3669; - st.local.u8 [%rd4262+56], %rd4027; - add.s64 %rd882, %rd4262, 64; - mov.u64 %rd4263, %rd4262; - -$L__BB1_379: - ld.local.u8 %rd3670, [%rd4263]; - ld.local.u8 %rd3671, [%rd4263+1]; - bfi.b64 %rd3672, %rd3671, %rd3670, 8, 8; - ld.local.u8 %rd3673, [%rd4263+2]; - ld.local.u8 %rd3674, [%rd4263+3]; - bfi.b64 %rd3675, %rd3674, %rd3673, 8, 56; - bfi.b64 %rd3676, %rd3675, %rd3672, 16, 48; - shl.b64 %rd3677, %rd3676, 8; - mov.b64 {%r6511, %r6512}, %rd3677; - mov.b32 {%rs952, %rs3706}, %r6512; - mov.b32 {%rs948, %rs950}, %r6511; - shr.u16 %rs951, 
%rs950, 8; - shr.u16 %rs949, %rs948, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3678, [%rd4263+4]; - ld.local.u8 %rd3679, [%rd4263+5]; - bfi.b64 %rd3680, %rd3679, %rd3678, 8, 8; - ld.local.u8 %rd3681, [%rd4263+6]; - ld.local.u8 %rd3682, [%rd4263+7]; - bfi.b64 %rd3683, %rd3682, %rd3681, 8, 56; - bfi.b64 %rd3684, %rd3683, %rd3680, 16, 48; - shl.b64 %rd3685, %rd3684, 8; - mov.b64 {%r6513, %r6514}, %rd3685; - mov.b32 {%rs957, %rs3707}, %r6514; - mov.b32 {%rs953, %rs955}, %r6513; - shr.u16 %rs956, %rs955, 8; - shr.u16 %rs954, %rs953, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3686, [%rd4263+8]; - ld.local.u8 %rd3687, [%rd4263+9]; - bfi.b64 %rd3688, %rd3687, %rd3686, 8, 8; - ld.local.u8 %rd3689, [%rd4263+10]; - ld.local.u8 %rd3690, [%rd4263+11]; - bfi.b64 %rd3691, %rd3690, %rd3689, 8, 56; - bfi.b64 %rd3692, %rd3691, %rd3688, 16, 48; - shl.b64 %rd3693, %rd3692, 8; - mov.b64 {%r6515, %r6516}, %rd3693; - mov.b32 {%rs962, %rs3708}, %r6516; - mov.b32 {%rs958, %rs960}, %r6515; - shr.u16 %rs961, %rs960, 8; - shr.u16 %rs959, %rs958, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3694, [%rd4263+12]; - ld.local.u8 %rd3695, [%rd4263+13]; - bfi.b64 %rd3696, %rd3695, %rd3694, 8, 8; - ld.local.u8 %rd3697, [%rd4263+14]; - ld.local.u8 %rd3698, [%rd4263+15]; - bfi.b64 %rd3699, %rd3698, %rd3697, 8, 56; - bfi.b64 %rd3700, %rd3699, %rd3696, 16, 48; - shl.b64 %rd3701, %rd3700, 8; - mov.b64 {%r6517, %r6518}, %rd3701; - mov.b32 {%rs967, %rs3709}, %r6518; - mov.b32 {%rs963, %rs965}, %r6517; - shr.u16 %rs966, %rs965, 8; - shr.u16 %rs964, %rs963, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3702, [%rd4263+16]; - ld.local.u8 %rd3703, [%rd4263+17]; - bfi.b64 %rd3704, %rd3703, %rd3702, 8, 8; - ld.local.u8 %rd3705, [%rd4263+18]; - ld.local.u8 %rd3706, [%rd4263+19]; - bfi.b64 %rd3707, %rd3706, %rd3705, 8, 56; - bfi.b64 %rd3708, %rd3707, %rd3704, 16, 48; - shl.b64 %rd3709, %rd3708, 8; - mov.b64 {%r6519, %r6520}, %rd3709; - mov.b32 {%rs972, %rs3710}, %r6520; - mov.b32 {%rs968, %rs970}, 
%r6519; - shr.u16 %rs971, %rs970, 8; - shr.u16 %rs969, %rs968, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3710, [%rd4263+20]; - ld.local.u8 %rd3711, [%rd4263+21]; - bfi.b64 %rd3712, %rd3711, %rd3710, 8, 8; - ld.local.u8 %rd3713, [%rd4263+22]; - ld.local.u8 %rd3714, [%rd4263+23]; - bfi.b64 %rd3715, %rd3714, %rd3713, 8, 56; - bfi.b64 %rd3716, %rd3715, %rd3712, 16, 48; - shl.b64 %rd3717, %rd3716, 8; - mov.b64 {%r6521, %r6522}, %rd3717; - mov.b32 {%rs977, %rs3711}, %r6522; - mov.b32 {%rs973, %rs975}, %r6521; - shr.u16 %rs976, %rs975, 8; - shr.u16 %rs974, %rs973, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3718, [%rd4263+24]; - ld.local.u8 %rd3719, [%rd4263+25]; - bfi.b64 %rd3720, %rd3719, %rd3718, 8, 8; - ld.local.u8 %rd3721, [%rd4263+26]; - ld.local.u8 %rd3722, [%rd4263+27]; - bfi.b64 %rd3723, %rd3722, %rd3721, 8, 56; - bfi.b64 %rd3724, %rd3723, %rd3720, 16, 48; - shl.b64 %rd3725, %rd3724, 8; - mov.b64 {%r6523, %r6524}, %rd3725; - mov.b32 {%rs982, %rs3712}, %r6524; - mov.b32 {%rs978, %rs980}, %r6523; - shr.u16 %rs981, %rs980, 8; - shr.u16 %rs979, %rs978, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3726, [%rd4263+28]; - ld.local.u8 %rd3727, [%rd4263+29]; - bfi.b64 %rd3728, %rd3727, %rd3726, 8, 8; - ld.local.u8 %rd3729, [%rd4263+30]; - ld.local.u8 %rd3730, [%rd4263+31]; - bfi.b64 %rd3731, %rd3730, %rd3729, 8, 56; - bfi.b64 %rd3732, %rd3731, %rd3728, 16, 48; - shl.b64 %rd3733, %rd3732, 8; - mov.b64 {%r6525, %r6526}, %rd3733; - mov.b32 {%rs987, %rs3713}, %r6526; - mov.b32 {%rs983, %rs985}, %r6525; - shr.u16 %rs986, %rs985, 8; - shr.u16 %rs984, %rs983, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3734, [%rd4263+32]; - ld.local.u8 %rd3735, [%rd4263+33]; - bfi.b64 %rd3736, %rd3735, %rd3734, 8, 8; - ld.local.u8 %rd3737, [%rd4263+34]; - ld.local.u8 %rd3738, [%rd4263+35]; - bfi.b64 %rd3739, %rd3738, %rd3737, 8, 56; - bfi.b64 %rd3740, %rd3739, %rd3736, 16, 48; - shl.b64 %rd3741, %rd3740, 8; - mov.b64 {%r6527, %r6528}, %rd3741; - mov.b32 {%rs992, %rs3714}, %r6528; 
- mov.b32 {%rs988, %rs990}, %r6527; - shr.u16 %rs991, %rs990, 8; - shr.u16 %rs989, %rs988, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3742, [%rd4263+36]; - ld.local.u8 %rd3743, [%rd4263+37]; - bfi.b64 %rd3744, %rd3743, %rd3742, 8, 8; - ld.local.u8 %rd3745, [%rd4263+38]; - ld.local.u8 %rd3746, [%rd4263+39]; - bfi.b64 %rd3747, %rd3746, %rd3745, 8, 56; - bfi.b64 %rd3748, %rd3747, %rd3744, 16, 48; - shl.b64 %rd3749, %rd3748, 8; - mov.b64 {%r6529, %r6530}, %rd3749; - mov.b32 {%rs997, %rs3715}, %r6530; - mov.b32 {%rs993, %rs995}, %r6529; - shr.u16 %rs996, %rs995, 8; - shr.u16 %rs994, %rs993, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3750, [%rd4263+40]; - ld.local.u8 %rd3751, [%rd4263+41]; - bfi.b64 %rd3752, %rd3751, %rd3750, 8, 8; - ld.local.u8 %rd3753, [%rd4263+42]; - ld.local.u8 %rd3754, [%rd4263+43]; - bfi.b64 %rd3755, %rd3754, %rd3753, 8, 56; - bfi.b64 %rd3756, %rd3755, %rd3752, 16, 48; - shl.b64 %rd3757, %rd3756, 8; - mov.b64 {%r6531, %r6532}, %rd3757; - mov.b32 {%rs1002, %rs3716}, %r6532; - mov.b32 {%rs998, %rs1000}, %r6531; - shr.u16 %rs1001, %rs1000, 8; - shr.u16 %rs999, %rs998, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3758, [%rd4263+44]; - ld.local.u8 %rd3759, [%rd4263+45]; - bfi.b64 %rd3760, %rd3759, %rd3758, 8, 8; - ld.local.u8 %rd3761, [%rd4263+46]; - ld.local.u8 %rd3762, [%rd4263+47]; - bfi.b64 %rd3763, %rd3762, %rd3761, 8, 56; - bfi.b64 %rd3764, %rd3763, %rd3760, 16, 48; - shl.b64 %rd3765, %rd3764, 8; - mov.b64 {%r6533, %r6534}, %rd3765; - mov.b32 {%rs1007, %rs3717}, %r6534; - mov.b32 {%rs1003, %rs1005}, %r6533; - shr.u16 %rs1006, %rs1005, 8; - shr.u16 %rs1004, %rs1003, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3766, [%rd4263+48]; - ld.local.u8 %rd3767, [%rd4263+49]; - bfi.b64 %rd3768, %rd3767, %rd3766, 8, 8; - ld.local.u8 %rd3769, [%rd4263+50]; - ld.local.u8 %rd3770, [%rd4263+51]; - bfi.b64 %rd3771, %rd3770, %rd3769, 8, 56; - bfi.b64 %rd3772, %rd3771, %rd3768, 16, 48; - shl.b64 %rd3773, %rd3772, 8; - mov.b64 {%r6535, %r6536}, 
%rd3773; - mov.b32 {%rs1012, %rs3718}, %r6536; - mov.b32 {%rs1008, %rs1010}, %r6535; - shr.u16 %rs1011, %rs1010, 8; - shr.u16 %rs1009, %rs1008, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3774, [%rd4263+52]; - ld.local.u8 %rd3775, [%rd4263+53]; - bfi.b64 %rd3776, %rd3775, %rd3774, 8, 8; - ld.local.u8 %rd3777, [%rd4263+54]; - ld.local.u8 %rd3778, [%rd4263+55]; - bfi.b64 %rd3779, %rd3778, %rd3777, 8, 56; - bfi.b64 %rd3780, %rd3779, %rd3776, 16, 48; - shl.b64 %rd3781, %rd3780, 8; - mov.b64 {%r6537, %r6538}, %rd3781; - mov.b32 {%rs1017, %rs3719}, %r6538; - mov.b32 {%rs1013, %rs1015}, %r6537; - shr.u16 %rs1016, %rs1015, 8; - shr.u16 %rs1014, %rs1013, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3782, [%rd4263+56]; - ld.local.u8 %rd3783, [%rd4263+57]; - bfi.b64 %rd3784, %rd3783, %rd3782, 8, 8; - ld.local.u8 %rd3785, [%rd4263+58]; - ld.local.u8 %rd3786, [%rd4263+59]; - bfi.b64 %rd3787, %rd3786, %rd3785, 8, 56; - bfi.b64 %rd3788, %rd3787, %rd3784, 16, 48; - shl.b64 %rd3789, %rd3788, 8; - mov.b64 {%r6539, %r6540}, %rd3789; - mov.b32 {%rs1022, %rs3720}, %r6540; - mov.b32 {%rs1018, %rs1020}, %r6539; - shr.u16 %rs1021, %rs1020, 8; - shr.u16 %rs1019, %rs1018, 8; - @%p258 bra $L__BB1_395; - - ld.local.u8 %rd3790, [%rd4263+60]; - ld.local.u8 %rd3791, [%rd4263+61]; - bfi.b64 %rd3792, %rd3791, %rd3790, 8, 8; - ld.local.u8 %rd3793, [%rd4263+62]; - ld.local.u8 %rd3794, [%rd4263+63]; - bfi.b64 %rd3795, %rd3794, %rd3793, 8, 56; - bfi.b64 %rd3796, %rd3795, %rd3792, 16, 48; - shl.b64 %rd3797, %rd3796, 8; - mov.b64 {%r6541, %r6542}, %rd3797; - mov.b32 {%rs1027, %rs3721}, %r6542; - mov.b32 {%rs1023, %rs1025}, %r6541; - shr.u16 %rs1026, %rs1025, 8; - shr.u16 %rs1024, %rs1023, 8; - @%p273 bra $L__BB1_396; - bra.uni $L__BB1_395; - -$L__BB1_396: - add.s64 %rd4262, %rd4262, 64; - shl.b16 %rs3722, %rs1020, 8; - or.b16 %rs3723, %rs1019, %rs3722; - shl.b16 %rs3724, %rs1022, 8; - or.b16 %rs3725, %rs1021, %rs3724; - shl.b16 %rs3726, %rs1025, 8; - or.b16 %rs3727, %rs1024, %rs3726; - shl.b16 
%rs3728, %rs1027, 8; - or.b16 %rs3729, %rs1026, %rs3728; - mov.b32 %r6543, {%rs3727, %rs3729}; - not.b32 %r6544, %r9107; - and.b32 %r6545, %r9105, %r6544; - and.b32 %r6546, %r9106, %r9107; - or.b32 %r6547, %r6545, %r6546; - add.s32 %r6548, %r9108, %r6547; - shl.b16 %rs3730, %rs950, 8; - or.b16 %rs3731, %rs949, %rs3730; - shl.b16 %rs3732, %rs952, 8; - or.b16 %rs3733, %rs951, %rs3732; - mov.b32 %r6549, {%rs3731, %rs3733}; - add.s32 %r6550, %r6548, %r6549; - add.s32 %r6551, %r6550, -680876936; - shf.l.wrap.b32 %r6552, %r6551, %r6551, 7; - add.s32 %r6553, %r6552, %r9107; - and.b32 %r6554, %r6553, %r9107; - not.b32 %r6555, %r6553; - and.b32 %r6556, %r9106, %r6555; - or.b32 %r6557, %r6556, %r6554; - shl.b16 %rs3734, %rs955, 8; - or.b16 %rs3735, %rs954, %rs3734; - shl.b16 %rs3736, %rs957, 8; - or.b16 %rs3737, %rs956, %rs3736; - mov.b32 %r6558, {%rs3735, %rs3737}; - add.s32 %r6559, %r9105, %r6558; - add.s32 %r6560, %r6559, %r6557; - add.s32 %r6561, %r6560, -389564586; - shf.l.wrap.b32 %r6562, %r6561, %r6561, 12; - add.s32 %r6563, %r6562, %r6553; - and.b32 %r6564, %r6563, %r6553; - not.b32 %r6565, %r6563; - and.b32 %r6566, %r9107, %r6565; - or.b32 %r6567, %r6566, %r6564; - shl.b16 %rs3738, %rs960, 8; - or.b16 %rs3739, %rs959, %rs3738; - shl.b16 %rs3740, %rs962, 8; - or.b16 %rs3741, %rs961, %rs3740; - mov.b32 %r6568, {%rs3739, %rs3741}; - add.s32 %r6569, %r9106, %r6568; - add.s32 %r6570, %r6569, %r6567; - add.s32 %r6571, %r6570, 606105819; - shf.l.wrap.b32 %r6572, %r6571, %r6571, 17; - add.s32 %r6573, %r6572, %r6563; - and.b32 %r6574, %r6573, %r6563; - not.b32 %r6575, %r6573; - and.b32 %r6576, %r6553, %r6575; - or.b32 %r6577, %r6576, %r6574; - shl.b16 %rs3742, %rs965, 8; - or.b16 %rs3743, %rs964, %rs3742; - shl.b16 %rs3744, %rs967, 8; - or.b16 %rs3745, %rs966, %rs3744; - mov.b32 %r6578, {%rs3743, %rs3745}; - add.s32 %r6579, %r9107, %r6578; - add.s32 %r6580, %r6579, %r6577; - add.s32 %r6581, %r6580, -1044525330; - shf.l.wrap.b32 %r6582, %r6581, %r6581, 22; - add.s32 %r6583, 
%r6582, %r6573; - and.b32 %r6584, %r6583, %r6573; - not.b32 %r6585, %r6583; - and.b32 %r6586, %r6563, %r6585; - or.b32 %r6587, %r6586, %r6584; - shl.b16 %rs3746, %rs970, 8; - or.b16 %rs3747, %rs969, %rs3746; - shl.b16 %rs3748, %rs972, 8; - or.b16 %rs3749, %rs971, %rs3748; - mov.b32 %r6588, {%rs3747, %rs3749}; - add.s32 %r6589, %r6553, %r6588; - add.s32 %r6590, %r6589, %r6587; - add.s32 %r6591, %r6590, -176418897; - shf.l.wrap.b32 %r6592, %r6591, %r6591, 7; - add.s32 %r6593, %r6592, %r6583; - and.b32 %r6594, %r6593, %r6583; - not.b32 %r6595, %r6593; - and.b32 %r6596, %r6573, %r6595; - or.b32 %r6597, %r6596, %r6594; - shl.b16 %rs3750, %rs975, 8; - or.b16 %rs3751, %rs974, %rs3750; - shl.b16 %rs3752, %rs977, 8; - or.b16 %rs3753, %rs976, %rs3752; - mov.b32 %r6598, {%rs3751, %rs3753}; - add.s32 %r6599, %r6598, %r6563; - add.s32 %r6600, %r6599, %r6597; - add.s32 %r6601, %r6600, 1200080426; - shf.l.wrap.b32 %r6602, %r6601, %r6601, 12; - add.s32 %r6603, %r6602, %r6593; - and.b32 %r6604, %r6603, %r6593; - not.b32 %r6605, %r6603; - and.b32 %r6606, %r6583, %r6605; - or.b32 %r6607, %r6606, %r6604; - shl.b16 %rs3754, %rs980, 8; - or.b16 %rs3755, %rs979, %rs3754; - shl.b16 %rs3756, %rs982, 8; - or.b16 %rs3757, %rs981, %rs3756; - mov.b32 %r6608, {%rs3755, %rs3757}; - add.s32 %r6609, %r6608, %r6573; - add.s32 %r6610, %r6609, %r6607; - add.s32 %r6611, %r6610, -1473231341; - shf.l.wrap.b32 %r6612, %r6611, %r6611, 17; - add.s32 %r6613, %r6612, %r6603; - and.b32 %r6614, %r6613, %r6603; - not.b32 %r6615, %r6613; - and.b32 %r6616, %r6593, %r6615; - or.b32 %r6617, %r6616, %r6614; - shl.b16 %rs3758, %rs985, 8; - or.b16 %rs3759, %rs984, %rs3758; - shl.b16 %rs3760, %rs987, 8; - or.b16 %rs3761, %rs986, %rs3760; - mov.b32 %r6618, {%rs3759, %rs3761}; - add.s32 %r6619, %r6618, %r6583; - add.s32 %r6620, %r6619, %r6617; - add.s32 %r6621, %r6620, -45705983; - shf.l.wrap.b32 %r6622, %r6621, %r6621, 22; - add.s32 %r6623, %r6622, %r6613; - and.b32 %r6624, %r6623, %r6613; - not.b32 %r6625, %r6623; - 
and.b32 %r6626, %r6603, %r6625; - or.b32 %r6627, %r6626, %r6624; - shl.b16 %rs3762, %rs990, 8; - or.b16 %rs3763, %rs989, %rs3762; - shl.b16 %rs3764, %rs992, 8; - or.b16 %rs3765, %rs991, %rs3764; - mov.b32 %r6628, {%rs3763, %rs3765}; - add.s32 %r6629, %r6628, %r6593; - add.s32 %r6630, %r6629, %r6627; - add.s32 %r6631, %r6630, 1770035416; - shf.l.wrap.b32 %r6632, %r6631, %r6631, 7; - add.s32 %r6633, %r6632, %r6623; - and.b32 %r6634, %r6633, %r6623; - not.b32 %r6635, %r6633; - and.b32 %r6636, %r6613, %r6635; - or.b32 %r6637, %r6636, %r6634; - shl.b16 %rs3766, %rs995, 8; - or.b16 %rs3767, %rs994, %rs3766; - shl.b16 %rs3768, %rs997, 8; - or.b16 %rs3769, %rs996, %rs3768; - mov.b32 %r6638, {%rs3767, %rs3769}; - add.s32 %r6639, %r6638, %r6603; - add.s32 %r6640, %r6639, %r6637; - add.s32 %r6641, %r6640, -1958414417; - shf.l.wrap.b32 %r6642, %r6641, %r6641, 12; - add.s32 %r6643, %r6642, %r6633; - and.b32 %r6644, %r6643, %r6633; - not.b32 %r6645, %r6643; - and.b32 %r6646, %r6623, %r6645; - or.b32 %r6647, %r6646, %r6644; - shl.b16 %rs3770, %rs1000, 8; - or.b16 %rs3771, %rs999, %rs3770; - shl.b16 %rs3772, %rs1002, 8; - or.b16 %rs3773, %rs1001, %rs3772; - mov.b32 %r6648, {%rs3771, %rs3773}; - add.s32 %r6649, %r6648, %r6613; - add.s32 %r6650, %r6649, %r6647; - add.s32 %r6651, %r6650, -42063; - shf.l.wrap.b32 %r6652, %r6651, %r6651, 17; - add.s32 %r6653, %r6652, %r6643; - and.b32 %r6654, %r6653, %r6643; - not.b32 %r6655, %r6653; - and.b32 %r6656, %r6633, %r6655; - or.b32 %r6657, %r6656, %r6654; - shl.b16 %rs3774, %rs1005, 8; - or.b16 %rs3775, %rs1004, %rs3774; - shl.b16 %rs3776, %rs1007, 8; - or.b16 %rs3777, %rs1006, %rs3776; - mov.b32 %r6658, {%rs3775, %rs3777}; - add.s32 %r6659, %r6658, %r6623; - add.s32 %r6660, %r6659, %r6657; - add.s32 %r6661, %r6660, -1990404162; - shf.l.wrap.b32 %r6662, %r6661, %r6661, 22; - add.s32 %r6663, %r6662, %r6653; - and.b32 %r6664, %r6663, %r6653; - not.b32 %r6665, %r6663; - and.b32 %r6666, %r6643, %r6665; - or.b32 %r6667, %r6666, %r6664; - shl.b16 
%rs3778, %rs1010, 8; - or.b16 %rs3779, %rs1009, %rs3778; - shl.b16 %rs3780, %rs1012, 8; - or.b16 %rs3781, %rs1011, %rs3780; - mov.b32 %r6668, {%rs3779, %rs3781}; - add.s32 %r6669, %r6668, %r6633; - add.s32 %r6670, %r6669, %r6667; - add.s32 %r6671, %r6670, 1804603682; - shf.l.wrap.b32 %r6672, %r6671, %r6671, 7; - add.s32 %r6673, %r6672, %r6663; - and.b32 %r6674, %r6673, %r6663; - not.b32 %r6675, %r6673; - and.b32 %r6676, %r6653, %r6675; - or.b32 %r6677, %r6676, %r6674; - shl.b16 %rs3782, %rs1015, 8; - or.b16 %rs3783, %rs1014, %rs3782; - shl.b16 %rs3784, %rs1017, 8; - or.b16 %rs3785, %rs1016, %rs3784; - mov.b32 %r6678, {%rs3783, %rs3785}; - add.s32 %r6679, %r6678, %r6643; - add.s32 %r6680, %r6679, %r6677; - add.s32 %r6681, %r6680, -40341101; - shf.l.wrap.b32 %r6682, %r6681, %r6681, 12; - add.s32 %r6683, %r6682, %r6673; - mov.b32 %r6684, {%rs3723, %rs3725}; - and.b32 %r6685, %r6683, %r6673; - not.b32 %r6686, %r6683; - and.b32 %r6687, %r6663, %r6686; - or.b32 %r6688, %r6687, %r6685; - add.s32 %r6689, %r6684, %r6653; - add.s32 %r6690, %r6689, %r6688; - add.s32 %r6691, %r6690, -1502002290; - shf.l.wrap.b32 %r6692, %r6691, %r6691, 17; - add.s32 %r6693, %r6692, %r6683; - and.b32 %r6694, %r6693, %r6683; - not.b32 %r6695, %r6693; - and.b32 %r6696, %r6673, %r6695; - or.b32 %r6697, %r6696, %r6694; - add.s32 %r6698, %r6543, %r6663; - add.s32 %r6699, %r6698, %r6697; - add.s32 %r6700, %r6699, 1236535329; - shf.l.wrap.b32 %r6701, %r6700, %r6700, 22; - add.s32 %r6702, %r6701, %r6693; - and.b32 %r6703, %r6702, %r6683; - and.b32 %r6704, %r6693, %r6686; - or.b32 %r6705, %r6703, %r6704; - add.s32 %r6706, %r6558, %r6673; - add.s32 %r6707, %r6706, %r6705; - add.s32 %r6708, %r6707, -165796510; - shf.l.wrap.b32 %r6709, %r6708, %r6708, 5; - add.s32 %r6710, %r6709, %r6702; - and.b32 %r6711, %r6710, %r6693; - and.b32 %r6712, %r6702, %r6695; - or.b32 %r6713, %r6711, %r6712; - add.s32 %r6714, %r6608, %r6683; - add.s32 %r6715, %r6714, %r6713; - add.s32 %r6716, %r6715, -1069501632; - 
shf.l.wrap.b32 %r6717, %r6716, %r6716, 9; - add.s32 %r6718, %r6717, %r6710; - and.b32 %r6719, %r6718, %r6702; - not.b32 %r6720, %r6702; - and.b32 %r6721, %r6710, %r6720; - or.b32 %r6722, %r6719, %r6721; - add.s32 %r6723, %r6658, %r6693; - add.s32 %r6724, %r6723, %r6722; - add.s32 %r6725, %r6724, 643717713; - shf.l.wrap.b32 %r6726, %r6725, %r6725, 14; - add.s32 %r6727, %r6726, %r6718; - and.b32 %r6728, %r6727, %r6710; - not.b32 %r6729, %r6710; - and.b32 %r6730, %r6718, %r6729; - or.b32 %r6731, %r6728, %r6730; - add.s32 %r6732, %r6549, %r6702; - add.s32 %r6733, %r6732, %r6731; - add.s32 %r6734, %r6733, -373897302; - shf.l.wrap.b32 %r6735, %r6734, %r6734, 20; - add.s32 %r6736, %r6735, %r6727; - and.b32 %r6737, %r6736, %r6718; - not.b32 %r6738, %r6718; - and.b32 %r6739, %r6727, %r6738; - or.b32 %r6740, %r6737, %r6739; - add.s32 %r6741, %r6598, %r6710; - add.s32 %r6742, %r6741, %r6740; - add.s32 %r6743, %r6742, -701558691; - shf.l.wrap.b32 %r6744, %r6743, %r6743, 5; - add.s32 %r6745, %r6744, %r6736; - and.b32 %r6746, %r6745, %r6727; - not.b32 %r6747, %r6727; - and.b32 %r6748, %r6736, %r6747; - or.b32 %r6749, %r6746, %r6748; - add.s32 %r6750, %r6648, %r6718; - add.s32 %r6751, %r6750, %r6749; - add.s32 %r6752, %r6751, 38016083; - shf.l.wrap.b32 %r6753, %r6752, %r6752, 9; - add.s32 %r6754, %r6753, %r6745; - and.b32 %r6755, %r6754, %r6736; - not.b32 %r6756, %r6736; - and.b32 %r6757, %r6745, %r6756; - or.b32 %r6758, %r6755, %r6757; - add.s32 %r6759, %r6543, %r6727; - add.s32 %r6760, %r6759, %r6758; - add.s32 %r6761, %r6760, -660478335; - shf.l.wrap.b32 %r6762, %r6761, %r6761, 14; - add.s32 %r6763, %r6762, %r6754; - and.b32 %r6764, %r6763, %r6745; - not.b32 %r6765, %r6745; - and.b32 %r6766, %r6754, %r6765; - or.b32 %r6767, %r6764, %r6766; - add.s32 %r6768, %r6588, %r6736; - add.s32 %r6769, %r6768, %r6767; - add.s32 %r6770, %r6769, -405537848; - shf.l.wrap.b32 %r6771, %r6770, %r6770, 20; - add.s32 %r6772, %r6771, %r6763; - and.b32 %r6773, %r6772, %r6754; - not.b32 %r6774, 
%r6754; - and.b32 %r6775, %r6763, %r6774; - or.b32 %r6776, %r6773, %r6775; - add.s32 %r6777, %r6638, %r6745; - add.s32 %r6778, %r6777, %r6776; - add.s32 %r6779, %r6778, 568446438; - shf.l.wrap.b32 %r6780, %r6779, %r6779, 5; - add.s32 %r6781, %r6780, %r6772; - and.b32 %r6782, %r6781, %r6763; - not.b32 %r6783, %r6763; - and.b32 %r6784, %r6772, %r6783; - or.b32 %r6785, %r6782, %r6784; - add.s32 %r6786, %r6684, %r6754; - add.s32 %r6787, %r6786, %r6785; - add.s32 %r6788, %r6787, -1019803690; - shf.l.wrap.b32 %r6789, %r6788, %r6788, 9; - add.s32 %r6790, %r6789, %r6781; - and.b32 %r6791, %r6790, %r6772; - not.b32 %r6792, %r6772; - and.b32 %r6793, %r6781, %r6792; - or.b32 %r6794, %r6791, %r6793; - add.s32 %r6795, %r6578, %r6763; - add.s32 %r6796, %r6795, %r6794; - add.s32 %r6797, %r6796, -187363961; - shf.l.wrap.b32 %r6798, %r6797, %r6797, 14; - add.s32 %r6799, %r6798, %r6790; - and.b32 %r6800, %r6799, %r6781; - not.b32 %r6801, %r6781; - and.b32 %r6802, %r6790, %r6801; - or.b32 %r6803, %r6800, %r6802; - add.s32 %r6804, %r6628, %r6772; - add.s32 %r6805, %r6804, %r6803; - add.s32 %r6806, %r6805, 1163531501; - shf.l.wrap.b32 %r6807, %r6806, %r6806, 20; - add.s32 %r6808, %r6807, %r6799; - and.b32 %r6809, %r6808, %r6790; - not.b32 %r6810, %r6790; - and.b32 %r6811, %r6799, %r6810; - or.b32 %r6812, %r6809, %r6811; - add.s32 %r6813, %r6678, %r6781; - add.s32 %r6814, %r6813, %r6812; - add.s32 %r6815, %r6814, -1444681467; - shf.l.wrap.b32 %r6816, %r6815, %r6815, 5; - add.s32 %r6817, %r6816, %r6808; - and.b32 %r6818, %r6817, %r6799; - not.b32 %r6819, %r6799; - and.b32 %r6820, %r6808, %r6819; - or.b32 %r6821, %r6818, %r6820; - add.s32 %r6822, %r6568, %r6790; - add.s32 %r6823, %r6822, %r6821; - add.s32 %r6824, %r6823, -51403784; - shf.l.wrap.b32 %r6825, %r6824, %r6824, 9; - add.s32 %r6826, %r6825, %r6817; - and.b32 %r6827, %r6826, %r6808; - not.b32 %r6828, %r6808; - and.b32 %r6829, %r6817, %r6828; - or.b32 %r6830, %r6827, %r6829; - add.s32 %r6831, %r6618, %r6799; - add.s32 %r6832, 
%r6831, %r6830; - add.s32 %r6833, %r6832, 1735328473; - shf.l.wrap.b32 %r6834, %r6833, %r6833, 14; - add.s32 %r6835, %r6834, %r6826; - and.b32 %r6836, %r6835, %r6817; - not.b32 %r6837, %r6817; - and.b32 %r6838, %r6826, %r6837; - or.b32 %r6839, %r6836, %r6838; - add.s32 %r6840, %r6668, %r6808; - add.s32 %r6841, %r6840, %r6839; - add.s32 %r6842, %r6841, -1926607734; - shf.l.wrap.b32 %r6843, %r6842, %r6842, 20; - add.s32 %r6844, %r6843, %r6835; - xor.b32 %r6845, %r6844, %r6835; - xor.b32 %r6846, %r6845, %r6826; - add.s32 %r6847, %r6598, %r6817; - add.s32 %r6848, %r6847, %r6846; - add.s32 %r6849, %r6848, -378558; - shf.l.wrap.b32 %r6850, %r6849, %r6849, 4; - add.s32 %r6851, %r6850, %r6844; - xor.b32 %r6852, %r6851, %r6845; - add.s32 %r6853, %r6628, %r6826; - add.s32 %r6854, %r6853, %r6852; - add.s32 %r6855, %r6854, -2022574463; - shf.l.wrap.b32 %r6856, %r6855, %r6855, 11; - add.s32 %r6857, %r6856, %r6851; - xor.b32 %r6858, %r6857, %r6851; - xor.b32 %r6859, %r6858, %r6844; - add.s32 %r6860, %r6658, %r6835; - add.s32 %r6861, %r6860, %r6859; - add.s32 %r6862, %r6861, 1839030562; - shf.l.wrap.b32 %r6863, %r6862, %r6862, 16; - add.s32 %r6864, %r6863, %r6857; - xor.b32 %r6865, %r6864, %r6858; - add.s32 %r6866, %r6684, %r6844; - add.s32 %r6867, %r6866, %r6865; - add.s32 %r6868, %r6867, -35309556; - shf.l.wrap.b32 %r6869, %r6868, %r6868, 23; - add.s32 %r6870, %r6869, %r6864; - xor.b32 %r6871, %r6864, %r6857; - xor.b32 %r6872, %r6871, %r6870; - add.s32 %r6873, %r6558, %r6851; - add.s32 %r6874, %r6873, %r6872; - add.s32 %r6875, %r6874, -1530992060; - shf.l.wrap.b32 %r6876, %r6875, %r6875, 4; - add.s32 %r6877, %r6876, %r6870; - xor.b32 %r6878, %r6870, %r6864; - xor.b32 %r6879, %r6878, %r6877; - add.s32 %r6880, %r6588, %r6857; - add.s32 %r6881, %r6880, %r6879; - add.s32 %r6882, %r6881, 1272893353; - shf.l.wrap.b32 %r6883, %r6882, %r6882, 11; - add.s32 %r6884, %r6883, %r6877; - xor.b32 %r6885, %r6877, %r6870; - xor.b32 %r6886, %r6885, %r6884; - add.s32 %r6887, %r6618, %r6864; - 
add.s32 %r6888, %r6887, %r6886; - add.s32 %r6889, %r6888, -155497632; - shf.l.wrap.b32 %r6890, %r6889, %r6889, 16; - add.s32 %r6891, %r6890, %r6884; - xor.b32 %r6892, %r6884, %r6877; - xor.b32 %r6893, %r6892, %r6891; - add.s32 %r6894, %r6648, %r6870; - add.s32 %r6895, %r6894, %r6893; - add.s32 %r6896, %r6895, -1094730640; - shf.l.wrap.b32 %r6897, %r6896, %r6896, 23; - add.s32 %r6898, %r6897, %r6891; - xor.b32 %r6899, %r6891, %r6884; - xor.b32 %r6900, %r6899, %r6898; - add.s32 %r6901, %r6678, %r6877; - add.s32 %r6902, %r6901, %r6900; - add.s32 %r6903, %r6902, 681279174; - shf.l.wrap.b32 %r6904, %r6903, %r6903, 4; - add.s32 %r6905, %r6904, %r6898; - xor.b32 %r6906, %r6898, %r6891; - xor.b32 %r6907, %r6906, %r6905; - add.s32 %r6908, %r6549, %r6884; - add.s32 %r6909, %r6908, %r6907; - add.s32 %r6910, %r6909, -358537222; - shf.l.wrap.b32 %r6911, %r6910, %r6910, 11; - add.s32 %r6912, %r6911, %r6905; - xor.b32 %r6913, %r6905, %r6898; - xor.b32 %r6914, %r6913, %r6912; - add.s32 %r6915, %r6578, %r6891; - add.s32 %r6916, %r6915, %r6914; - add.s32 %r6917, %r6916, -722521979; - shf.l.wrap.b32 %r6918, %r6917, %r6917, 16; - add.s32 %r6919, %r6918, %r6912; - xor.b32 %r6920, %r6912, %r6905; - xor.b32 %r6921, %r6920, %r6919; - add.s32 %r6922, %r6608, %r6898; - add.s32 %r6923, %r6922, %r6921; - add.s32 %r6924, %r6923, 76029189; - shf.l.wrap.b32 %r6925, %r6924, %r6924, 23; - add.s32 %r6926, %r6925, %r6919; - xor.b32 %r6927, %r6919, %r6912; - xor.b32 %r6928, %r6927, %r6926; - add.s32 %r6929, %r6638, %r6905; - add.s32 %r6930, %r6929, %r6928; - add.s32 %r6931, %r6930, -640364487; - shf.l.wrap.b32 %r6932, %r6931, %r6931, 4; - add.s32 %r6933, %r6932, %r6926; - xor.b32 %r6934, %r6926, %r6919; - xor.b32 %r6935, %r6934, %r6933; - add.s32 %r6936, %r6668, %r6912; - add.s32 %r6937, %r6936, %r6935; - add.s32 %r6938, %r6937, -421815835; - shf.l.wrap.b32 %r6939, %r6938, %r6938, 11; - add.s32 %r6940, %r6939, %r6933; - xor.b32 %r6941, %r6933, %r6926; - xor.b32 %r6942, %r6941, %r6940; - add.s32 
%r6943, %r6543, %r6919; - add.s32 %r6944, %r6943, %r6942; - add.s32 %r6945, %r6944, 530742520; - shf.l.wrap.b32 %r6946, %r6945, %r6945, 16; - add.s32 %r6947, %r6946, %r6940; - xor.b32 %r6948, %r6940, %r6933; - xor.b32 %r6949, %r6948, %r6947; - add.s32 %r6950, %r6568, %r6926; - add.s32 %r6951, %r6950, %r6949; - add.s32 %r6952, %r6951, -995338651; - shf.l.wrap.b32 %r6953, %r6952, %r6952, 23; - add.s32 %r6954, %r6953, %r6947; - not.b32 %r6955, %r6940; - or.b32 %r6956, %r6954, %r6955; - xor.b32 %r6957, %r6956, %r6947; - add.s32 %r6958, %r6549, %r6933; - add.s32 %r6959, %r6958, %r6957; - add.s32 %r6960, %r6959, -198630844; - shf.l.wrap.b32 %r6961, %r6960, %r6960, 6; - add.s32 %r6962, %r6961, %r6954; - not.b32 %r6963, %r6947; - or.b32 %r6964, %r6962, %r6963; - xor.b32 %r6965, %r6964, %r6954; - add.s32 %r6966, %r6618, %r6940; - add.s32 %r6967, %r6966, %r6965; - add.s32 %r6968, %r6967, 1126891415; - shf.l.wrap.b32 %r6969, %r6968, %r6968, 10; - add.s32 %r6970, %r6969, %r6962; - not.b32 %r6971, %r6954; - or.b32 %r6972, %r6970, %r6971; - xor.b32 %r6973, %r6972, %r6962; - add.s32 %r6974, %r6684, %r6947; - add.s32 %r6975, %r6974, %r6973; - add.s32 %r6976, %r6975, -1416354905; - shf.l.wrap.b32 %r6977, %r6976, %r6976, 15; - add.s32 %r6978, %r6977, %r6970; - not.b32 %r6979, %r6962; - or.b32 %r6980, %r6978, %r6979; - xor.b32 %r6981, %r6980, %r6970; - add.s32 %r6982, %r6598, %r6954; - add.s32 %r6983, %r6982, %r6981; - add.s32 %r6984, %r6983, -57434055; - shf.l.wrap.b32 %r6985, %r6984, %r6984, 21; - add.s32 %r6986, %r6985, %r6978; - not.b32 %r6987, %r6970; - or.b32 %r6988, %r6986, %r6987; - xor.b32 %r6989, %r6988, %r6978; - add.s32 %r6990, %r6668, %r6962; - add.s32 %r6991, %r6990, %r6989; - add.s32 %r6992, %r6991, 1700485571; - shf.l.wrap.b32 %r6993, %r6992, %r6992, 6; - add.s32 %r6994, %r6993, %r6986; - not.b32 %r6995, %r6978; - or.b32 %r6996, %r6994, %r6995; - xor.b32 %r6997, %r6996, %r6986; - add.s32 %r6998, %r6578, %r6970; - add.s32 %r6999, %r6998, %r6997; - add.s32 %r7000, 
%r6999, -1894986606; - shf.l.wrap.b32 %r7001, %r7000, %r7000, 10; - add.s32 %r7002, %r7001, %r6994; - not.b32 %r7003, %r6986; - or.b32 %r7004, %r7002, %r7003; - xor.b32 %r7005, %r7004, %r6994; - add.s32 %r7006, %r6648, %r6978; - add.s32 %r7007, %r7006, %r7005; - add.s32 %r7008, %r7007, -1051523; - shf.l.wrap.b32 %r7009, %r7008, %r7008, 15; - add.s32 %r7010, %r7009, %r7002; - not.b32 %r7011, %r6994; - or.b32 %r7012, %r7010, %r7011; - xor.b32 %r7013, %r7012, %r7002; - add.s32 %r7014, %r6558, %r6986; - add.s32 %r7015, %r7014, %r7013; - add.s32 %r7016, %r7015, -2054922799; - shf.l.wrap.b32 %r7017, %r7016, %r7016, 21; - add.s32 %r7018, %r7017, %r7010; - not.b32 %r7019, %r7002; - or.b32 %r7020, %r7018, %r7019; - xor.b32 %r7021, %r7020, %r7010; - add.s32 %r7022, %r6628, %r6994; - add.s32 %r7023, %r7022, %r7021; - add.s32 %r7024, %r7023, 1873313359; - shf.l.wrap.b32 %r7025, %r7024, %r7024, 6; - add.s32 %r7026, %r7025, %r7018; - not.b32 %r7027, %r7010; - or.b32 %r7028, %r7026, %r7027; - xor.b32 %r7029, %r7028, %r7018; - add.s32 %r7030, %r6543, %r7002; - add.s32 %r7031, %r7030, %r7029; - add.s32 %r7032, %r7031, -30611744; - shf.l.wrap.b32 %r7033, %r7032, %r7032, 10; - add.s32 %r7034, %r7033, %r7026; - not.b32 %r7035, %r7018; - or.b32 %r7036, %r7034, %r7035; - xor.b32 %r7037, %r7036, %r7026; - add.s32 %r7038, %r6608, %r7010; - add.s32 %r7039, %r7038, %r7037; - add.s32 %r7040, %r7039, -1560198380; - shf.l.wrap.b32 %r7041, %r7040, %r7040, 15; - add.s32 %r7042, %r7041, %r7034; - not.b32 %r7043, %r7026; - or.b32 %r7044, %r7042, %r7043; - xor.b32 %r7045, %r7044, %r7034; - add.s32 %r7046, %r6678, %r7018; - add.s32 %r7047, %r7046, %r7045; - add.s32 %r7048, %r7047, 1309151649; - shf.l.wrap.b32 %r7049, %r7048, %r7048, 21; - add.s32 %r7050, %r7049, %r7042; - not.b32 %r7051, %r7034; - or.b32 %r7052, %r7050, %r7051; - xor.b32 %r7053, %r7052, %r7042; - add.s32 %r7054, %r6588, %r7026; - add.s32 %r7055, %r7054, %r7053; - add.s32 %r7056, %r7055, -145523070; - shf.l.wrap.b32 %r7057, %r7056, 
%r7056, 6; - add.s32 %r7058, %r7057, %r7050; - not.b32 %r7059, %r7042; - or.b32 %r7060, %r7058, %r7059; - xor.b32 %r7061, %r7060, %r7050; - add.s32 %r7062, %r6658, %r7034; - add.s32 %r7063, %r7062, %r7061; - add.s32 %r7064, %r7063, -1120210379; - shf.l.wrap.b32 %r7065, %r7064, %r7064, 10; - add.s32 %r7066, %r7065, %r7058; - not.b32 %r7067, %r7050; - or.b32 %r7068, %r7066, %r7067; - xor.b32 %r7069, %r7068, %r7058; - add.s32 %r7070, %r6568, %r7042; - add.s32 %r7071, %r7070, %r7069; - add.s32 %r7072, %r7071, 718787259; - shf.l.wrap.b32 %r7073, %r7072, %r7072, 15; - add.s32 %r7074, %r7073, %r7066; - not.b32 %r7075, %r7058; - or.b32 %r7076, %r7074, %r7075; - xor.b32 %r7077, %r7076, %r7066; - add.s32 %r7078, %r6638, %r7050; - add.s32 %r7079, %r7078, %r7077; - add.s32 %r7080, %r7079, -343485551; - shf.l.wrap.b32 %r7081, %r7080, %r7080, 21; - add.s32 %r9108, %r7058, %r9108; - add.s32 %r7082, %r7074, %r9107; - add.s32 %r9107, %r7082, %r7081; - add.s32 %r9106, %r7074, %r9106; - add.s32 %r9105, %r7066, %r9105; - setp.ne.s64 %p291, %rd4262, %rd882; - add.s64 %rd4263, %rd4263, 64; - @%p291 bra $L__BB1_379; - bra.uni $L__BB1_397; - -$L__BB1_399: - setp.gt.u16 %p292, %rs1, 10; - add.u64 %rd3798, %SP, 352; - add.u64 %rd888, %SPL, 352; - mov.u16 %rs3804, 0; - st.local.v4.u16 [%rd888], {%rs3804, %rs3804, %rs3804, %rs3804}; - add.s64 %rd3799, %rd3798, 8; - cvta.to.local.u64 %rd889, %rd3799; - st.local.v4.u16 [%rd889], {%rs3804, %rs3804, %rs3804, %rs3804}; - add.s64 %rd3800, %rd3798, 16; - cvta.to.local.u64 %rd890, %rd3800; - st.local.v4.u16 [%rd890], {%rs3804, %rs3804, %rs3804, %rs3804}; - add.s64 %rd3801, %rd3798, 24; - cvta.to.local.u64 %rd891, %rd3801; - st.local.v4.u16 [%rd891], {%rs3804, %rs3804, %rs3804, %rs3804}; - add.s64 %rd3802, %rd3798, 32; - cvta.to.local.u64 %rd892, %rd3802; - st.local.v4.u16 [%rd892], {%rs3804, %rs3804, %rs3804, %rs3804}; - add.s64 %rd3803, %rd3798, 40; - cvta.to.local.u64 %rd893, %rd3803; - st.local.v4.u16 [%rd893], {%rs3804, %rs3804, %rs3804, 
%rs3804}; - add.s64 %rd3804, %rd3798, 48; - cvta.to.local.u64 %rd894, %rd3804; - st.local.v4.u16 [%rd894], {%rs3804, %rs3804, %rs3804, %rs3804}; - add.s64 %rd3805, %rd3798, 56; - cvta.to.local.u64 %rd895, %rd3805; - st.local.v4.u16 [%rd895], {%rs3804, %rs3804, %rs3804, %rs3804}; - add.s64 %rd896, %rd3798, 64; - cvta.to.local.u64 %rd897, %rd896; - st.local.u8 [%rd897], %rs3804; - @%p292 bra $L__BB1_469; - - cvta.to.local.u64 %rd898, %rd978; - shr.u64 %rd899, %rd11, 1; - setp.eq.s64 %p293, %rd899, 0; - @%p293 bra $L__BB1_404; - - mov.u64 %rd4266, 1; - mov.u64 %rd4264, %rd898; - mov.u64 %rd4265, %rd888; - bra.uni $L__BB1_402; - -$L__BB1_403: - ld.local.u16 %rs2, [%rd4264+4]; - add.s64 %rd4266, %rd4266, 1; - add.s64 %rd4265, %rd4265, 2; - add.s64 %rd4264, %rd4264, 2; - -$L__BB1_402: - st.local.u16 [%rd4265], %rs2; - setp.ge.u64 %p294, %rd4266, %rd899; - @%p294 bra $L__BB1_404; - bra.uni $L__BB1_403; - -$L__BB1_404: - and.b64 %rd907, %rd11, 1; - setp.eq.s64 %p295, %rd907, 0; - @%p295 bra $L__BB1_407; - - and.b64 %rd3810, %rd11, 65534; - cvta.to.local.u64 %rd3812, %rd3798; - add.s64 %rd908, %rd3812, %rd3810; - add.s64 %rd3813, %rd898, %rd3810; - add.s64 %rd909, %rd3813, 2; - mov.u64 %rd4267, 0; - -$L__BB1_406: - add.s64 %rd3814, %rd909, %rd4267; - ld.local.u8 %rs3805, [%rd3814]; - add.s64 %rd3815, %rd908, %rd4267; - st.local.u8 [%rd3815], %rs3805; - add.s64 %rd4267, %rd4267, 1; - setp.lt.u64 %p296, %rd4267, %rd907; - @%p296 bra $L__BB1_406; - -$L__BB1_407: - mov.u64 %rd3816, 0; - st.local.u8 [%rd897], %rs1; - ld.local.v4.u16 {%rs3806, %rs3807, %rs3808, %rs3809}, [%rd888]; - ld.local.v4.u16 {%rs3814, %rs3815, %rs3816, %rs3817}, [%rd889]; - ld.local.v4.u16 {%rs3822, %rs3823, %rs3824, %rs3825}, [%rd890]; - ld.local.v4.u16 {%rs3830, %rs3831, %rs3832, %rs3833}, [%rd891]; - ld.local.v4.u16 {%rs3838, %rs3839, %rs3840, %rs3841}, [%rd892]; - ld.local.v4.u16 {%rs3846, %rs3847, %rs3848, %rs3849}, [%rd893]; - ld.local.v4.u16 {%rs3854, %rs3855, %rs3856, %rs3857}, [%rd894]; - 
ld.local.v4.u16 {%rs3862, %rs3863, %rs3864, %rs3865}, [%rd895]; - shr.u16 %rs3868, %rs3863, 8; - ld.local.v4.u16 {%rs3869, %rs3870, %rs3871, %rs3872}, [%rd897]; - and.b16 %rs3873, %rs3869, 255; - shr.u16 %rs3875, %rs3870, 8; - shr.u16 %rs3878, %rs3872, 8; - st.local.u64 [%rd1], %rd3816; - mov.u32 %r9124, -271733879; - mov.u32 %r7096, 1732584193; - st.local.v2.u32 [%rd1+8], {%r7096, %r9124}; - mov.u32 %r9121, 271733878; - mov.u32 %r9123, -1732584194; - st.local.v2.u32 [%rd1+16], {%r9123, %r9121}; - st.local.v4.u16 [%rd1+24], {%rs3806, %rs3807, %rs3808, %rs3809}; - st.local.v4.u16 [%rd1+32], {%rs3814, %rs3815, %rs3816, %rs3817}; - st.local.v4.u16 [%rd1+40], {%rs3822, %rs3823, %rs3824, %rs3825}; - st.local.v4.u16 [%rd1+48], {%rs3830, %rs3831, %rs3832, %rs3833}; - st.local.v4.u16 [%rd1+56], {%rs3838, %rs3839, %rs3840, %rs3841}; - st.local.v4.u16 [%rd1+64], {%rs3846, %rs3847, %rs3848, %rs3849}; - st.local.v4.u16 [%rd1+72], {%rs3854, %rs3855, %rs3856, %rs3857}; - st.local.u16 [%rd1+80], %rs3862; - st.local.u8 [%rd1+82], %rs3863; - st.local.u8 [%rd1+83], %rs3868; - st.local.v2.u16 [%rd1+84], {%rs3864, %rs3865}; - st.local.u16 [%rd1+88], %rs3869; - st.local.u8 [%rd1+90], %rs3870; - st.local.u8 [%rd1+91], %rs3875; - st.local.u16 [%rd1+92], %rs3871; - st.local.u8 [%rd1+94], %rs3872; - st.local.u8 [%rd1+95], %rs3878; - cvt.u64.u16 %rd3818, %rs3869; - and.b64 %rd913, %rd3818, 255; - cvt.u32.u16 %r7099, %rs3869; - and.b32 %r7100, %r7099, 255; - mul.wide.u32 %rd914, %r7100, 8; - setp.lt.u16 %p297, %rs3873, 64; - @%p297 bra $L__BB1_409; - bra.uni $L__BB1_408; - -$L__BB1_409: - add.s64 %rd3819, %rd1, %rd913; - mov.u16 %rs3881, 128; - st.local.u8 [%rd3819+24], %rs3881; - add.s64 %rd915, %rd913, 1; - setp.eq.s64 %p298, %rd915, 64; - @%p298 bra $L__BB1_416; - - add.s64 %rd3820, %rd1, %rd915; - add.s64 %rd4272, %rd3820, 24; - mov.u16 %rs3882, 3; - sub.s16 %rs3883, %rs3882, %rs3869; - and.b16 %rs1031, %rs3883, 3; - setp.eq.s16 %p299, %rs1031, 0; - @%p299 bra $L__BB1_413; - - 
cvt.u64.u16 %rd3821, %rs1031; - neg.s64 %rd4268, %rd3821; - mov.u64 %rd4269, %rd4272; - -$L__BB1_412: - .pragma "nounroll"; - add.s64 %rd4272, %rd4269, 1; - st.local.u8 [%rd4269], %rs3804; - add.s64 %rd4268, %rd4268, 1; - setp.ne.s64 %p300, %rd4268, 0; - mov.u64 %rd4269, %rd4272; - @%p300 bra $L__BB1_412; - -$L__BB1_413: - mov.u64 %rd3822, 62; - sub.s64 %rd3823, %rd3822, %rd913; - setp.lt.u64 %p301, %rd3823, 3; - @%p301 bra $L__BB1_416; - - sub.s64 %rd3824, %rd1, %rd4272; - add.s64 %rd4271, %rd3824, 88; - -$L__BB1_415: - st.local.u8 [%rd4272], %rs3804; - st.local.u8 [%rd4272+1], %rs3804; - st.local.u8 [%rd4272+2], %rs3804; - st.local.u8 [%rd4272+3], %rs3804; - add.s64 %rd4271, %rd4271, -4; - setp.ne.s64 %p302, %rd4271, 0; - add.s64 %rd4272, %rd4272, 4; - @%p302 bra $L__BB1_415; - -$L__BB1_416: - or.b64 %rd3825, %rd913, 7; - setp.eq.s64 %p303, %rd3825, 63; - @%p303 bra $L__BB1_438; - bra.uni $L__BB1_417; - -$L__BB1_438: - ld.local.u32 %rd3855, [%rd1+24]; - shl.b64 %rd3856, %rd3855, 8; - mov.b64 {%r7446, %r7447}, %rd3856; - mov.b32 {%rs1111, %rs3960}, %r7447; - mov.b32 {%rs1107, %rs1109}, %r7446; - shr.u16 %rs1110, %rs1109, 8; - shr.u16 %rs1108, %rs1107, 8; - mov.pred %p321, 0; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3857, [%rd1+28]; - shl.b64 %rd3858, %rd3857, 8; - mov.b64 {%r7448, %r7449}, %rd3858; - mov.b32 {%rs1116, %rs3961}, %r7449; - mov.b32 {%rs1112, %rs1114}, %r7448; - shr.u16 %rs1115, %rs1114, 8; - shr.u16 %rs1113, %rs1112, 8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3859, [%rd1+32]; - shl.b64 %rd3860, %rd3859, 8; - mov.b64 {%r7450, %r7451}, %rd3860; - mov.b32 {%rs1121, %rs3962}, %r7451; - mov.b32 {%rs1117, %rs1119}, %r7450; - shr.u16 %rs1120, %rs1119, 8; - shr.u16 %rs1118, %rs1117, 8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3861, [%rd1+36]; - shl.b64 %rd3862, %rd3861, 8; - mov.b64 {%r7452, %r7453}, %rd3862; - mov.b32 {%rs1126, %rs3963}, %r7453; - mov.b32 {%rs1122, %rs1124}, %r7452; - shr.u16 %rs1125, %rs1124, 8; - shr.u16 %rs1123, %rs1122, 
8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3863, [%rd1+40]; - shl.b64 %rd3864, %rd3863, 8; - mov.b64 {%r7454, %r7455}, %rd3864; - mov.b32 {%rs1131, %rs3964}, %r7455; - mov.b32 {%rs1127, %rs1129}, %r7454; - shr.u16 %rs1130, %rs1129, 8; - shr.u16 %rs1128, %rs1127, 8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3865, [%rd1+44]; - shl.b64 %rd3866, %rd3865, 8; - mov.b64 {%r7456, %r7457}, %rd3866; - mov.b32 {%rs1136, %rs3965}, %r7457; - mov.b32 {%rs1132, %rs1134}, %r7456; - shr.u16 %rs1135, %rs1134, 8; - shr.u16 %rs1133, %rs1132, 8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3867, [%rd1+48]; - shl.b64 %rd3868, %rd3867, 8; - mov.b64 {%r7458, %r7459}, %rd3868; - mov.b32 {%rs1141, %rs3966}, %r7459; - mov.b32 {%rs1137, %rs1139}, %r7458; - shr.u16 %rs1140, %rs1139, 8; - shr.u16 %rs1138, %rs1137, 8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3869, [%rd1+52]; - shl.b64 %rd3870, %rd3869, 8; - mov.b64 {%r7460, %r7461}, %rd3870; - mov.b32 {%rs1146, %rs3967}, %r7461; - mov.b32 {%rs1142, %rs1144}, %r7460; - shr.u16 %rs1145, %rs1144, 8; - shr.u16 %rs1143, %rs1142, 8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3871, [%rd1+56]; - shl.b64 %rd3872, %rd3871, 8; - mov.b64 {%r7462, %r7463}, %rd3872; - mov.b32 {%rs1151, %rs3968}, %r7463; - mov.b32 {%rs1147, %rs1149}, %r7462; - shr.u16 %rs1150, %rs1149, 8; - shr.u16 %rs1148, %rs1147, 8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3873, [%rd1+60]; - shl.b64 %rd3874, %rd3873, 8; - mov.b64 {%r7464, %r7465}, %rd3874; - mov.b32 {%rs1156, %rs3969}, %r7465; - mov.b32 {%rs1152, %rs1154}, %r7464; - shr.u16 %rs1155, %rs1154, 8; - shr.u16 %rs1153, %rs1152, 8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3875, [%rd1+64]; - shl.b64 %rd3876, %rd3875, 8; - mov.b64 {%r7466, %r7467}, %rd3876; - mov.b32 {%rs1161, %rs3970}, %r7467; - mov.b32 {%rs1157, %rs1159}, %r7466; - shr.u16 %rs1160, %rs1159, 8; - shr.u16 %rs1158, %rs1157, 8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3877, [%rd1+68]; - shl.b64 %rd3878, %rd3877, 8; - mov.b64 {%r7468, 
%r7469}, %rd3878; - mov.b32 {%rs1166, %rs3971}, %r7469; - mov.b32 {%rs1162, %rs1164}, %r7468; - shr.u16 %rs1165, %rs1164, 8; - shr.u16 %rs1163, %rs1162, 8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3879, [%rd1+72]; - shl.b64 %rd3880, %rd3879, 8; - mov.b64 {%r7470, %r7471}, %rd3880; - mov.b32 {%rs1171, %rs3972}, %r7471; - mov.b32 {%rs1167, %rs1169}, %r7470; - shr.u16 %rs1170, %rs1169, 8; - shr.u16 %rs1168, %rs1167, 8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3881, [%rd1+76]; - shl.b64 %rd3882, %rd3881, 8; - mov.b64 {%r7472, %r7473}, %rd3882; - mov.b32 {%rs1176, %rs3973}, %r7473; - mov.b32 {%rs1172, %rs1174}, %r7472; - shr.u16 %rs1175, %rs1174, 8; - shr.u16 %rs1173, %rs1172, 8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3883, [%rd1+80]; - shl.b64 %rd3884, %rd3883, 8; - mov.b64 {%r7474, %r7475}, %rd3884; - mov.b32 {%rs1181, %rs3974}, %r7475; - mov.b32 {%rs1177, %rs1179}, %r7474; - shr.u16 %rs1180, %rs1179, 8; - shr.u16 %rs1178, %rs1177, 8; - @%p321 bra $L__BB1_454; - - ld.local.u32 %rd3885, [%rd1+84]; - shl.b64 %rd3886, %rd3885, 8; - mov.b64 {%r7476, %r7477}, %rd3886; - mov.b32 {%rs1186, %rs3975}, %r7477; - mov.b32 {%rs1182, %rs1184}, %r7476; - shr.u16 %rs1185, %rs1184, 8; - shr.u16 %rs1183, %rs1182, 8; - mov.pred %p336, -1; - @%p336 bra $L__BB1_455; - bra.uni $L__BB1_454; - -$L__BB1_455: - shl.b16 %rs3976, %rs1184, 8; - or.b16 %rs3977, %rs1183, %rs3976; - shl.b16 %rs3978, %rs1186, 8; - or.b16 %rs3979, %rs1185, %rs3978; - mov.b32 %r105, {%rs3977, %rs3979}; - shl.b16 %rs3980, %rs1179, 8; - or.b16 %rs3981, %rs1178, %rs3980; - shl.b16 %rs3982, %rs1181, 8; - or.b16 %rs3983, %rs1180, %rs3982; - mov.b32 %r106, {%rs3981, %rs3983}; - shl.b16 %rs3984, %rs1174, 8; - or.b16 %rs3985, %rs1173, %rs3984; - shl.b16 %rs3986, %rs1176, 8; - or.b16 %rs3987, %rs1175, %rs3986; - mov.b32 %r107, {%rs3985, %rs3987}; - shl.b16 %rs3988, %rs1169, 8; - or.b16 %rs3989, %rs1168, %rs3988; - shl.b16 %rs3990, %rs1171, 8; - or.b16 %rs3991, %rs1170, %rs3990; - mov.b32 %r108, {%rs3989, 
%rs3991}; - shl.b16 %rs3992, %rs1164, 8; - or.b16 %rs3993, %rs1163, %rs3992; - shl.b16 %rs3994, %rs1166, 8; - or.b16 %rs3995, %rs1165, %rs3994; - mov.b32 %r109, {%rs3993, %rs3995}; - shl.b16 %rs3996, %rs1159, 8; - or.b16 %rs3997, %rs1158, %rs3996; - shl.b16 %rs3998, %rs1161, 8; - or.b16 %rs3999, %rs1160, %rs3998; - mov.b32 %r110, {%rs3997, %rs3999}; - shl.b16 %rs4000, %rs1154, 8; - or.b16 %rs4001, %rs1153, %rs4000; - shl.b16 %rs4002, %rs1156, 8; - or.b16 %rs4003, %rs1155, %rs4002; - mov.b32 %r111, {%rs4001, %rs4003}; - shl.b16 %rs4004, %rs1149, 8; - or.b16 %rs4005, %rs1148, %rs4004; - shl.b16 %rs4006, %rs1151, 8; - or.b16 %rs4007, %rs1150, %rs4006; - mov.b32 %r112, {%rs4005, %rs4007}; - shl.b16 %rs4008, %rs1144, 8; - or.b16 %rs4009, %rs1143, %rs4008; - shl.b16 %rs4010, %rs1146, 8; - or.b16 %rs4011, %rs1145, %rs4010; - mov.b32 %r113, {%rs4009, %rs4011}; - shl.b16 %rs4012, %rs1139, 8; - or.b16 %rs4013, %rs1138, %rs4012; - shl.b16 %rs4014, %rs1141, 8; - or.b16 %rs4015, %rs1140, %rs4014; - mov.b32 %r114, {%rs4013, %rs4015}; - shl.b16 %rs4016, %rs1134, 8; - or.b16 %rs4017, %rs1133, %rs4016; - shl.b16 %rs4018, %rs1136, 8; - or.b16 %rs4019, %rs1135, %rs4018; - mov.b32 %r115, {%rs4017, %rs4019}; - shl.b16 %rs4020, %rs1129, 8; - or.b16 %rs4021, %rs1128, %rs4020; - shl.b16 %rs4022, %rs1131, 8; - or.b16 %rs4023, %rs1130, %rs4022; - mov.b32 %r116, {%rs4021, %rs4023}; - shl.b16 %rs4024, %rs1124, 8; - or.b16 %rs4025, %rs1123, %rs4024; - shl.b16 %rs4026, %rs1126, 8; - or.b16 %rs4027, %rs1125, %rs4026; - mov.b32 %r117, {%rs4025, %rs4027}; - shl.b16 %rs4028, %rs1119, 8; - or.b16 %rs4029, %rs1118, %rs4028; - shl.b16 %rs4030, %rs1121, 8; - or.b16 %rs4031, %rs1120, %rs4030; - mov.b32 %r118, {%rs4029, %rs4031}; - shl.b16 %rs4032, %rs1114, 8; - or.b16 %rs4033, %rs1113, %rs4032; - shl.b16 %rs4034, %rs1116, 8; - or.b16 %rs4035, %rs1115, %rs4034; - mov.b32 %r119, {%rs4033, %rs4035}; - shl.b16 %rs4036, %rs1109, 8; - or.b16 %rs4037, %rs1108, %rs4036; - shl.b16 %rs4038, %rs1111, 8; - or.b16 
%rs4039, %rs1110, %rs4038; - mov.b32 %r120, {%rs4037, %rs4039}; - mov.u32 %r9134, -1043882854; - mov.u32 %r9133, -271733879; - mov.u32 %r9132, -1732584194; - mov.u32 %r9130, 271733878; - mov.u32 %r9131, %r9130; - @%p321 bra $L__BB1_457; - - add.s32 %r7483, %r120, -1; - shf.l.wrap.b32 %r7484, %r7483, %r7483, 3; - not.b32 %r7485, %r7484; - and.b32 %r7486, %r7484, -271733879; - and.b32 %r7487, %r7485, -1732584194; - or.b32 %r7488, %r7487, %r7486; - add.s32 %r7489, %r7488, %r119; - add.s32 %r7490, %r7489, 271733878; - shf.l.wrap.b32 %r7491, %r7490, %r7490, 7; - not.b32 %r7492, %r7491; - and.b32 %r7493, %r7491, %r7484; - and.b32 %r7494, %r7492, -271733879; - or.b32 %r7495, %r7494, %r7493; - add.s32 %r7496, %r7495, %r118; - add.s32 %r7497, %r7496, -1732584194; - shf.l.wrap.b32 %r7498, %r7497, %r7497, 11; - and.b32 %r7499, %r7498, %r7491; - not.b32 %r7500, %r7498; - and.b32 %r7501, %r7484, %r7500; - or.b32 %r7502, %r7501, %r7499; - add.s32 %r7503, %r7502, %r117; - add.s32 %r7504, %r7503, -271733879; - shf.l.wrap.b32 %r7505, %r7504, %r7504, 19; - and.b32 %r7506, %r7498, %r7505; - not.b32 %r7507, %r7505; - and.b32 %r7508, %r7491, %r7507; - or.b32 %r7509, %r7508, %r7506; - add.s32 %r7510, %r7509, %r7484; - add.s32 %r7511, %r7510, %r116; - shf.l.wrap.b32 %r7512, %r7511, %r7511, 3; - and.b32 %r7513, %r7512, %r7505; - not.b32 %r7514, %r7512; - and.b32 %r7515, %r7498, %r7514; - or.b32 %r7516, %r7515, %r7513; - add.s32 %r7517, %r7516, %r7491; - add.s32 %r7518, %r7517, %r115; - shf.l.wrap.b32 %r7519, %r7518, %r7518, 7; - and.b32 %r7520, %r7519, %r7512; - not.b32 %r7521, %r7519; - and.b32 %r7522, %r7505, %r7521; - or.b32 %r7523, %r7522, %r7520; - add.s32 %r7524, %r7523, %r7498; - add.s32 %r7525, %r7524, %r114; - shf.l.wrap.b32 %r7526, %r7525, %r7525, 11; - and.b32 %r7527, %r7526, %r7519; - not.b32 %r7528, %r7526; - and.b32 %r7529, %r7512, %r7528; - or.b32 %r7530, %r7529, %r7527; - add.s32 %r7531, %r7530, %r7505; - add.s32 %r7532, %r7531, %r113; - shf.l.wrap.b32 %r7533, %r7532, 
%r7532, 19; - and.b32 %r7534, %r7526, %r7533; - not.b32 %r7535, %r7533; - and.b32 %r7536, %r7519, %r7535; - or.b32 %r7537, %r7536, %r7534; - add.s32 %r7538, %r7537, %r7512; - add.s32 %r7539, %r7538, %r112; - shf.l.wrap.b32 %r7540, %r7539, %r7539, 3; - and.b32 %r7541, %r7540, %r7533; - not.b32 %r7542, %r7540; - and.b32 %r7543, %r7526, %r7542; - or.b32 %r7544, %r7543, %r7541; - add.s32 %r7545, %r7544, %r7519; - add.s32 %r7546, %r7545, %r111; - shf.l.wrap.b32 %r7547, %r7546, %r7546, 7; - and.b32 %r7548, %r7547, %r7540; - not.b32 %r7549, %r7547; - and.b32 %r7550, %r7533, %r7549; - or.b32 %r7551, %r7550, %r7548; - add.s32 %r7552, %r7551, %r7526; - add.s32 %r7553, %r7552, %r110; - shf.l.wrap.b32 %r7554, %r7553, %r7553, 11; - and.b32 %r7555, %r7554, %r7547; - not.b32 %r7556, %r7554; - and.b32 %r7557, %r7540, %r7556; - or.b32 %r7558, %r7557, %r7555; - add.s32 %r7559, %r7558, %r7533; - add.s32 %r7560, %r7559, %r109; - shf.l.wrap.b32 %r7561, %r7560, %r7560, 19; - and.b32 %r7562, %r7554, %r7561; - not.b32 %r7563, %r7561; - and.b32 %r7564, %r7547, %r7563; - or.b32 %r7565, %r7564, %r7562; - add.s32 %r7566, %r7565, %r7540; - add.s32 %r7567, %r7566, %r108; - shf.l.wrap.b32 %r7568, %r7567, %r7567, 3; - and.b32 %r7569, %r7568, %r7561; - not.b32 %r7570, %r7568; - and.b32 %r7571, %r7554, %r7570; - or.b32 %r7572, %r7571, %r7569; - add.s32 %r7573, %r7572, %r7547; - add.s32 %r7574, %r7573, %r107; - shf.l.wrap.b32 %r9131, %r7574, %r7574, 7; - and.b32 %r7575, %r9131, %r7568; - not.b32 %r7576, %r9131; - and.b32 %r7577, %r7561, %r7576; - or.b32 %r7578, %r7577, %r7575; - add.s32 %r7579, %r7578, %r7554; - add.s32 %r7580, %r7579, %r106; - shf.l.wrap.b32 %r9132, %r7580, %r7580, 11; - and.b32 %r9130, %r9132, %r9131; - not.b32 %r7581, %r9132; - and.b32 %r7582, %r7568, %r7581; - or.b32 %r7583, %r7582, %r9130; - add.s32 %r7584, %r7583, %r7561; - add.s32 %r7585, %r7584, %r105; - shf.l.wrap.b32 %r9133, %r7585, %r7585, 19; - add.s32 %r9134, %r7568, 1518500249; - -$L__BB1_457: - or.b32 %r7586, %r9132, 
%r9131; - and.b32 %r7587, %r7586, %r9133; - or.b32 %r7588, %r7587, %r9130; - add.s32 %r7589, %r9134, %r7588; - add.s32 %r7590, %r7589, %r120; - shf.l.wrap.b32 %r7591, %r7590, %r7590, 3; - or.b32 %r7592, %r9133, %r9132; - and.b32 %r7593, %r7591, %r7592; - and.b32 %r7594, %r9133, %r9132; - or.b32 %r7595, %r7593, %r7594; - add.s32 %r7596, %r9131, %r116; - add.s32 %r7597, %r7596, %r7595; - add.s32 %r7598, %r7597, 1518500249; - shf.l.wrap.b32 %r7599, %r7598, %r7598, 5; - or.b32 %r7600, %r7591, %r9133; - and.b32 %r7601, %r7599, %r7600; - and.b32 %r7602, %r7591, %r9133; - or.b32 %r7603, %r7601, %r7602; - add.s32 %r7604, %r9132, %r112; - add.s32 %r7605, %r7604, %r7603; - add.s32 %r7606, %r7605, 1518500249; - shf.l.wrap.b32 %r7607, %r7606, %r7606, 9; - or.b32 %r7608, %r7599, %r7591; - and.b32 %r7609, %r7607, %r7608; - and.b32 %r7610, %r7599, %r7591; - or.b32 %r7611, %r7609, %r7610; - add.s32 %r7612, %r9133, %r108; - add.s32 %r7613, %r7612, %r7611; - add.s32 %r7614, %r7613, 1518500249; - shf.l.wrap.b32 %r7615, %r7614, %r7614, 13; - or.b32 %r7616, %r7607, %r7599; - and.b32 %r7617, %r7615, %r7616; - and.b32 %r7618, %r7607, %r7599; - or.b32 %r7619, %r7617, %r7618; - add.s32 %r7620, %r7591, %r119; - add.s32 %r7621, %r7620, %r7619; - add.s32 %r7622, %r7621, 1518500249; - shf.l.wrap.b32 %r7623, %r7622, %r7622, 3; - or.b32 %r7624, %r7615, %r7607; - and.b32 %r7625, %r7623, %r7624; - and.b32 %r7626, %r7615, %r7607; - or.b32 %r7627, %r7625, %r7626; - add.s32 %r7628, %r115, %r7599; - add.s32 %r7629, %r7628, %r7627; - add.s32 %r7630, %r7629, 1518500249; - shf.l.wrap.b32 %r7631, %r7630, %r7630, 5; - or.b32 %r7632, %r7623, %r7615; - and.b32 %r7633, %r7631, %r7632; - and.b32 %r7634, %r7623, %r7615; - or.b32 %r7635, %r7633, %r7634; - add.s32 %r7636, %r111, %r7607; - add.s32 %r7637, %r7636, %r7635; - add.s32 %r7638, %r7637, 1518500249; - shf.l.wrap.b32 %r7639, %r7638, %r7638, 9; - or.b32 %r7640, %r7631, %r7623; - and.b32 %r7641, %r7639, %r7640; - and.b32 %r7642, %r7631, %r7623; - or.b32 
%r7643, %r7641, %r7642; - add.s32 %r7644, %r107, %r7615; - add.s32 %r7645, %r7644, %r7643; - add.s32 %r7646, %r7645, 1518500249; - shf.l.wrap.b32 %r7647, %r7646, %r7646, 13; - or.b32 %r7648, %r7639, %r7631; - and.b32 %r7649, %r7647, %r7648; - and.b32 %r7650, %r7639, %r7631; - or.b32 %r7651, %r7649, %r7650; - add.s32 %r7652, %r118, %r7623; - add.s32 %r7653, %r7652, %r7651; - add.s32 %r7654, %r7653, 1518500249; - shf.l.wrap.b32 %r7655, %r7654, %r7654, 3; - or.b32 %r7656, %r7647, %r7639; - and.b32 %r7657, %r7655, %r7656; - and.b32 %r7658, %r7647, %r7639; - or.b32 %r7659, %r7657, %r7658; - add.s32 %r7660, %r114, %r7631; - add.s32 %r7661, %r7660, %r7659; - add.s32 %r7662, %r7661, 1518500249; - shf.l.wrap.b32 %r7663, %r7662, %r7662, 5; - or.b32 %r7664, %r7655, %r7647; - and.b32 %r7665, %r7663, %r7664; - and.b32 %r7666, %r7655, %r7647; - or.b32 %r7667, %r7665, %r7666; - add.s32 %r7668, %r110, %r7639; - add.s32 %r7669, %r7668, %r7667; - add.s32 %r7670, %r7669, 1518500249; - shf.l.wrap.b32 %r7671, %r7670, %r7670, 9; - or.b32 %r7672, %r7663, %r7655; - and.b32 %r7673, %r7671, %r7672; - and.b32 %r7674, %r7663, %r7655; - or.b32 %r7675, %r7673, %r7674; - add.s32 %r7676, %r106, %r7647; - add.s32 %r7677, %r7676, %r7675; - add.s32 %r7678, %r7677, 1518500249; - shf.l.wrap.b32 %r7679, %r7678, %r7678, 13; - or.b32 %r7680, %r7671, %r7663; - and.b32 %r7681, %r7679, %r7680; - and.b32 %r7682, %r7671, %r7663; - or.b32 %r7683, %r7681, %r7682; - add.s32 %r7684, %r117, %r7655; - add.s32 %r7685, %r7684, %r7683; - add.s32 %r7686, %r7685, 1518500249; - shf.l.wrap.b32 %r9138, %r7686, %r7686, 3; - or.b32 %r7687, %r7679, %r7671; - and.b32 %r7688, %r9138, %r7687; - and.b32 %r7689, %r7679, %r7671; - or.b32 %r7690, %r7688, %r7689; - add.s32 %r7691, %r113, %r7663; - add.s32 %r7692, %r7691, %r7690; - add.s32 %r7693, %r7692, 1518500249; - shf.l.wrap.b32 %r9135, %r7693, %r7693, 5; - or.b32 %r7694, %r9138, %r7679; - and.b32 %r7695, %r9135, %r7694; - and.b32 %r7696, %r9138, %r7679; - or.b32 %r7697, %r7695, 
%r7696; - add.s32 %r7698, %r109, %r7671; - add.s32 %r7699, %r7698, %r7697; - add.s32 %r7700, %r7699, 1518500249; - shf.l.wrap.b32 %r9136, %r7700, %r7700, 9; - or.b32 %r7701, %r9135, %r9138; - and.b32 %r7702, %r9136, %r7701; - and.b32 %r7703, %r9135, %r9138; - or.b32 %r7704, %r7702, %r7703; - add.s32 %r7705, %r105, %r7679; - add.s32 %r7706, %r7705, %r7704; - add.s32 %r7707, %r7706, 1518500249; - shf.l.wrap.b32 %r9137, %r7707, %r7707, 13; - @%p321 bra $L__BB1_459; - - xor.b32 %r7708, %r9136, %r9137; - xor.b32 %r7709, %r7708, %r9135; - add.s32 %r7710, %r9138, %r7709; - add.s32 %r7711, %r7710, %r120; - add.s32 %r7712, %r7711, 1859775393; - shf.l.wrap.b32 %r7713, %r7712, %r7712, 3; - xor.b32 %r7714, %r7713, %r7708; - add.s32 %r7715, %r9135, %r7714; - add.s32 %r7716, %r7715, %r112; - add.s32 %r7717, %r7716, 1859775393; - shf.l.wrap.b32 %r7718, %r7717, %r7717, 9; - xor.b32 %r7719, %r7713, %r9137; - xor.b32 %r7720, %r7719, %r7718; - add.s32 %r7721, %r9136, %r116; - add.s32 %r7722, %r7721, %r7720; - add.s32 %r7723, %r7722, 1859775393; - shf.l.wrap.b32 %r7724, %r7723, %r7723, 11; - xor.b32 %r7725, %r7718, %r7713; - xor.b32 %r7726, %r7725, %r7724; - add.s32 %r7727, %r9137, %r7726; - add.s32 %r7728, %r7727, %r108; - add.s32 %r7729, %r7728, 1859775393; - shf.l.wrap.b32 %r7730, %r7729, %r7729, 15; - xor.b32 %r7731, %r7724, %r7730; - xor.b32 %r7732, %r7731, %r7718; - add.s32 %r7733, %r7713, %r7732; - add.s32 %r7734, %r7733, %r118; - add.s32 %r7735, %r7734, 1859775393; - shf.l.wrap.b32 %r7736, %r7735, %r7735, 3; - xor.b32 %r7737, %r7736, %r7731; - add.s32 %r7738, %r7718, %r7737; - add.s32 %r7739, %r7738, %r110; - add.s32 %r7740, %r7739, 1859775393; - shf.l.wrap.b32 %r7741, %r7740, %r7740, 9; - xor.b32 %r7742, %r7736, %r7730; - xor.b32 %r7743, %r7742, %r7741; - add.s32 %r7744, %r7724, %r114; - add.s32 %r7745, %r7744, %r7743; - add.s32 %r7746, %r7745, 1859775393; - shf.l.wrap.b32 %r7747, %r7746, %r7746, 11; - xor.b32 %r7748, %r7741, %r7736; - xor.b32 %r7749, %r7748, %r7747; - 
add.s32 %r7750, %r7730, %r7749; - add.s32 %r7751, %r7750, %r106; - add.s32 %r7752, %r7751, 1859775393; - shf.l.wrap.b32 %r7753, %r7752, %r7752, 15; - xor.b32 %r7754, %r7747, %r7753; - xor.b32 %r7755, %r7754, %r7741; - add.s32 %r7756, %r7736, %r7755; - add.s32 %r7757, %r7756, %r119; - add.s32 %r7758, %r7757, 1859775393; - shf.l.wrap.b32 %r7759, %r7758, %r7758, 3; - xor.b32 %r7760, %r7759, %r7754; - add.s32 %r7761, %r7741, %r7760; - add.s32 %r7762, %r7761, %r111; - add.s32 %r7763, %r7762, 1859775393; - shf.l.wrap.b32 %r7764, %r7763, %r7763, 9; - xor.b32 %r7765, %r7759, %r7753; - xor.b32 %r7766, %r7765, %r7764; - add.s32 %r7767, %r7747, %r115; - add.s32 %r7768, %r7767, %r7766; - add.s32 %r7769, %r7768, 1859775393; - shf.l.wrap.b32 %r7770, %r7769, %r7769, 11; - xor.b32 %r7771, %r7764, %r7759; - xor.b32 %r7772, %r7771, %r7770; - add.s32 %r7773, %r7753, %r7772; - add.s32 %r7774, %r7773, %r107; - add.s32 %r7775, %r7774, 1859775393; - shf.l.wrap.b32 %r7776, %r7775, %r7775, 15; - xor.b32 %r7777, %r7770, %r7776; - xor.b32 %r7778, %r7777, %r7764; - add.s32 %r7779, %r7759, %r7778; - add.s32 %r7780, %r7779, %r117; - add.s32 %r7781, %r7780, 1859775393; - shf.l.wrap.b32 %r9138, %r7781, %r7781, 3; - xor.b32 %r7782, %r9138, %r7777; - add.s32 %r7783, %r7764, %r7782; - add.s32 %r7784, %r7783, %r109; - add.s32 %r7785, %r7784, 1859775393; - shf.l.wrap.b32 %r9135, %r7785, %r7785, 9; - xor.b32 %r7786, %r9138, %r7776; - xor.b32 %r7787, %r7786, %r9135; - add.s32 %r7788, %r7770, %r113; - add.s32 %r7789, %r7788, %r7787; - add.s32 %r7790, %r7789, 1859775393; - shf.l.wrap.b32 %r9136, %r7790, %r7790, 11; - xor.b32 %r7791, %r9135, %r9138; - xor.b32 %r7792, %r7791, %r9136; - add.s32 %r7793, %r7776, %r7792; - add.s32 %r7794, %r7793, %r105; - add.s32 %r7795, %r7794, 1859775393; - shf.l.wrap.b32 %r9137, %r7795, %r7795, 15; - -$L__BB1_459: - add.s32 %r143, %r9138, 1732584193; - add.s32 %r144, %r9137, -271733879; - add.s32 %r145, %r9136, -1732584194; - add.s32 %r146, %r9135, 271733878; - mov.b64 
{%r147, %r148}, %rd914; - cvt.u64.u32 %rd3887, %r147; - shl.b64 %rd3888, %rd3887, 8; - mov.b64 {%r7796, %r7797}, %rd3888; - mov.b32 {%rs1191, %rs4040}, %r7797; - mov.b32 {%rs1187, %rs1189}, %r7796; - shr.u16 %rs1190, %rs1189, 8; - shr.u16 %rs1188, %rs1187, 8; - @%p321 bra $L__BB1_461; - - cvt.u64.u32 %rd3889, %r148; - shl.b64 %rd3890, %rd3889, 8; - mov.b64 {%r7798, %r7799}, %rd3890; - mov.b32 {%rs1196, %rs4041}, %r7799; - mov.b32 {%rs1192, %rs1194}, %r7798; - shr.u16 %rs1195, %rs1194, 8; - shr.u16 %rs1193, %rs1192, 8; - @%p336 bra $L__BB1_462; - bra.uni $L__BB1_461; - -$L__BB1_462: - shl.b16 %rs4042, %rs1194, 8; - or.b16 %rs4043, %rs1193, %rs4042; - shl.b16 %rs4044, %rs1196, 8; - or.b16 %rs4045, %rs1195, %rs4044; - mov.b32 %r149, {%rs4043, %rs4045}; - shl.b16 %rs4046, %rs1189, 8; - or.b16 %rs4047, %rs1188, %rs4046; - shl.b16 %rs4048, %rs1191, 8; - or.b16 %rs4049, %rs1190, %rs4048; - mov.b32 %r150, {%rs4047, %rs4049}; - @%p321 bra $L__BB1_464; - bra.uni $L__BB1_463; - -$L__BB1_464: - and.b32 %r9139, %r146, %r145; - mov.u32 %r9140, %r146; - mov.u32 %r9141, %r145; - mov.u32 %r9142, %r144; - mov.u32 %r9143, %r143; - bra.uni $L__BB1_465; - -$L__BB1_228: - setp.gt.u16 %p154, %rs1, 10; - add.u64 %rd2231, %SP, 352; - add.u64 %rd723, %SPL, 352; - mov.u16 %rs2770, 0; - st.local.v4.u16 [%rd723], {%rs2770, %rs2770, %rs2770, %rs2770}; - add.s64 %rd2232, %rd2231, 8; - cvta.to.local.u64 %rd724, %rd2232; - st.local.v4.u16 [%rd724], {%rs2770, %rs2770, %rs2770, %rs2770}; - add.s64 %rd2233, %rd2231, 16; - cvta.to.local.u64 %rd725, %rd2233; - st.local.v4.u16 [%rd725], {%rs2770, %rs2770, %rs2770, %rs2770}; - add.s64 %rd2234, %rd2231, 24; - cvta.to.local.u64 %rd726, %rd2234; - st.local.v4.u16 [%rd726], {%rs2770, %rs2770, %rs2770, %rs2770}; - add.s64 %rd2235, %rd2231, 32; - cvta.to.local.u64 %rd727, %rd2235; - st.local.v4.u16 [%rd727], {%rs2770, %rs2770, %rs2770, %rs2770}; - add.s64 %rd2236, %rd2231, 40; - cvta.to.local.u64 %rd728, %rd2236; - st.local.v4.u16 [%rd728], {%rs2770, %rs2770, 
%rs2770, %rs2770}; - add.s64 %rd2237, %rd2231, 48; - cvta.to.local.u64 %rd729, %rd2237; - st.local.v4.u16 [%rd729], {%rs2770, %rs2770, %rs2770, %rs2770}; - add.s64 %rd2238, %rd2231, 56; - cvta.to.local.u64 %rd730, %rd2238; - st.local.v4.u16 [%rd730], {%rs2770, %rs2770, %rs2770, %rs2770}; - add.s64 %rd731, %rd2231, 64; - cvta.to.local.u64 %rd732, %rd731; - st.local.u8 [%rd732], %rs2770; - @%p154 bra $L__BB1_249; - - cvta.to.local.u64 %rd733, %rd978; - shr.u64 %rd734, %rd11, 1; - setp.eq.s64 %p155, %rd734, 0; - @%p155 bra $L__BB1_233; - - mov.u64 %rd4227, 1; - mov.u64 %rd4225, %rd733; - mov.u64 %rd4226, %rd723; - bra.uni $L__BB1_231; - -$L__BB1_232: - ld.local.u16 %rs2, [%rd4225+4]; - add.s64 %rd4227, %rd4227, 1; - add.s64 %rd4226, %rd4226, 2; - add.s64 %rd4225, %rd4225, 2; - -$L__BB1_231: - st.local.u16 [%rd4226], %rs2; - setp.ge.u64 %p156, %rd4227, %rd734; - @%p156 bra $L__BB1_233; - bra.uni $L__BB1_232; - -$L__BB1_233: - and.b64 %rd742, %rd11, 1; - setp.eq.s64 %p157, %rd742, 0; - @%p157 bra $L__BB1_236; - - and.b64 %rd2243, %rd11, 65534; - cvta.to.local.u64 %rd2245, %rd2231; - add.s64 %rd743, %rd2245, %rd2243; - add.s64 %rd2246, %rd733, %rd2243; - add.s64 %rd744, %rd2246, 2; - mov.u64 %rd4228, 0; - -$L__BB1_235: - add.s64 %rd2247, %rd744, %rd4228; - ld.local.u8 %rs2771, [%rd2247]; - add.s64 %rd2248, %rd743, %rd4228; - st.local.u8 [%rd2248], %rs2771; - add.s64 %rd4228, %rd4228, 1; - setp.lt.u64 %p158, %rd4228, %rd742; - @%p158 bra $L__BB1_235; - -$L__BB1_236: - mov.u64 %rd2249, 0; - st.local.u8 [%rd732], %rs1; - ld.local.v4.u16 {%rs2772, %rs2773, %rs2774, %rs2775}, [%rd723]; - ld.local.v4.u16 {%rs2780, %rs2781, %rs2782, %rs2783}, [%rd724]; - ld.local.v4.u16 {%rs2788, %rs2789, %rs2790, %rs2791}, [%rd725]; - ld.local.v4.u16 {%rs2796, %rs2797, %rs2798, %rs2799}, [%rd726]; - ld.local.v4.u16 {%rs2804, %rs2805, %rs2806, %rs2807}, [%rd727]; - ld.local.v4.u16 {%rs2812, %rs2813, %rs2814, %rs2815}, [%rd728]; - ld.local.v4.u16 {%rs2820, %rs2821, %rs2822, %rs2823}, [%rd729]; - 
mov.u32 %r759, 0; - shr.u16 %rs2826, %rs2823, 8; - ld.local.v4.u16 {%rs2827, %rs2828, %rs2829, %rs2830}, [%rd730]; - ld.local.v4.u16 {%rs2835, %rs2836, %rs2837, %rs2838}, [%rd732]; - and.b16 %rs2842, %rs2835, 255; - st.local.u64 [%rd1], %rd2249; - mov.u32 %r760, 914150663; - mov.u32 %r761, -1056596264; - st.local.v2.u32 [%rd1+8], {%r761, %r760}; - mov.u32 %r762, -150054599; - mov.u32 %r763, 812702999; - st.local.v2.u32 [%rd1+16], {%r763, %r762}; - mov.u32 %r764, 1750603025; - mov.u32 %r765, -4191439; - st.local.v2.u32 [%rd1+24], {%r765, %r764}; - mov.u32 %r766, -1090891868; - mov.u32 %r767, 1694076839; - st.local.v2.u32 [%rd1+32], {%r767, %r766}; - st.local.v4.u16 [%rd1+40], {%rs2772, %rs2773, %rs2774, %rs2775}; - st.local.v4.u16 [%rd1+48], {%rs2780, %rs2781, %rs2782, %rs2783}; - st.local.v4.u16 [%rd1+56], {%rs2788, %rs2789, %rs2790, %rs2791}; - st.local.v4.u16 [%rd1+64], {%rs2796, %rs2797, %rs2798, %rs2799}; - st.local.v4.u16 [%rd1+72], {%rs2804, %rs2805, %rs2806, %rs2807}; - st.local.v4.u16 [%rd1+80], {%rs2812, %rs2813, %rs2814, %rs2815}; - st.local.v2.u16 [%rd1+88], {%rs2820, %rs2821}; - st.local.u16 [%rd1+92], %rs2822; - st.local.u8 [%rd1+94], %rs2823; - st.local.u8 [%rd1+95], %rs2826; - st.local.v4.u16 [%rd1+96], {%rs2827, %rs2828, %rs2829, %rs2830}; - st.local.v4.u16 [%rd1+104], {%rs2835, %rs2836, %rs2837, %rs2838}; - cvt.u64.u16 %rd2251, %rs2835; - and.b64 %rd748, %rd2251, 255; - cvt.u32.u16 %r768, %rs2835; - and.b32 %r769, %r768, 255; - mul.wide.u32 %rd2252, %r769, 8; - { - .reg .b32 %temp; - mov.b64 {%r770, %temp}, %rd2252; - } - { - .reg .b32 %temp; - mov.b64 {%temp, %r771}, %rd2252; - } - mov.u32 %r772, 291; - prmt.b32 %r773, %r770, %r759, %r772; - prmt.b32 %r774, %r771, %r759, %r772; - mov.b64 %rd749, {%r774, %r773}; - setp.lt.u16 %p159, %rs2842, 64; - @%p159 bra $L__BB1_238; - bra.uni $L__BB1_237; - -$L__BB1_238: - add.s64 %rd2253, %rd1, %rd748; - mov.u16 %rs2845, 128; - st.local.u8 [%rd2253+40], %rs2845; - add.s64 %rd750, %rd748, 1; - setp.eq.s64 
%p160, %rd750, 64; - @%p160 bra $L__BB1_245; - - add.s64 %rd2254, %rd1, %rd750; - add.s64 %rd4233, %rd2254, 40; - mov.u16 %rs2846, 3; - sub.s16 %rs2847, %rs2846, %rs2835; - and.b16 %rs539, %rs2847, 3; - setp.eq.s16 %p161, %rs539, 0; - @%p161 bra $L__BB1_242; - - cvt.u64.u16 %rd2255, %rs539; - neg.s64 %rd4229, %rd2255; - mov.u64 %rd4230, %rd4233; - -$L__BB1_241: - .pragma "nounroll"; - add.s64 %rd4233, %rd4230, 1; - st.local.u8 [%rd4230], %rs2770; - add.s64 %rd4229, %rd4229, 1; - setp.ne.s64 %p162, %rd4229, 0; - mov.u64 %rd4230, %rd4233; - @%p162 bra $L__BB1_241; - -$L__BB1_242: - mov.u64 %rd2256, 62; - sub.s64 %rd2257, %rd2256, %rd748; - setp.lt.u64 %p163, %rd2257, 3; - @%p163 bra $L__BB1_245; - - sub.s64 %rd2258, %rd1, %rd4233; - add.s64 %rd4232, %rd2258, 104; - -$L__BB1_244: - st.local.u8 [%rd4233], %rs2770; - st.local.u8 [%rd4233+1], %rs2770; - st.local.u8 [%rd4233+2], %rs2770; - st.local.u8 [%rd4233+3], %rs2770; - add.s64 %rd4232, %rd4232, -4; - setp.ne.s64 %p164, %rd4232, 0; - add.s64 %rd4233, %rd4233, 4; - @%p164 bra $L__BB1_244; - -$L__BB1_245: - add.s64 %rd764, %rd968, 40; - or.b64 %rd2260, %rd748, 7; - setp.eq.s64 %p165, %rd2260, 63; - add.s64 %rd765, %rd968, 8; - @%p165 bra $L__BB1_247; - bra.uni $L__BB1_246; - -$L__BB1_247: - mov.u64 %rd2262, 1; - { // callseq 29, 0 - .reg .b32 temp_param_reg; - .param .b64 param0; - st.param.b64 [param0+0], %rd765; - .param .b64 param1; - st.param.b64 [param1+0], %rd764; - .param .b64 param2; - st.param.b64 [param2+0], %rd2262; - call.uni - _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE, - ( - param0, - param1, - param2 - ); - } // callseq 29 - add.u64 %rd2263, %SP, 504; - add.u64 %rd2264, %SPL, 504; - st.local.u8 [%rd2264], %rs2770; - st.local.u8 [%rd2264+1], %rs2770; - st.local.u8 [%rd2264+2], %rs2770; - st.local.u8 [%rd2264+3], %rs2770; - st.local.u8 [%rd2264+4], %rs2770; - st.local.u8 [%rd2264+5], %rs2770; - st.local.u8 [%rd2264+6], %rs2770; - st.local.u8 [%rd2264+7], %rs2770; - st.local.u8 [%rd2264+8], %rs2770; - 
st.local.u8 [%rd2264+9], %rs2770; - st.local.u8 [%rd2264+10], %rs2770; - st.local.u8 [%rd2264+11], %rs2770; - st.local.u8 [%rd2264+12], %rs2770; - st.local.u8 [%rd2264+13], %rs2770; - st.local.u8 [%rd2264+14], %rs2770; - st.local.u8 [%rd2264+15], %rs2770; - st.local.u8 [%rd2264+16], %rs2770; - st.local.u8 [%rd2264+17], %rs2770; - st.local.u8 [%rd2264+18], %rs2770; - st.local.u8 [%rd2264+19], %rs2770; - st.local.u8 [%rd2264+20], %rs2770; - st.local.u8 [%rd2264+21], %rs2770; - st.local.u8 [%rd2264+22], %rs2770; - st.local.u8 [%rd2264+23], %rs2770; - st.local.u8 [%rd2264+24], %rs2770; - st.local.u8 [%rd2264+25], %rs2770; - st.local.u8 [%rd2264+26], %rs2770; - st.local.u8 [%rd2264+27], %rs2770; - st.local.u8 [%rd2264+28], %rs2770; - st.local.u8 [%rd2264+29], %rs2770; - st.local.u8 [%rd2264+30], %rs2770; - st.local.u8 [%rd2264+31], %rs2770; - st.local.u8 [%rd2264+32], %rs2770; - st.local.u8 [%rd2264+33], %rs2770; - st.local.u8 [%rd2264+34], %rs2770; - st.local.u8 [%rd2264+35], %rs2770; - st.local.u8 [%rd2264+36], %rs2770; - st.local.u8 [%rd2264+37], %rs2770; - st.local.u8 [%rd2264+38], %rs2770; - st.local.u8 [%rd2264+39], %rs2770; - st.local.u8 [%rd2264+40], %rs2770; - st.local.u8 [%rd2264+41], %rs2770; - st.local.u8 [%rd2264+42], %rs2770; - st.local.u8 [%rd2264+43], %rs2770; - st.local.u8 [%rd2264+44], %rs2770; - st.local.u8 [%rd2264+45], %rs2770; - st.local.u8 [%rd2264+46], %rs2770; - st.local.u8 [%rd2264+47], %rs2770; - st.local.u8 [%rd2264+48], %rs2770; - st.local.u8 [%rd2264+49], %rs2770; - st.local.u8 [%rd2264+50], %rs2770; - st.local.u8 [%rd2264+51], %rs2770; - st.local.u8 [%rd2264+52], %rs2770; - st.local.u8 [%rd2264+53], %rs2770; - st.local.u8 [%rd2264+54], %rs2770; - st.local.u8 [%rd2264+55], %rs2770; - shr.u64 %rd2265, %rd749, 56; - st.local.u8 [%rd2264+63], %rd2265; - shr.u64 %rd2266, %rd749, 48; - st.local.u8 [%rd2264+62], %rd2266; - shr.u64 %rd2267, %rd749, 40; - st.local.u8 [%rd2264+61], %rd2267; - shr.u64 %rd2268, %rd749, 32; - st.local.u8 [%rd2264+60], 
%rd2268; - shr.u64 %rd2269, %rd749, 24; - st.local.u8 [%rd2264+59], %rd2269; - shr.u64 %rd2270, %rd749, 16; - st.local.u8 [%rd2264+58], %rd2270; - shr.u64 %rd2271, %rd749, 8; - st.local.u8 [%rd2264+57], %rd2271; - st.local.u8 [%rd2264+56], %rd749; - { // callseq 30, 0 - .reg .b32 temp_param_reg; - .param .b64 param0; - st.param.b64 [param0+0], %rd765; - .param .b64 param1; - st.param.b64 [param1+0], %rd2263; - .param .b64 param2; - st.param.b64 [param2+0], %rd2262; - call.uni - _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE, - ( - param0, - param1, - param2 - ); - } // callseq 30 - bra.uni $L__BB1_248; - -$L__BB1_250: - setp.gt.u16 %p166, %rs1, 10; - add.u64 %rd2272, %SP, 352; - add.u64 %rd766, %SPL, 352; - mov.u16 %rs2909, 0; - st.local.v4.u16 [%rd766], {%rs2909, %rs2909, %rs2909, %rs2909}; - add.s64 %rd2273, %rd2272, 8; - cvta.to.local.u64 %rd767, %rd2273; - st.local.v4.u16 [%rd767], {%rs2909, %rs2909, %rs2909, %rs2909}; - add.s64 %rd2274, %rd2272, 16; - cvta.to.local.u64 %rd768, %rd2274; - st.local.v4.u16 [%rd768], {%rs2909, %rs2909, %rs2909, %rs2909}; - add.s64 %rd2275, %rd2272, 24; - cvta.to.local.u64 %rd769, %rd2275; - st.local.v4.u16 [%rd769], {%rs2909, %rs2909, %rs2909, %rs2909}; - add.s64 %rd2276, %rd2272, 32; - cvta.to.local.u64 %rd770, %rd2276; - st.local.v4.u16 [%rd770], {%rs2909, %rs2909, %rs2909, %rs2909}; - add.s64 %rd2277, %rd2272, 40; - cvta.to.local.u64 %rd771, %rd2277; - st.local.v4.u16 [%rd771], {%rs2909, %rs2909, %rs2909, %rs2909}; - add.s64 %rd2278, %rd2272, 48; - cvta.to.local.u64 %rd772, %rd2278; - st.local.v4.u16 [%rd772], {%rs2909, %rs2909, %rs2909, %rs2909}; - add.s64 %rd2279, %rd2272, 56; - cvta.to.local.u64 %rd773, %rd2279; - st.local.v4.u16 [%rd773], {%rs2909, %rs2909, %rs2909, %rs2909}; - add.s64 %rd774, %rd2272, 64; - cvta.to.local.u64 %rd775, %rd774; - st.local.u8 [%rd775], %rs2909; - @%p166 bra $L__BB1_326; - - cvta.to.local.u64 %rd776, %rd978; - shr.u64 %rd777, %rd11, 1; - setp.eq.s64 %p167, %rd777, 0; - @%p167 bra $L__BB1_255; 
- - mov.u64 %rd4236, 1; - mov.u64 %rd4234, %rd776; - mov.u64 %rd4235, %rd766; - bra.uni $L__BB1_253; - -$L__BB1_254: - ld.local.u16 %rs2, [%rd4234+4]; - add.s64 %rd4236, %rd4236, 1; - add.s64 %rd4235, %rd4235, 2; - add.s64 %rd4234, %rd4234, 2; - -$L__BB1_253: - st.local.u16 [%rd4235], %rs2; - setp.ge.u64 %p168, %rd4236, %rd777; - @%p168 bra $L__BB1_255; - bra.uni $L__BB1_254; - -$L__BB1_255: - and.b64 %rd785, %rd11, 1; - setp.eq.s64 %p169, %rd785, 0; - @%p169 bra $L__BB1_258; - - and.b64 %rd2284, %rd11, 65534; - cvta.to.local.u64 %rd2286, %rd2272; - add.s64 %rd786, %rd2286, %rd2284; - add.s64 %rd2287, %rd776, %rd2284; - add.s64 %rd787, %rd2287, 2; - mov.u64 %rd4237, 0; - -$L__BB1_257: - add.s64 %rd2288, %rd787, %rd4237; - ld.local.u8 %rs2910, [%rd2288]; - add.s64 %rd2289, %rd786, %rd4237; - st.local.u8 [%rd2289], %rs2910; - add.s64 %rd4237, %rd4237, 1; - setp.lt.u64 %p170, %rd4237, %rd785; - @%p170 bra $L__BB1_257; - -$L__BB1_258: - mov.u64 %rd2290, 0; - st.local.u8 [%rd775], %rs1; - ld.local.v4.u16 {%rs2911, %rs2912, %rs2913, %rs2914}, [%rd766]; - ld.local.v4.u16 {%rs2919, %rs2920, %rs2921, %rs2922}, [%rd767]; - ld.local.v4.u16 {%rs2927, %rs2928, %rs2929, %rs2930}, [%rd768]; - ld.local.v4.u16 {%rs2935, %rs2936, %rs2937, %rs2938}, [%rd769]; - ld.local.v4.u16 {%rs2943, %rs2944, %rs2945, %rs2946}, [%rd770]; - ld.local.v4.u16 {%rs2951, %rs2952, %rs2953, %rs2954}, [%rd771]; - ld.local.v4.u16 {%rs2959, %rs2960, %rs2961, %rs2962}, [%rd772]; - ld.local.v4.u16 {%rs2967, %rs2968, %rs2969, %rs2970}, [%rd773]; - mov.u32 %r859, 0; - ld.local.v4.u16 {%rs2973, %rs2974, %rs2975, %rs2976}, [%rd775]; - and.b16 %rs2977, %rs2973, 255; - st.local.u64 [%rd1], %rd2290; - mov.u32 %r9086, -271733879; - mov.u32 %r9085, 1732584193; - st.local.v2.u32 [%rd1+8], {%r9085, %r9086}; - mov.u32 %r9088, 271733878; - mov.u32 %r9087, -1732584194; - st.local.v2.u32 [%rd1+16], {%r9087, %r9088}; - mov.u32 %r9089, -1009589776; - st.local.u32 [%rd1+24], %r9089; - st.local.v4.u16 [%rd1+32], {%rs2911, 
%rs2912, %rs2913, %rs2914}; - st.local.v4.u16 [%rd1+40], {%rs2919, %rs2920, %rs2921, %rs2922}; - st.local.v4.u16 [%rd1+48], {%rs2927, %rs2928, %rs2929, %rs2930}; - st.local.v4.u16 [%rd1+56], {%rs2935, %rs2936, %rs2937, %rs2938}; - st.local.v4.u16 [%rd1+64], {%rs2943, %rs2944, %rs2945, %rs2946}; - st.local.v4.u16 [%rd1+72], {%rs2951, %rs2952, %rs2953, %rs2954}; - st.local.v4.u16 [%rd1+80], {%rs2959, %rs2960, %rs2961, %rs2962}; - st.local.u16 [%rd1+88], %rs2967; - st.local.u16 [%rd1+90], %rs2968; - st.local.v2.u16 [%rd1+92], {%rs2969, %rs2970}; - st.local.u16 [%rd1+96], %rs2973; - st.local.u16 [%rd1+98], %rs2974; - st.local.u16 [%rd1+100], %rs2975; - st.local.u16 [%rd1+102], %rs2976; - cvt.u64.u16 %rd2292, %rs2973; - and.b64 %rd791, %rd2292, 255; - cvt.u32.u16 %r865, %rs2973; - and.b32 %r866, %r865, 255; - mul.wide.u32 %rd2293, %r866, 8; - { - .reg .b32 %temp; - mov.b64 {%r867, %temp}, %rd2293; - } - { - .reg .b32 %temp; - mov.b64 {%temp, %r868}, %rd2293; - } - mov.u32 %r869, 291; - prmt.b32 %r870, %r867, %r859, %r869; - prmt.b32 %r871, %r868, %r859, %r869; - mov.b64 %rd792, {%r871, %r870}; - setp.lt.u16 %p171, %rs2977, 64; - @%p171 bra $L__BB1_260; - bra.uni $L__BB1_259; - -$L__BB1_260: - add.s64 %rd2294, %rd1, %rd791; - add.s64 %rd793, %rd1, 96; - mov.u16 %rs2983, 128; - st.local.u8 [%rd2294+32], %rs2983; - add.s64 %rd794, %rd791, 1; - setp.eq.s64 %p172, %rd794, 64; - @%p172 bra $L__BB1_267; - - add.s64 %rd2295, %rd1, %rd794; - add.s64 %rd4242, %rd2295, 32; - mov.u16 %rs2984, 3; - sub.s16 %rs2985, %rs2984, %rs2973; - and.b16 %rs543, %rs2985, 3; - setp.eq.s16 %p173, %rs543, 0; - @%p173 bra $L__BB1_264; - - cvt.u64.u16 %rd2296, %rs543; - neg.s64 %rd4238, %rd2296; - mov.u64 %rd4239, %rd4242; - -$L__BB1_263: - .pragma "nounroll"; - add.s64 %rd4242, %rd4239, 1; - st.local.u8 [%rd4239], %rs2909; - add.s64 %rd4238, %rd4238, 1; - setp.ne.s64 %p174, %rd4238, 0; - mov.u64 %rd4239, %rd4242; - @%p174 bra $L__BB1_263; - -$L__BB1_264: - mov.u64 %rd2297, 62; - sub.s64 %rd2298, 
%rd2297, %rd791; - setp.lt.u64 %p175, %rd2298, 3; - @%p175 bra $L__BB1_267; - - sub.s64 %rd4241, %rd793, %rd4242; - -$L__BB1_266: - st.local.u8 [%rd4242], %rs2909; - st.local.u8 [%rd4242+1], %rs2909; - st.local.u8 [%rd4242+2], %rs2909; - st.local.u8 [%rd4242+3], %rs2909; - add.s64 %rd4241, %rd4241, -4; - setp.ne.s64 %p176, %rd4241, 0; - add.s64 %rd4242, %rd4242, 4; - @%p176 bra $L__BB1_266; - -$L__BB1_267: - or.b64 %rd2299, %rd791, 7; - setp.eq.s64 %p177, %rd2299, 63; - add.s64 %rd4243, %rd1, 32; - @%p177 bra $L__BB1_287; - bra.uni $L__BB1_268; - -$L__BB1_287: - mov.u32 %r9089, -1009589776; - mov.u32 %r9088, 271733878; - mov.u32 %r9087, -1732584194; - mov.u32 %r9086, -271733879; - mov.u32 %r9085, 1732584193; - mov.pred %p195, 0; - mov.pred %p210, -1; - mov.u64 %rd4246, %rd4243; - -$L__BB1_288: - ld.local.u32 %rd2690, [%rd4246]; - shl.b64 %rd2691, %rd2690, 8; - mov.b64 {%r2354, %r2355}, %rd2691; - mov.b32 {%rs628, %rs3132}, %r2355; - mov.b32 {%rs624, %rs626}, %r2354; - shr.u16 %rs627, %rs626, 8; - shr.u16 %rs625, %rs624, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2692, [%rd4246+4]; - shl.b64 %rd2693, %rd2692, 8; - mov.b64 {%r2356, %r2357}, %rd2693; - mov.b32 {%rs633, %rs3133}, %r2357; - mov.b32 {%rs629, %rs631}, %r2356; - shr.u16 %rs632, %rs631, 8; - shr.u16 %rs630, %rs629, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2694, [%rd4246+8]; - shl.b64 %rd2695, %rd2694, 8; - mov.b64 {%r2358, %r2359}, %rd2695; - mov.b32 {%rs638, %rs3134}, %r2359; - mov.b32 {%rs634, %rs636}, %r2358; - shr.u16 %rs637, %rs636, 8; - shr.u16 %rs635, %rs634, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2696, [%rd4246+12]; - shl.b64 %rd2697, %rd2696, 8; - mov.b64 {%r2360, %r2361}, %rd2697; - mov.b32 {%rs643, %rs3135}, %r2361; - mov.b32 {%rs639, %rs641}, %r2360; - shr.u16 %rs642, %rs641, 8; - shr.u16 %rs640, %rs639, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2698, [%rd4246+16]; - shl.b64 %rd2699, %rd2698, 8; - mov.b64 {%r2362, %r2363}, %rd2699; - mov.b32 {%rs648, %rs3136}, 
%r2363; - mov.b32 {%rs644, %rs646}, %r2362; - shr.u16 %rs647, %rs646, 8; - shr.u16 %rs645, %rs644, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2700, [%rd4246+20]; - shl.b64 %rd2701, %rd2700, 8; - mov.b64 {%r2364, %r2365}, %rd2701; - mov.b32 {%rs653, %rs3137}, %r2365; - mov.b32 {%rs649, %rs651}, %r2364; - shr.u16 %rs652, %rs651, 8; - shr.u16 %rs650, %rs649, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2702, [%rd4246+24]; - shl.b64 %rd2703, %rd2702, 8; - mov.b64 {%r2366, %r2367}, %rd2703; - mov.b32 {%rs658, %rs3138}, %r2367; - mov.b32 {%rs654, %rs656}, %r2366; - shr.u16 %rs657, %rs656, 8; - shr.u16 %rs655, %rs654, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2704, [%rd4246+28]; - shl.b64 %rd2705, %rd2704, 8; - mov.b64 {%r2368, %r2369}, %rd2705; - mov.b32 {%rs663, %rs3139}, %r2369; - mov.b32 {%rs659, %rs661}, %r2368; - shr.u16 %rs662, %rs661, 8; - shr.u16 %rs660, %rs659, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2706, [%rd4246+32]; - shl.b64 %rd2707, %rd2706, 8; - mov.b64 {%r2370, %r2371}, %rd2707; - mov.b32 {%rs668, %rs3140}, %r2371; - mov.b32 {%rs664, %rs666}, %r2370; - shr.u16 %rs667, %rs666, 8; - shr.u16 %rs665, %rs664, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2708, [%rd4246+36]; - shl.b64 %rd2709, %rd2708, 8; - mov.b64 {%r2372, %r2373}, %rd2709; - mov.b32 {%rs673, %rs3141}, %r2373; - mov.b32 {%rs669, %rs671}, %r2372; - shr.u16 %rs672, %rs671, 8; - shr.u16 %rs670, %rs669, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2710, [%rd4246+40]; - shl.b64 %rd2711, %rd2710, 8; - mov.b64 {%r2374, %r2375}, %rd2711; - mov.b32 {%rs678, %rs3142}, %r2375; - mov.b32 {%rs674, %rs676}, %r2374; - shr.u16 %rs677, %rs676, 8; - shr.u16 %rs675, %rs674, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2712, [%rd4246+44]; - shl.b64 %rd2713, %rd2712, 8; - mov.b64 {%r2376, %r2377}, %rd2713; - mov.b32 {%rs683, %rs3143}, %r2377; - mov.b32 {%rs679, %rs681}, %r2376; - shr.u16 %rs682, %rs681, 8; - shr.u16 %rs680, %rs679, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 
%rd2714, [%rd4246+48]; - shl.b64 %rd2715, %rd2714, 8; - mov.b64 {%r2378, %r2379}, %rd2715; - mov.b32 {%rs688, %rs3144}, %r2379; - mov.b32 {%rs684, %rs686}, %r2378; - shr.u16 %rs687, %rs686, 8; - shr.u16 %rs685, %rs684, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2716, [%rd4246+52]; - shl.b64 %rd2717, %rd2716, 8; - mov.b64 {%r2380, %r2381}, %rd2717; - mov.b32 {%rs693, %rs3145}, %r2381; - mov.b32 {%rs689, %rs691}, %r2380; - shr.u16 %rs692, %rs691, 8; - shr.u16 %rs690, %rs689, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2718, [%rd4246+56]; - shl.b64 %rd2719, %rd2718, 8; - mov.b64 {%r2382, %r2383}, %rd2719; - mov.b32 {%rs698, %rs3146}, %r2383; - mov.b32 {%rs694, %rs696}, %r2382; - shr.u16 %rs697, %rs696, 8; - shr.u16 %rs695, %rs694, 8; - @%p195 bra $L__BB1_304; - - ld.local.u32 %rd2720, [%rd4246+60]; - shl.b64 %rd2721, %rd2720, 8; - mov.b64 {%r2384, %r2385}, %rd2721; - mov.b32 {%rs703, %rs3147}, %r2385; - mov.b32 {%rs699, %rs701}, %r2384; - shr.u16 %rs702, %rs701, 8; - shr.u16 %rs700, %rs699, 8; - @%p210 bra $L__BB1_305; - bra.uni $L__BB1_304; - -$L__BB1_305: - add.s64 %rd4243, %rd4243, 64; - shl.b16 %rs3148, %rs626, 8; - or.b16 %rs3149, %rs625, %rs3148; - shl.b16 %rs3150, %rs628, 8; - or.b16 %rs3151, %rs627, %rs3150; - mov.b32 %r2386, {%rs3149, %rs3151}; - shr.u32 %r2387, %r2386, 24; - shr.u32 %r2388, %r2386, 8; - and.b32 %r2389, %r2388, 65280; - or.b32 %r2390, %r2389, %r2387; - shl.b32 %r2391, %r2386, 24; - shl.b32 %r2392, %r2386, 8; - and.b32 %r2393, %r2392, 16711680; - or.b32 %r2394, %r2391, %r2393; - or.b32 %r2395, %r2394, %r2390; - shl.b16 %rs3152, %rs631, 8; - or.b16 %rs3153, %rs630, %rs3152; - shl.b16 %rs3154, %rs633, 8; - or.b16 %rs3155, %rs632, %rs3154; - mov.b32 %r2396, {%rs3153, %rs3155}; - shr.u32 %r2397, %r2396, 24; - shr.u32 %r2398, %r2396, 8; - and.b32 %r2399, %r2398, 65280; - or.b32 %r2400, %r2399, %r2397; - shl.b32 %r2401, %r2396, 24; - shl.b32 %r2402, %r2396, 8; - and.b32 %r2403, %r2402, 16711680; - or.b32 %r2404, %r2401, %r2403; - or.b32 
%r2405, %r2404, %r2400; - shl.b16 %rs3156, %rs636, 8; - or.b16 %rs3157, %rs635, %rs3156; - shl.b16 %rs3158, %rs638, 8; - or.b16 %rs3159, %rs637, %rs3158; - mov.b32 %r2406, {%rs3157, %rs3159}; - shr.u32 %r2407, %r2406, 24; - shr.u32 %r2408, %r2406, 8; - and.b32 %r2409, %r2408, 65280; - or.b32 %r2410, %r2409, %r2407; - shl.b32 %r2411, %r2406, 24; - shl.b32 %r2412, %r2406, 8; - and.b32 %r2413, %r2412, 16711680; - or.b32 %r2414, %r2411, %r2413; - or.b32 %r2415, %r2414, %r2410; - xor.b16 %rs3160, %rs635, %rs625; - xor.b16 %rs3161, %rs636, %rs626; - shl.b16 %rs3162, %rs3161, 8; - or.b16 %rs3163, %rs3160, %rs3162; - xor.b16 %rs3164, %rs637, %rs627; - xor.b16 %rs3165, %rs638, %rs628; - shl.b16 %rs3166, %rs3165, 8; - or.b16 %rs3167, %rs3164, %rs3166; - mov.b32 %r2416, {%rs3163, %rs3167}; - shl.b16 %rs3168, %rs641, 8; - or.b16 %rs3169, %rs640, %rs3168; - shl.b16 %rs3170, %rs643, 8; - or.b16 %rs3171, %rs642, %rs3170; - mov.b32 %r2417, {%rs3169, %rs3171}; - shr.u32 %r2418, %r2417, 24; - shr.u32 %r2419, %r2417, 8; - and.b32 %r2420, %r2419, 65280; - or.b32 %r2421, %r2420, %r2418; - shl.b32 %r2422, %r2417, 24; - shl.b32 %r2423, %r2417, 8; - and.b32 %r2424, %r2423, 16711680; - or.b32 %r2425, %r2422, %r2424; - or.b32 %r2426, %r2425, %r2421; - xor.b16 %rs3172, %rs640, %rs630; - xor.b16 %rs3173, %rs641, %rs631; - shl.b16 %rs3174, %rs3173, 8; - or.b16 %rs3175, %rs3172, %rs3174; - xor.b16 %rs3176, %rs642, %rs632; - xor.b16 %rs3177, %rs643, %rs633; - shl.b16 %rs3178, %rs3177, 8; - or.b16 %rs3179, %rs3176, %rs3178; - mov.b32 %r2427, {%rs3175, %rs3179}; - shl.b16 %rs3180, %rs646, 8; - or.b16 %rs3181, %rs645, %rs3180; - shl.b16 %rs3182, %rs648, 8; - or.b16 %rs3183, %rs647, %rs3182; - mov.b32 %r2428, {%rs3181, %rs3183}; - shr.u32 %r2429, %r2428, 24; - shr.u32 %r2430, %r2428, 8; - and.b32 %r2431, %r2430, 65280; - or.b32 %r2432, %r2431, %r2429; - shl.b32 %r2433, %r2428, 24; - shl.b32 %r2434, %r2428, 8; - and.b32 %r2435, %r2434, 16711680; - or.b32 %r2436, %r2433, %r2435; - or.b32 %r2437, 
%r2436, %r2432; - xor.b16 %rs3184, %rs645, %rs635; - xor.b16 %rs3185, %rs646, %rs636; - shl.b16 %rs3186, %rs3185, 8; - or.b16 %rs3187, %rs3184, %rs3186; - xor.b16 %rs3188, %rs647, %rs637; - xor.b16 %rs3189, %rs648, %rs638; - shl.b16 %rs3190, %rs3189, 8; - or.b16 %rs3191, %rs3188, %rs3190; - mov.b32 %r2438, {%rs3187, %rs3191}; - shl.b16 %rs3192, %rs651, 8; - or.b16 %rs3193, %rs650, %rs3192; - shl.b16 %rs3194, %rs653, 8; - or.b16 %rs3195, %rs652, %rs3194; - mov.b32 %r2439, {%rs3193, %rs3195}; - shr.u32 %r2440, %r2439, 24; - shr.u32 %r2441, %r2439, 8; - and.b32 %r2442, %r2441, 65280; - or.b32 %r2443, %r2442, %r2440; - shl.b32 %r2444, %r2439, 24; - shl.b32 %r2445, %r2439, 8; - and.b32 %r2446, %r2445, 16711680; - or.b32 %r2447, %r2444, %r2446; - or.b32 %r2448, %r2447, %r2443; - xor.b16 %rs3196, %rs650, %rs640; - xor.b16 %rs3197, %rs651, %rs641; - shl.b16 %rs3198, %rs3197, 8; - or.b16 %rs3199, %rs3196, %rs3198; - xor.b16 %rs3200, %rs652, %rs642; - xor.b16 %rs3201, %rs653, %rs643; - shl.b16 %rs3202, %rs3201, 8; - or.b16 %rs3203, %rs3200, %rs3202; - mov.b32 %r2449, {%rs3199, %rs3203}; - shl.b16 %rs3204, %rs656, 8; - or.b16 %rs3205, %rs655, %rs3204; - shl.b16 %rs3206, %rs658, 8; - or.b16 %rs3207, %rs657, %rs3206; - mov.b32 %r2450, {%rs3205, %rs3207}; - shr.u32 %r2451, %r2450, 24; - shr.u32 %r2452, %r2450, 8; - and.b32 %r2453, %r2452, 65280; - or.b32 %r2454, %r2453, %r2451; - shl.b32 %r2455, %r2450, 24; - shl.b32 %r2456, %r2450, 8; - and.b32 %r2457, %r2456, 16711680; - or.b32 %r2458, %r2455, %r2457; - or.b32 %r2459, %r2458, %r2454; - xor.b16 %rs3208, %rs655, %rs645; - xor.b16 %rs3209, %rs656, %rs646; - shl.b16 %rs3210, %rs3209, 8; - or.b16 %rs3211, %rs3208, %rs3210; - xor.b16 %rs3212, %rs657, %rs647; - xor.b16 %rs3213, %rs658, %rs648; - shl.b16 %rs3214, %rs3213, 8; - or.b16 %rs3215, %rs3212, %rs3214; - mov.b32 %r2460, {%rs3211, %rs3215}; - shl.b16 %rs3216, %rs661, 8; - or.b16 %rs3217, %rs660, %rs3216; - shl.b16 %rs3218, %rs663, 8; - or.b16 %rs3219, %rs662, %rs3218; - mov.b32 
%r2461, {%rs3217, %rs3219}; - shr.u32 %r2462, %r2461, 24; - shr.u32 %r2463, %r2461, 8; - and.b32 %r2464, %r2463, 65280; - or.b32 %r2465, %r2464, %r2462; - shl.b32 %r2466, %r2461, 24; - shl.b32 %r2467, %r2461, 8; - and.b32 %r2468, %r2467, 16711680; - or.b32 %r2469, %r2466, %r2468; - or.b32 %r2470, %r2469, %r2465; - xor.b16 %rs3220, %rs660, %rs650; - xor.b16 %rs3221, %rs661, %rs651; - shl.b16 %rs3222, %rs3221, 8; - or.b16 %rs3223, %rs3220, %rs3222; - xor.b16 %rs3224, %rs662, %rs652; - xor.b16 %rs3225, %rs663, %rs653; - shl.b16 %rs3226, %rs3225, 8; - or.b16 %rs3227, %rs3224, %rs3226; - mov.b32 %r2471, {%rs3223, %rs3227}; - shl.b16 %rs3228, %rs696, 8; - or.b16 %rs3229, %rs695, %rs3228; - shl.b16 %rs3230, %rs698, 8; - or.b16 %rs3231, %rs697, %rs3230; - mov.b32 %r2472, {%rs3229, %rs3231}; - shr.u32 %r2473, %r2472, 24; - shr.u32 %r2474, %r2472, 8; - and.b32 %r2475, %r2474, 65280; - or.b32 %r2476, %r2475, %r2473; - shl.b32 %r2477, %r2472, 24; - shl.b32 %r2478, %r2472, 8; - and.b32 %r2479, %r2478, 16711680; - or.b32 %r2480, %r2477, %r2479; - or.b32 %r2481, %r2480, %r2476; - shl.b16 %rs3232, %rs701, 8; - or.b16 %rs3233, %rs700, %rs3232; - shl.b16 %rs3234, %rs703, 8; - or.b16 %rs3235, %rs702, %rs3234; - mov.b32 %r2482, {%rs3233, %rs3235}; - shr.u32 %r2483, %r2482, 24; - shr.u32 %r2484, %r2482, 8; - and.b32 %r2485, %r2484, 65280; - or.b32 %r2486, %r2485, %r2483; - shl.b32 %r2487, %r2482, 24; - shl.b32 %r2488, %r2482, 8; - and.b32 %r2489, %r2488, 16711680; - or.b32 %r2490, %r2487, %r2489; - or.b32 %r2491, %r2490, %r2486; - xor.b32 %r2492, %r9088, %r9087; - and.b32 %r2493, %r2492, %r9086; - xor.b32 %r2494, %r2493, %r9088; - shf.l.wrap.b32 %r2495, %r9085, %r9085, 5; - add.s32 %r2496, %r2495, %r9089; - add.s32 %r2497, %r2496, %r2494; - add.s32 %r2498, %r2497, %r2395; - add.s32 %r2499, %r2498, 1518500249; - shf.l.wrap.b32 %r2500, %r2499, %r2499, 5; - shf.l.wrap.b32 %r2501, %r9086, %r9086, 30; - xor.b32 %r2502, %r2501, %r9087; - and.b32 %r2503, %r2502, %r9085; - xor.b32 %r2504, 
%r2503, %r9087; - add.s32 %r2505, %r9088, %r2504; - add.s32 %r2506, %r2505, %r2405; - add.s32 %r2507, %r2506, %r2500; - add.s32 %r2508, %r2507, 1518500249; - shf.l.wrap.b32 %r2509, %r2508, %r2508, 5; - shf.l.wrap.b32 %r2510, %r9085, %r9085, 30; - xor.b32 %r2511, %r2501, %r2510; - and.b32 %r2512, %r2499, %r2511; - xor.b32 %r2513, %r2512, %r2501; - add.s32 %r2514, %r9087, %r2415; - add.s32 %r2515, %r2514, %r2513; - add.s32 %r2516, %r2515, %r2509; - add.s32 %r2517, %r2516, 1518500249; - shf.l.wrap.b32 %r2518, %r2499, %r2499, 30; - shf.l.wrap.b32 %r2519, %r2517, %r2517, 5; - xor.b32 %r2520, %r2518, %r2510; - and.b32 %r2521, %r2508, %r2520; - xor.b32 %r2522, %r2521, %r2510; - add.s32 %r2523, %r2501, %r2426; - add.s32 %r2524, %r2523, %r2522; - add.s32 %r2525, %r2524, %r2519; - add.s32 %r2526, %r2525, 1518500249; - shf.l.wrap.b32 %r2527, %r2508, %r2508, 30; - shf.l.wrap.b32 %r2528, %r2526, %r2526, 5; - xor.b32 %r2529, %r2527, %r2518; - and.b32 %r2530, %r2529, %r2517; - xor.b32 %r2531, %r2530, %r2518; - add.s32 %r2532, %r2510, %r2437; - add.s32 %r2533, %r2532, %r2531; - add.s32 %r2534, %r2533, %r2528; - add.s32 %r2535, %r2534, 1518500249; - shf.l.wrap.b32 %r2536, %r2517, %r2517, 30; - shf.l.wrap.b32 %r2537, %r2535, %r2535, 5; - xor.b32 %r2538, %r2536, %r2527; - and.b32 %r2539, %r2538, %r2526; - xor.b32 %r2540, %r2539, %r2527; - add.s32 %r2541, %r2518, %r2448; - add.s32 %r2542, %r2541, %r2540; - add.s32 %r2543, %r2542, %r2537; - add.s32 %r2544, %r2543, 1518500249; - shf.l.wrap.b32 %r2545, %r2526, %r2526, 30; - shf.l.wrap.b32 %r2546, %r2544, %r2544, 5; - xor.b32 %r2547, %r2545, %r2536; - and.b32 %r2548, %r2535, %r2547; - xor.b32 %r2549, %r2548, %r2536; - add.s32 %r2550, %r2527, %r2459; - add.s32 %r2551, %r2550, %r2549; - add.s32 %r2552, %r2551, %r2546; - add.s32 %r2553, %r2552, 1518500249; - shf.l.wrap.b32 %r2554, %r2535, %r2535, 30; - shf.l.wrap.b32 %r2555, %r2553, %r2553, 5; - xor.b32 %r2556, %r2554, %r2545; - and.b32 %r2557, %r2544, %r2556; - xor.b32 %r2558, %r2557, 
%r2545; - add.s32 %r2559, %r2536, %r2470; - add.s32 %r2560, %r2559, %r2558; - add.s32 %r2561, %r2560, %r2555; - add.s32 %r2562, %r2561, 1518500249; - shf.l.wrap.b32 %r2563, %r2544, %r2544, 30; - cvt.u64.u32 %rd2722, %r2554; - cvt.u64.u32 %rd2723, %r2563; - cvt.u64.u32 %rd2724, %r2553; - cvt.u64.u32 %rd2725, %r2562; - bfi.b64 %rd2726, %rd2724, %rd2725, 32, 32; - bfi.b64 %rd2727, %rd2722, %rd2723, 32, 32; - mov.b64 {%r2564, %r2565}, %rd2726; - mov.b64 {%r2566, %r2567}, %rd2727; - shl.b16 %rs3236, %rs681, 8; - or.b16 %rs3237, %rs680, %rs3236; - shl.b16 %rs3238, %rs683, 8; - or.b16 %rs3239, %rs682, %rs3238; - mov.b32 %r2568, {%rs3237, %rs3239}; - shr.u32 %r2569, %r2568, 24; - shr.u32 %r2570, %r2568, 8; - and.b32 %r2571, %r2570, 65280; - or.b32 %r2572, %r2571, %r2569; - shl.b32 %r2573, %r2568, 24; - shl.b32 %r2574, %r2568, 8; - and.b32 %r2575, %r2574, 16711680; - or.b32 %r2576, %r2573, %r2575; - or.b32 %r2577, %r2576, %r2572; - cvt.u64.u32 %rd2728, %r2577; - shl.b16 %rs3240, %rs676, 8; - or.b16 %rs3241, %rs675, %rs3240; - shl.b16 %rs3242, %rs678, 8; - or.b16 %rs3243, %rs677, %rs3242; - mov.b32 %r2578, {%rs3241, %rs3243}; - shr.u32 %r2579, %r2578, 24; - shr.u32 %r2580, %r2578, 8; - and.b32 %r2581, %r2580, 65280; - or.b32 %r2582, %r2581, %r2579; - shl.b32 %r2583, %r2578, 24; - shl.b32 %r2584, %r2578, 8; - and.b32 %r2585, %r2584, 16711680; - or.b32 %r2586, %r2583, %r2585; - or.b32 %r2587, %r2586, %r2582; - shl.b16 %rs3244, %rs671, 8; - or.b16 %rs3245, %rs670, %rs3244; - shl.b16 %rs3246, %rs673, 8; - or.b16 %rs3247, %rs672, %rs3246; - mov.b32 %r2588, {%rs3245, %rs3247}; - shr.u32 %r2589, %r2588, 24; - shr.u32 %r2590, %r2588, 8; - and.b32 %r2591, %r2590, 65280; - or.b32 %r2592, %r2591, %r2589; - shl.b32 %r2593, %r2588, 24; - shl.b32 %r2594, %r2588, 8; - and.b32 %r2595, %r2594, 16711680; - or.b32 %r2596, %r2593, %r2595; - or.b32 %r2597, %r2596, %r2592; - cvt.u64.u32 %rd2729, %r2597; - shl.b16 %rs3248, %rs666, 8; - or.b16 %rs3249, %rs665, %rs3248; - shl.b16 %rs3250, %rs668, 8; 
- or.b16 %rs3251, %rs667, %rs3250; - mov.b32 %r2598, {%rs3249, %rs3251}; - shr.u32 %r2599, %r2598, 24; - shr.u32 %r2600, %r2598, 8; - and.b32 %r2601, %r2600, 65280; - or.b32 %r2602, %r2601, %r2599; - shl.b32 %r2603, %r2598, 24; - shl.b32 %r2604, %r2598, 8; - and.b32 %r2605, %r2604, 16711680; - or.b32 %r2606, %r2603, %r2605; - or.b32 %r2607, %r2606, %r2602; - cvt.u64.u32 %rd2730, %r2607; - cvt.u64.u32 %rd2731, %r2587; - bfi.b64 %rd2732, %rd2728, %rd2731, 32, 32; - bfi.b64 %rd2733, %rd2729, %rd2730, 32, 32; - mov.b64 {%r2608, %r2609}, %rd2733; - mov.b64 {%r2610, %r2611}, %rd2732; - cvt.u64.u32 %rd2734, %r2567; - cvt.u64.u32 %rd2735, %r2565; - cvt.u64.u32 %rd2736, %r2566; - bfi.b64 %rd2737, %rd2735, %rd2725, 32, 32; - bfi.b64 %rd2738, %rd2734, %rd2736, 32, 32; - mov.b64 {%r2612, %r2613}, %rd2737; - mov.b64 {%r2614, %r2615}, %rd2738; - shf.l.wrap.b32 %r2616, %r2612, %r2612, 5; - xor.b32 %r2617, %r2615, %r2614; - and.b32 %r2618, %r2617, %r2613; - xor.b32 %r2619, %r2618, %r2615; - add.s32 %r2620, %r2545, %r2608; - add.s32 %r2621, %r2620, %r2616; - add.s32 %r2622, %r2621, %r2619; - add.s32 %r2623, %r2622, 1518500249; - shf.l.wrap.b32 %r2624, %r2613, %r2613, 30; - shf.l.wrap.b32 %r2625, %r2623, %r2623, 5; - xor.b32 %r2626, %r2624, %r2614; - and.b32 %r2627, %r2626, %r2612; - xor.b32 %r2628, %r2627, %r2614; - add.s32 %r2629, %r2609, %r2615; - add.s32 %r2630, %r2629, %r2628; - add.s32 %r2631, %r2630, %r2625; - add.s32 %r2632, %r2631, 1518500249; - shf.l.wrap.b32 %r2633, %r2612, %r2612, 30; - shf.l.wrap.b32 %r2634, %r2632, %r2632, 5; - xor.b32 %r2635, %r2624, %r2633; - and.b32 %r2636, %r2623, %r2635; - xor.b32 %r2637, %r2636, %r2624; - add.s32 %r2638, %r2610, %r2614; - add.s32 %r2639, %r2638, %r2637; - add.s32 %r2640, %r2639, %r2634; - add.s32 %r2641, %r2640, 1518500249; - shf.l.wrap.b32 %r2642, %r2623, %r2623, 30; - shf.l.wrap.b32 %r2643, %r2641, %r2641, 5; - xor.b32 %r2644, %r2642, %r2633; - and.b32 %r2645, %r2632, %r2644; - xor.b32 %r2646, %r2645, %r2633; - add.s32 %r2647, 
%r2611, %r2624; - add.s32 %r2648, %r2647, %r2646; - add.s32 %r2649, %r2648, %r2643; - add.s32 %r2650, %r2649, 1518500249; - shf.l.wrap.b32 %r2651, %r2632, %r2632, 30; - cvt.u64.u32 %rd2739, %r2491; - shl.b16 %rs3252, %rs691, 8; - or.b16 %rs3253, %rs690, %rs3252; - shl.b16 %rs3254, %rs693, 8; - or.b16 %rs3255, %rs692, %rs3254; - mov.b32 %r2652, {%rs3253, %rs3255}; - shr.u32 %r2653, %r2652, 24; - shr.u32 %r2654, %r2652, 8; - and.b32 %r2655, %r2654, 65280; - or.b32 %r2656, %r2655, %r2653; - shl.b32 %r2657, %r2652, 24; - shl.b32 %r2658, %r2652, 8; - and.b32 %r2659, %r2658, 16711680; - or.b32 %r2660, %r2657, %r2659; - or.b32 %r2661, %r2660, %r2656; - cvt.u64.u32 %rd2740, %r2661; - shl.b16 %rs3256, %rs686, 8; - or.b16 %rs3257, %rs685, %rs3256; - shl.b16 %rs3258, %rs688, 8; - or.b16 %rs3259, %rs687, %rs3258; - mov.b32 %r2662, {%rs3257, %rs3259}; - shr.u32 %r2663, %r2662, 24; - shr.u32 %r2664, %r2662, 8; - and.b32 %r2665, %r2664, 65280; - or.b32 %r2666, %r2665, %r2663; - shl.b32 %r2667, %r2662, 24; - shl.b32 %r2668, %r2662, 8; - and.b32 %r2669, %r2668, 16711680; - or.b32 %r2670, %r2667, %r2669; - or.b32 %r2671, %r2670, %r2666; - cvt.u64.u32 %rd2741, %r2671; - cvt.u64.u32 %rd2742, %r2481; - bfi.b64 %rd2743, %rd2739, %rd2742, 32, 32; - bfi.b64 %rd2744, %rd2740, %rd2741, 32, 32; - mov.b64 {%r2672, %r2673}, %rd2744; - mov.b64 {%r2674, %r2675}, %rd2743; - shf.l.wrap.b32 %r2676, %r2650, %r2650, 5; - xor.b32 %r2677, %r2651, %r2642; - and.b32 %r2678, %r2677, %r2641; - xor.b32 %r2679, %r2678, %r2642; - add.s32 %r2680, %r2672, %r2633; - add.s32 %r2681, %r2680, %r2679; - add.s32 %r2682, %r2681, %r2676; - add.s32 %r2683, %r2682, 1518500249; - shf.l.wrap.b32 %r2684, %r2641, %r2641, 30; - shf.l.wrap.b32 %r2685, %r2683, %r2683, 5; - xor.b32 %r2686, %r2684, %r2651; - and.b32 %r2687, %r2686, %r2650; - xor.b32 %r2688, %r2687, %r2651; - add.s32 %r2689, %r2673, %r2642; - add.s32 %r2690, %r2689, %r2688; - add.s32 %r2691, %r2690, %r2685; - add.s32 %r2692, %r2691, 1518500249; - shf.l.wrap.b32 
%r2693, %r2650, %r2650, 30; - shf.l.wrap.b32 %r2694, %r2692, %r2692, 5; - xor.b32 %r2695, %r2693, %r2684; - and.b32 %r2696, %r2683, %r2695; - xor.b32 %r2697, %r2696, %r2684; - add.s32 %r2698, %r2674, %r2651; - add.s32 %r2699, %r2698, %r2697; - add.s32 %r2700, %r2699, %r2694; - add.s32 %r2701, %r2700, 1518500249; - shf.l.wrap.b32 %r2702, %r2683, %r2683, 30; - shf.l.wrap.b32 %r2703, %r2701, %r2701, 5; - xor.b32 %r2704, %r2702, %r2693; - and.b32 %r2705, %r2692, %r2704; - xor.b32 %r2706, %r2705, %r2693; - add.s32 %r2707, %r2675, %r2684; - add.s32 %r2708, %r2707, %r2706; - add.s32 %r2709, %r2708, %r2703; - add.s32 %r2710, %r2709, 1518500249; - shf.l.wrap.b32 %r2711, %r2692, %r2692, 30; - cvt.u64.u32 %rd2745, %r2702; - cvt.u64.u32 %rd2746, %r2711; - cvt.u64.u32 %rd2747, %r2701; - cvt.u64.u32 %rd2748, %r2710; - bfi.b64 %rd2749, %rd2747, %rd2748, 32, 32; - bfi.b64 %rd2750, %rd2745, %rd2746, 32, 32; - mov.b64 {%r2712, %r2713}, %rd2749; - mov.b64 {%r2714, %r2715}, %rd2750; - shr.u32 %r2716, %r2449, 24; - shr.u32 %r2717, %r2449, 8; - and.b32 %r2718, %r2717, 65280; - or.b32 %r2719, %r2718, %r2716; - shl.b32 %r2720, %r2449, 24; - shl.b32 %r2721, %r2449, 8; - and.b32 %r2722, %r2721, 16711680; - or.b32 %r2723, %r2720, %r2722; - or.b32 %r2724, %r2723, %r2719; - cvt.u64.u32 %rd2751, %r2724; - shr.u32 %r2725, %r2438, 24; - shr.u32 %r2726, %r2438, 8; - and.b32 %r2727, %r2726, 65280; - or.b32 %r2728, %r2727, %r2725; - shl.b32 %r2729, %r2438, 24; - shl.b32 %r2730, %r2438, 8; - and.b32 %r2731, %r2730, 16711680; - or.b32 %r2732, %r2729, %r2731; - or.b32 %r2733, %r2732, %r2728; - shr.u32 %r2734, %r2427, 24; - shr.u32 %r2735, %r2427, 8; - and.b32 %r2736, %r2735, 65280; - or.b32 %r2737, %r2736, %r2734; - shl.b32 %r2738, %r2427, 24; - shl.b32 %r2739, %r2427, 8; - and.b32 %r2740, %r2739, 16711680; - or.b32 %r2741, %r2738, %r2740; - or.b32 %r2742, %r2741, %r2737; - cvt.u64.u32 %rd2752, %r2742; - shr.u32 %r2743, %r2416, 24; - shr.u32 %r2744, %r2416, 8; - and.b32 %r2745, %r2744, 65280; - or.b32 
%r2746, %r2745, %r2743; - shl.b32 %r2747, %r2416, 24; - shl.b32 %r2748, %r2416, 8; - and.b32 %r2749, %r2748, 16711680; - or.b32 %r2750, %r2747, %r2749; - or.b32 %r2751, %r2750, %r2746; - cvt.u64.u32 %rd2753, %r2751; - cvt.u64.u32 %rd2754, %r2733; - bfi.b64 %rd2755, %rd2751, %rd2754, 32, 32; - bfi.b64 %rd2756, %rd2752, %rd2753, 32, 32; - mov.b64 {%r2752, %r2753}, %rd2756; - mov.b64 {%r2754, %r2755}, %rd2755; - xor.b16 %rs3260, %rs665, %rs3160; - xor.b16 %rs3261, %rs666, %rs3161; - shl.b16 %rs3262, %rs3261, 8; - or.b16 %rs3263, %rs3260, %rs3262; - xor.b16 %rs3264, %rs667, %rs3164; - xor.b16 %rs3265, %rs668, %rs3165; - shl.b16 %rs3266, %rs3265, 8; - or.b16 %rs3267, %rs3264, %rs3266; - mov.b32 %r2756, {%rs3263, %rs3267}; - shr.u32 %r2757, %r2756, 24; - shr.u32 %r2758, %r2756, 8; - and.b32 %r2759, %r2758, 65280; - or.b32 %r2760, %r2759, %r2757; - shl.b32 %r2761, %r2756, 24; - shl.b32 %r2762, %r2756, 8; - and.b32 %r2763, %r2762, 16711680; - or.b32 %r2764, %r2761, %r2763; - or.b32 %r2765, %r2764, %r2760; - xor.b32 %r2766, %r2609, %r2753; - xor.b32 %r2767, %r2610, %r2754; - xor.b32 %r2768, %r2611, %r2755; - xor.b32 %r2769, %r2673, %r2765; - xor.b32 %r2770, %r2766, %r2674; - shf.l.wrap.b32 %r2771, %r2770, %r2770, 1; - xor.b32 %r2772, %r2767, %r2675; - shf.l.wrap.b32 %r2773, %r2772, %r2772, 1; - shf.l.wrap.b32 %r2774, %r2769, %r2769, 1; - xor.b32 %r2775, %r2768, %r2774; - shf.l.wrap.b32 %r2776, %r2775, %r2775, 1; - cvt.u64.u32 %rd2757, %r2776; - cvt.u64.u32 %rd2758, %r2771; - cvt.u64.u32 %rd2759, %r2774; - cvt.u64.u32 %rd2760, %r2773; - bfi.b64 %rd2761, %rd2757, %rd2760, 32, 32; - bfi.b64 %rd2762, %rd2758, %rd2759, 32, 32; - mov.b64 {%r2777, %r2778}, %rd2762; - mov.b64 {%r2779, %r2780}, %rd2761; - cvt.u64.u32 %rd2763, %r2715; - cvt.u64.u32 %rd2764, %r2713; - cvt.u64.u32 %rd2765, %r2714; - bfi.b64 %rd2766, %rd2764, %rd2748, 32, 32; - bfi.b64 %rd2767, %rd2763, %rd2765, 32, 32; - mov.b64 {%r2781, %r2782}, %rd2766; - mov.b64 {%r2783, %r2784}, %rd2767; - shf.l.wrap.b32 %r2785, 
%r2781, %r2781, 5; - xor.b32 %r2786, %r2784, %r2783; - and.b32 %r2787, %r2786, %r2782; - xor.b32 %r2788, %r2787, %r2784; - add.s32 %r2789, %r2777, %r2693; - add.s32 %r2790, %r2789, %r2785; - add.s32 %r2791, %r2790, %r2788; - add.s32 %r2792, %r2791, 1518500249; - shf.l.wrap.b32 %r2793, %r2782, %r2782, 30; - shf.l.wrap.b32 %r2794, %r2792, %r2792, 5; - xor.b32 %r2795, %r2793, %r2783; - and.b32 %r2796, %r2795, %r2781; - xor.b32 %r2797, %r2796, %r2783; - add.s32 %r2798, %r2778, %r2784; - add.s32 %r2799, %r2798, %r2797; - add.s32 %r2800, %r2799, %r2794; - add.s32 %r2801, %r2800, 1518500249; - shf.l.wrap.b32 %r2802, %r2781, %r2781, 30; - shf.l.wrap.b32 %r2803, %r2801, %r2801, 5; - xor.b32 %r2804, %r2793, %r2802; - and.b32 %r2805, %r2792, %r2804; - xor.b32 %r2806, %r2805, %r2793; - add.s32 %r2807, %r2779, %r2783; - add.s32 %r2808, %r2807, %r2806; - add.s32 %r2809, %r2808, %r2803; - add.s32 %r2810, %r2809, 1518500249; - shf.l.wrap.b32 %r2811, %r2792, %r2792, 30; - shf.l.wrap.b32 %r2812, %r2810, %r2810, 5; - xor.b32 %r2813, %r2811, %r2802; - and.b32 %r2814, %r2801, %r2813; - xor.b32 %r2815, %r2814, %r2802; - add.s32 %r2816, %r2780, %r2793; - add.s32 %r2817, %r2816, %r2815; - add.s32 %r2818, %r2817, %r2812; - add.s32 %r2819, %r2818, 1518500249; - shf.l.wrap.b32 %r2820, %r2801, %r2801, 30; - xor.b32 %r2821, %r2608, %r2459; - xor.b32 %r2822, %r2609, %r2470; - cvt.u64.u32 %rd2768, %r2822; - shr.u32 %r2823, %r2471, 24; - shr.u32 %r2824, %r2471, 8; - and.b32 %r2825, %r2824, 65280; - or.b32 %r2826, %r2825, %r2823; - shl.b32 %r2827, %r2471, 24; - shl.b32 %r2828, %r2471, 8; - and.b32 %r2829, %r2828, 16711680; - or.b32 %r2830, %r2827, %r2829; - or.b32 %r2831, %r2830, %r2826; - cvt.u64.u32 %rd2769, %r2831; - shr.u32 %r2832, %r2460, 24; - shr.u32 %r2833, %r2460, 8; - and.b32 %r2834, %r2833, 65280; - or.b32 %r2835, %r2834, %r2832; - shl.b32 %r2836, %r2460, 24; - shl.b32 %r2837, %r2460, 8; - and.b32 %r2838, %r2837, 16711680; - or.b32 %r2839, %r2836, %r2838; - or.b32 %r2840, %r2839, 
%r2835; - cvt.u64.u32 %rd2770, %r2840; - cvt.u64.u32 %rd2771, %r2821; - bfi.b64 %rd2772, %rd2768, %rd2771, 32, 32; - bfi.b64 %rd2773, %rd2769, %rd2770, 32, 32; - mov.b64 {%r2841, %r2842}, %rd2773; - mov.b64 {%r2843, %r2844}, %rd2772; - xor.b16 %rs3268, %rs3208, %rs685; - xor.b16 %rs3269, %rs3209, %rs686; - shl.b16 %rs3270, %rs3269, 8; - or.b16 %rs3271, %rs3268, %rs3270; - xor.b16 %rs3272, %rs3212, %rs687; - xor.b16 %rs3273, %rs3213, %rs688; - shl.b16 %rs3274, %rs3273, 8; - or.b16 %rs3275, %rs3272, %rs3274; - mov.b32 %r2845, {%rs3271, %rs3275}; - shr.u32 %r2846, %r2845, 24; - shr.u32 %r2847, %r2845, 8; - and.b32 %r2848, %r2847, 65280; - or.b32 %r2849, %r2848, %r2846; - shl.b32 %r2850, %r2845, 24; - shl.b32 %r2851, %r2845, 8; - and.b32 %r2852, %r2851, 16711680; - or.b32 %r2853, %r2850, %r2852; - or.b32 %r2854, %r2853, %r2849; - xor.b32 %r2855, %r2842, %r2673; - xor.b32 %r2856, %r2843, %r2674; - xor.b32 %r2857, %r2844, %r2675; - xor.b32 %r2858, %r2778, %r2854; - xor.b32 %r2859, %r2855, %r2779; - shf.l.wrap.b32 %r2860, %r2859, %r2859, 1; - xor.b32 %r2861, %r2856, %r2780; - shf.l.wrap.b32 %r2862, %r2861, %r2861, 1; - shf.l.wrap.b32 %r2863, %r2858, %r2858, 1; - xor.b32 %r2864, %r2857, %r2863; - shf.l.wrap.b32 %r2865, %r2864, %r2864, 1; - cvt.u64.u32 %rd2774, %r2865; - cvt.u64.u32 %rd2775, %r2860; - cvt.u64.u32 %rd2776, %r2862; - bfi.b64 %rd2777, %rd2774, %rd2776, 32, 32; - cvt.u64.u32 %rd2778, %r2863; - bfi.b64 %rd2779, %rd2775, %rd2778, 32, 32; - mov.b64 {%r2866, %r2867}, %rd2779; - mov.b64 {%r2868, %r2869}, %rd2777; - cvt.u64.u32 %rd2780, %r2869; - cvt.u64.u32 %rd2781, %r2867; - cvt.u64.u32 %rd2782, %r2868; - bfi.b64 %rd2783, %rd2780, %rd2782, 32, 32; - bfi.b64 %rd2784, %rd2781, %rd2778, 32, 32; - mov.b64 {%r2870, %r2871}, %rd2784; - mov.b64 {%r2872, %r2873}, %rd2783; - shf.l.wrap.b32 %r2874, %r2819, %r2819, 5; - xor.b32 %r2875, %r2820, %r2811; - xor.b32 %r2876, %r2875, %r2810; - add.s32 %r2877, %r2870, %r2802; - add.s32 %r2878, %r2877, %r2876; - add.s32 %r2879, 
%r2878, %r2874; - add.s32 %r2880, %r2879, 1859775393; - shf.l.wrap.b32 %r2881, %r2810, %r2810, 30; - shf.l.wrap.b32 %r2882, %r2880, %r2880, 5; - xor.b32 %r2883, %r2881, %r2820; - xor.b32 %r2884, %r2883, %r2819; - add.s32 %r2885, %r2871, %r2811; - add.s32 %r2886, %r2885, %r2884; - add.s32 %r2887, %r2886, %r2882; - add.s32 %r2888, %r2887, 1859775393; - shf.l.wrap.b32 %r2889, %r2819, %r2819, 30; - shf.l.wrap.b32 %r2890, %r2888, %r2888, 5; - xor.b32 %r2891, %r2889, %r2881; - xor.b32 %r2892, %r2891, %r2880; - add.s32 %r2893, %r2872, %r2820; - add.s32 %r2894, %r2893, %r2892; - add.s32 %r2895, %r2894, %r2890; - add.s32 %r2896, %r2895, 1859775393; - shf.l.wrap.b32 %r2897, %r2880, %r2880, 30; - shf.l.wrap.b32 %r2898, %r2896, %r2896, 5; - xor.b32 %r2899, %r2897, %r2889; - xor.b32 %r2900, %r2899, %r2888; - add.s32 %r2901, %r2873, %r2881; - add.s32 %r2902, %r2901, %r2900; - add.s32 %r2903, %r2902, %r2898; - add.s32 %r2904, %r2903, 1859775393; - shf.l.wrap.b32 %r2905, %r2888, %r2888, 30; - cvt.u64.u32 %rd2785, %r2897; - cvt.u64.u32 %rd2786, %r2905; - cvt.u64.u32 %rd2787, %r2896; - cvt.u64.u32 %rd2788, %r2904; - bfi.b64 %rd2789, %rd2787, %rd2788, 32, 32; - bfi.b64 %rd2790, %rd2785, %rd2786, 32, 32; - mov.b64 {%r2906, %r2907}, %rd2789; - mov.b64 {%r2908, %r2909}, %rd2790; - xor.b32 %r2910, %r2611, %r2609; - xor.b32 %r2911, %r2672, %r2610; - xor.b32 %r2912, %r2673, %r2611; - cvt.u64.u32 %rd2791, %r2912; - cvt.u64.u32 %rd2792, %r2910; - xor.b32 %r2913, %r2610, %r2608; - cvt.u64.u32 %rd2793, %r2913; - cvt.u64.u32 %rd2794, %r2911; - bfi.b64 %rd2795, %rd2791, %rd2794, 32, 32; - bfi.b64 %rd2796, %rd2792, %rd2793, 32, 32; - mov.b64 {%r2914, %r2915}, %rd2796; - mov.b64 {%r2916, %r2917}, %rd2795; - xor.b32 %r2918, %r2774, %r2913; - xor.b32 %r2919, %r2778, %r2915; - xor.b32 %r2920, %r2779, %r2916; - xor.b32 %r2921, %r2780, %r2917; - xor.b32 %r2922, %r2871, %r2918; - xor.b32 %r2923, %r2919, %r2872; - shf.l.wrap.b32 %r2924, %r2923, %r2923, 1; - xor.b32 %r2925, %r2920, %r2873; - 
shf.l.wrap.b32 %r2926, %r2925, %r2925, 1; - shf.l.wrap.b32 %r2927, %r2922, %r2922, 1; - xor.b32 %r2928, %r2921, %r2927; - shf.l.wrap.b32 %r2929, %r2928, %r2928, 1; - cvt.u64.u32 %rd2797, %r2929; - cvt.u64.u32 %rd2798, %r2924; - cvt.u64.u32 %rd2799, %r2926; - bfi.b64 %rd2800, %rd2797, %rd2799, 32, 32; - cvt.u64.u32 %rd2801, %r2927; - bfi.b64 %rd2802, %rd2798, %rd2801, 32, 32; - mov.b64 {%r2930, %r2931}, %rd2802; - mov.b64 {%r2932, %r2933}, %rd2800; - cvt.u64.u32 %rd2803, %r2933; - cvt.u64.u32 %rd2804, %r2931; - cvt.u64.u32 %rd2805, %r2932; - bfi.b64 %rd2806, %rd2803, %rd2805, 32, 32; - bfi.b64 %rd2807, %rd2804, %rd2801, 32, 32; - mov.b64 {%r2934, %r2935}, %rd2807; - mov.b64 {%r2936, %r2937}, %rd2806; - cvt.u64.u32 %rd2808, %r2909; - cvt.u64.u32 %rd2809, %r2907; - cvt.u64.u32 %rd2810, %r2908; - bfi.b64 %rd2811, %rd2809, %rd2788, 32, 32; - bfi.b64 %rd2812, %rd2808, %rd2810, 32, 32; - mov.b64 {%r2938, %r2939}, %rd2811; - mov.b64 {%r2940, %r2941}, %rd2812; - shf.l.wrap.b32 %r2942, %r2938, %r2938, 5; - xor.b32 %r2943, %r2940, %r2939; - xor.b32 %r2944, %r2943, %r2941; - add.s32 %r2945, %r2934, %r2889; - add.s32 %r2946, %r2945, %r2942; - add.s32 %r2947, %r2946, %r2944; - add.s32 %r2948, %r2947, 1859775393; - shf.l.wrap.b32 %r2949, %r2939, %r2939, 30; - shf.l.wrap.b32 %r2950, %r2948, %r2948, 5; - xor.b32 %r2951, %r2940, %r2938; - xor.b32 %r2952, %r2951, %r2949; - add.s32 %r2953, %r2935, %r2941; - add.s32 %r2954, %r2953, %r2952; - add.s32 %r2955, %r2954, %r2950; - add.s32 %r2956, %r2955, 1859775393; - shf.l.wrap.b32 %r2957, %r2938, %r2938, 30; - shf.l.wrap.b32 %r2958, %r2956, %r2956, 5; - xor.b32 %r2959, %r2949, %r2957; - xor.b32 %r2960, %r2959, %r2948; - add.s32 %r2961, %r2936, %r2940; - add.s32 %r2962, %r2961, %r2960; - add.s32 %r2963, %r2962, %r2958; - add.s32 %r2964, %r2963, 1859775393; - shf.l.wrap.b32 %r2965, %r2948, %r2948, 30; - shf.l.wrap.b32 %r2966, %r2964, %r2964, 5; - xor.b32 %r2967, %r2965, %r2957; - xor.b32 %r2968, %r2967, %r2956; - add.s32 %r2969, %r2937, 
%r2949; - add.s32 %r2970, %r2969, %r2968; - add.s32 %r2971, %r2970, %r2966; - add.s32 %r2972, %r2971, 1859775393; - shf.l.wrap.b32 %r2973, %r2956, %r2956, 30; - xor.b32 %r2974, %r2675, %r2673; - xor.b32 %r2975, %r2777, %r2674; - xor.b32 %r2976, %r2778, %r2675; - cvt.u64.u32 %rd2813, %r2976; - cvt.u64.u32 %rd2814, %r2974; - xor.b32 %r2977, %r2674, %r2672; - cvt.u64.u32 %rd2815, %r2977; - cvt.u64.u32 %rd2816, %r2975; - bfi.b64 %rd2817, %rd2813, %rd2816, 32, 32; - bfi.b64 %rd2818, %rd2814, %rd2815, 32, 32; - mov.b64 {%r2978, %r2979}, %rd2818; - mov.b64 {%r2980, %r2981}, %rd2817; - xor.b32 %r2982, %r2863, %r2977; - xor.b32 %r2983, %r2871, %r2979; - xor.b32 %r2984, %r2872, %r2980; - xor.b32 %r2985, %r2873, %r2981; - xor.b32 %r2986, %r2935, %r2982; - xor.b32 %r2987, %r2983, %r2936; - shf.l.wrap.b32 %r2988, %r2987, %r2987, 1; - xor.b32 %r2989, %r2984, %r2937; - shf.l.wrap.b32 %r2990, %r2989, %r2989, 1; - shf.l.wrap.b32 %r2991, %r2986, %r2986, 1; - xor.b32 %r2992, %r2985, %r2991; - shf.l.wrap.b32 %r2993, %r2992, %r2992, 1; - cvt.u64.u32 %rd2819, %r2993; - cvt.u64.u32 %rd2820, %r2988; - cvt.u64.u32 %rd2821, %r2990; - bfi.b64 %rd2822, %rd2819, %rd2821, 32, 32; - cvt.u64.u32 %rd2823, %r2991; - bfi.b64 %rd2824, %rd2820, %rd2823, 32, 32; - mov.b64 {%r2994, %r2995}, %rd2824; - mov.b64 {%r2996, %r2997}, %rd2822; - cvt.u64.u32 %rd2825, %r2997; - cvt.u64.u32 %rd2826, %r2995; - cvt.u64.u32 %rd2827, %r2996; - bfi.b64 %rd2828, %rd2825, %rd2827, 32, 32; - bfi.b64 %rd2829, %rd2826, %rd2823, 32, 32; - mov.b64 {%r2998, %r2999}, %rd2829; - mov.b64 {%r3000, %r3001}, %rd2828; - shf.l.wrap.b32 %r3002, %r2972, %r2972, 5; - xor.b32 %r3003, %r2973, %r2965; - xor.b32 %r3004, %r3003, %r2964; - add.s32 %r3005, %r2998, %r2957; - add.s32 %r3006, %r3005, %r3004; - add.s32 %r3007, %r3006, %r3002; - add.s32 %r3008, %r3007, 1859775393; - shf.l.wrap.b32 %r3009, %r2964, %r2964, 30; - shf.l.wrap.b32 %r3010, %r3008, %r3008, 5; - xor.b32 %r3011, %r3009, %r2973; - xor.b32 %r3012, %r3011, %r2972; - add.s32 
%r3013, %r2999, %r2965; - add.s32 %r3014, %r3013, %r3012; - add.s32 %r3015, %r3014, %r3010; - add.s32 %r3016, %r3015, 1859775393; - shf.l.wrap.b32 %r3017, %r2972, %r2972, 30; - shf.l.wrap.b32 %r3018, %r3016, %r3016, 5; - xor.b32 %r3019, %r3017, %r3009; - xor.b32 %r3020, %r3019, %r3008; - add.s32 %r3021, %r3000, %r2973; - add.s32 %r3022, %r3021, %r3020; - add.s32 %r3023, %r3022, %r3018; - add.s32 %r3024, %r3023, 1859775393; - shf.l.wrap.b32 %r3025, %r3008, %r3008, 30; - shf.l.wrap.b32 %r3026, %r3024, %r3024, 5; - xor.b32 %r3027, %r3025, %r3017; - xor.b32 %r3028, %r3027, %r3016; - add.s32 %r3029, %r3001, %r3009; - add.s32 %r3030, %r3029, %r3028; - add.s32 %r3031, %r3030, %r3026; - add.s32 %r3032, %r3031, 1859775393; - shf.l.wrap.b32 %r3033, %r3016, %r3016, 30; - cvt.u64.u32 %rd2830, %r3025; - cvt.u64.u32 %rd2831, %r3033; - cvt.u64.u32 %rd2832, %r3024; - cvt.u64.u32 %rd2833, %r3032; - bfi.b64 %rd2834, %rd2832, %rd2833, 32, 32; - bfi.b64 %rd2835, %rd2830, %rd2831, 32, 32; - mov.b64 {%r3034, %r3035}, %rd2834; - mov.b64 {%r3036, %r3037}, %rd2835; - xor.b32 %r3038, %r2780, %r2778; - xor.b32 %r3039, %r2870, %r2779; - xor.b32 %r3040, %r2871, %r2780; - cvt.u64.u32 %rd2836, %r3040; - cvt.u64.u32 %rd2837, %r3038; - xor.b32 %r3041, %r2779, %r2777; - cvt.u64.u32 %rd2838, %r3041; - cvt.u64.u32 %rd2839, %r3039; - bfi.b64 %rd2840, %rd2836, %rd2839, 32, 32; - bfi.b64 %rd2841, %rd2837, %rd2838, 32, 32; - mov.b64 {%r3042, %r3043}, %rd2841; - mov.b64 {%r3044, %r3045}, %rd2840; - xor.b32 %r3046, %r2927, %r3041; - xor.b32 %r3047, %r2935, %r3043; - xor.b32 %r3048, %r2936, %r3044; - xor.b32 %r3049, %r2937, %r3045; - xor.b32 %r3050, %r2999, %r3046; - xor.b32 %r3051, %r3047, %r3000; - shf.l.wrap.b32 %r3052, %r3051, %r3051, 1; - xor.b32 %r3053, %r3048, %r3001; - shf.l.wrap.b32 %r3054, %r3053, %r3053, 1; - shf.l.wrap.b32 %r3055, %r3050, %r3050, 1; - xor.b32 %r3056, %r3049, %r3055; - shf.l.wrap.b32 %r3057, %r3056, %r3056, 1; - cvt.u64.u32 %rd2842, %r3057; - cvt.u64.u32 %rd2843, %r3052; - 
cvt.u64.u32 %rd2844, %r3054; - bfi.b64 %rd2845, %rd2842, %rd2844, 32, 32; - cvt.u64.u32 %rd2846, %r3055; - bfi.b64 %rd2847, %rd2843, %rd2846, 32, 32; - mov.b64 {%r3058, %r3059}, %rd2847; - mov.b64 {%r3060, %r3061}, %rd2845; - cvt.u64.u32 %rd2848, %r3061; - cvt.u64.u32 %rd2849, %r3059; - cvt.u64.u32 %rd2850, %r3060; - bfi.b64 %rd2851, %rd2848, %rd2850, 32, 32; - bfi.b64 %rd2852, %rd2849, %rd2846, 32, 32; - mov.b64 {%r3062, %r3063}, %rd2852; - mov.b64 {%r3064, %r3065}, %rd2851; - cvt.u64.u32 %rd2853, %r3037; - cvt.u64.u32 %rd2854, %r3035; - cvt.u64.u32 %rd2855, %r3036; - bfi.b64 %rd2856, %rd2854, %rd2833, 32, 32; - bfi.b64 %rd2857, %rd2853, %rd2855, 32, 32; - mov.b64 {%r3066, %r3067}, %rd2856; - mov.b64 {%r3068, %r3069}, %rd2857; - shf.l.wrap.b32 %r3070, %r3066, %r3066, 5; - xor.b32 %r3071, %r3068, %r3067; - xor.b32 %r3072, %r3071, %r3069; - add.s32 %r3073, %r3062, %r3017; - add.s32 %r3074, %r3073, %r3070; - add.s32 %r3075, %r3074, %r3072; - add.s32 %r3076, %r3075, 1859775393; - shf.l.wrap.b32 %r3077, %r3067, %r3067, 30; - shf.l.wrap.b32 %r3078, %r3076, %r3076, 5; - xor.b32 %r3079, %r3068, %r3066; - xor.b32 %r3080, %r3079, %r3077; - add.s32 %r3081, %r3063, %r3069; - add.s32 %r3082, %r3081, %r3080; - add.s32 %r3083, %r3082, %r3078; - add.s32 %r3084, %r3083, 1859775393; - shf.l.wrap.b32 %r3085, %r3066, %r3066, 30; - shf.l.wrap.b32 %r3086, %r3084, %r3084, 5; - xor.b32 %r3087, %r3077, %r3085; - xor.b32 %r3088, %r3087, %r3076; - add.s32 %r3089, %r3064, %r3068; - add.s32 %r3090, %r3089, %r3088; - add.s32 %r3091, %r3090, %r3086; - add.s32 %r3092, %r3091, 1859775393; - shf.l.wrap.b32 %r3093, %r3076, %r3076, 30; - shf.l.wrap.b32 %r3094, %r3092, %r3092, 5; - xor.b32 %r3095, %r3093, %r3085; - xor.b32 %r3096, %r3095, %r3084; - add.s32 %r3097, %r3065, %r3077; - add.s32 %r3098, %r3097, %r3096; - add.s32 %r3099, %r3098, %r3094; - add.s32 %r3100, %r3099, 1859775393; - shf.l.wrap.b32 %r3101, %r3084, %r3084, 30; - xor.b32 %r3102, %r2873, %r2871; - xor.b32 %r3103, %r2934, %r2872; - 
xor.b32 %r3104, %r2935, %r2873; - cvt.u64.u32 %rd2858, %r3104; - cvt.u64.u32 %rd2859, %r3102; - xor.b32 %r3105, %r2872, %r2870; - cvt.u64.u32 %rd2860, %r3105; - cvt.u64.u32 %rd2861, %r3103; - bfi.b64 %rd2862, %rd2858, %rd2861, 32, 32; - bfi.b64 %rd2863, %rd2859, %rd2860, 32, 32; - mov.b64 {%r3106, %r3107}, %rd2863; - mov.b64 {%r3108, %r3109}, %rd2862; - xor.b32 %r3110, %r2991, %r3105; - xor.b32 %r3111, %r2999, %r3107; - xor.b32 %r3112, %r3000, %r3108; - xor.b32 %r3113, %r3001, %r3109; - xor.b32 %r3114, %r3063, %r3110; - xor.b32 %r3115, %r3111, %r3064; - shf.l.wrap.b32 %r3116, %r3115, %r3115, 1; - xor.b32 %r3117, %r3112, %r3065; - shf.l.wrap.b32 %r3118, %r3117, %r3117, 1; - shf.l.wrap.b32 %r3119, %r3114, %r3114, 1; - xor.b32 %r3120, %r3113, %r3119; - shf.l.wrap.b32 %r3121, %r3120, %r3120, 1; - cvt.u64.u32 %rd2864, %r3121; - cvt.u64.u32 %rd2865, %r3116; - cvt.u64.u32 %rd2866, %r3119; - cvt.u64.u32 %rd2867, %r3118; - bfi.b64 %rd2868, %rd2864, %rd2867, 32, 32; - bfi.b64 %rd2869, %rd2865, %rd2866, 32, 32; - mov.b64 {%r3122, %r3123}, %rd2869; - mov.b64 {%r3124, %r3125}, %rd2868; - shf.l.wrap.b32 %r3126, %r3100, %r3100, 5; - xor.b32 %r3127, %r3101, %r3093; - xor.b32 %r3128, %r3127, %r3092; - add.s32 %r3129, %r3122, %r3085; - add.s32 %r3130, %r3129, %r3128; - add.s32 %r3131, %r3130, %r3126; - add.s32 %r3132, %r3131, 1859775393; - shf.l.wrap.b32 %r3133, %r3092, %r3092, 30; - shf.l.wrap.b32 %r3134, %r3132, %r3132, 5; - xor.b32 %r3135, %r3133, %r3101; - xor.b32 %r3136, %r3135, %r3100; - add.s32 %r3137, %r3123, %r3093; - add.s32 %r3138, %r3137, %r3136; - add.s32 %r3139, %r3138, %r3134; - add.s32 %r3140, %r3139, 1859775393; - shf.l.wrap.b32 %r3141, %r3100, %r3100, 30; - shf.l.wrap.b32 %r3142, %r3140, %r3140, 5; - xor.b32 %r3143, %r3141, %r3133; - xor.b32 %r3144, %r3143, %r3132; - add.s32 %r3145, %r3124, %r3101; - add.s32 %r3146, %r3145, %r3144; - add.s32 %r3147, %r3146, %r3142; - add.s32 %r3148, %r3147, 1859775393; - shf.l.wrap.b32 %r3149, %r3132, %r3132, 30; - shf.l.wrap.b32 
%r3150, %r3148, %r3148, 5; - xor.b32 %r3151, %r3149, %r3141; - xor.b32 %r3152, %r3151, %r3140; - add.s32 %r3153, %r3125, %r3133; - add.s32 %r3154, %r3153, %r3152; - add.s32 %r3155, %r3154, %r3150; - add.s32 %r3156, %r3155, 1859775393; - shf.l.wrap.b32 %r3157, %r3140, %r3140, 30; - cvt.u64.u32 %rd2870, %r3149; - cvt.u64.u32 %rd2871, %r3157; - cvt.u64.u32 %rd2872, %r3148; - cvt.u64.u32 %rd2873, %r3156; - bfi.b64 %rd2874, %rd2872, %rd2873, 32, 32; - bfi.b64 %rd2875, %rd2870, %rd2871, 32, 32; - mov.b64 {%r3158, %r3159}, %rd2874; - mov.b64 {%r3160, %r3161}, %rd2875; - xor.b32 %r3162, %r2937, %r2935; - xor.b32 %r3163, %r2998, %r2936; - xor.b32 %r3164, %r2999, %r2937; - cvt.u64.u32 %rd2876, %r3164; - cvt.u64.u32 %rd2877, %r3162; - xor.b32 %r3165, %r2936, %r2934; - cvt.u64.u32 %rd2878, %r3165; - cvt.u64.u32 %rd2879, %r3163; - bfi.b64 %rd2880, %rd2876, %rd2879, 32, 32; - bfi.b64 %rd2881, %rd2877, %rd2878, 32, 32; - mov.b64 {%r3166, %r3167}, %rd2881; - mov.b64 {%r3168, %r3169}, %rd2880; - xor.b32 %r3170, %r3055, %r3165; - xor.b32 %r3171, %r3063, %r3167; - xor.b32 %r3172, %r3064, %r3168; - xor.b32 %r3173, %r3065, %r3169; - xor.b32 %r3174, %r3123, %r3170; - xor.b32 %r3175, %r3171, %r3124; - shf.l.wrap.b32 %r3176, %r3175, %r3175, 1; - xor.b32 %r3177, %r3172, %r3125; - shf.l.wrap.b32 %r3178, %r3177, %r3177, 1; - shf.l.wrap.b32 %r3179, %r3174, %r3174, 1; - xor.b32 %r3180, %r3173, %r3179; - shf.l.wrap.b32 %r3181, %r3180, %r3180, 1; - cvt.u64.u32 %rd2882, %r3181; - cvt.u64.u32 %rd2883, %r3176; - cvt.u64.u32 %rd2884, %r3178; - bfi.b64 %rd2885, %rd2882, %rd2884, 32, 32; - cvt.u64.u32 %rd2886, %r3179; - bfi.b64 %rd2887, %rd2883, %rd2886, 32, 32; - mov.b64 {%r3182, %r3183}, %rd2887; - mov.b64 {%r3184, %r3185}, %rd2885; - cvt.u64.u32 %rd2888, %r3185; - cvt.u64.u32 %rd2889, %r3183; - cvt.u64.u32 %rd2890, %r3184; - bfi.b64 %rd2891, %rd2888, %rd2890, 32, 32; - bfi.b64 %rd2892, %rd2889, %rd2886, 32, 32; - mov.b64 {%r3186, %r3187}, %rd2892; - mov.b64 {%r3188, %r3189}, %rd2891; - cvt.u64.u32 
%rd2893, %r3161; - cvt.u64.u32 %rd2894, %r3159; - cvt.u64.u32 %rd2895, %r3160; - bfi.b64 %rd2896, %rd2894, %rd2873, 32, 32; - bfi.b64 %rd2897, %rd2893, %rd2895, 32, 32; - mov.b64 {%r3190, %r3191}, %rd2896; - mov.b64 {%r3192, %r3193}, %rd2897; - shf.l.wrap.b32 %r3194, %r3190, %r3190, 5; - xor.b32 %r3195, %r3193, %r3192; - and.b32 %r3196, %r3195, %r3191; - and.b32 %r3197, %r3193, %r3192; - xor.b32 %r3198, %r3196, %r3197; - add.s32 %r3199, %r3186, %r3141; - add.s32 %r3200, %r3199, %r3194; - add.s32 %r3201, %r3200, %r3198; - add.s32 %r3202, %r3201, -1894007588; - shf.l.wrap.b32 %r3203, %r3191, %r3191, 30; - shf.l.wrap.b32 %r3204, %r3202, %r3202, 5; - xor.b32 %r3205, %r3203, %r3192; - and.b32 %r3206, %r3205, %r3190; - and.b32 %r3207, %r3203, %r3192; - xor.b32 %r3208, %r3206, %r3207; - add.s32 %r3209, %r3187, %r3193; - add.s32 %r3210, %r3209, %r3208; - add.s32 %r3211, %r3210, %r3204; - add.s32 %r3212, %r3211, -1894007588; - shf.l.wrap.b32 %r3213, %r3190, %r3190, 30; - shf.l.wrap.b32 %r3214, %r3212, %r3212, 5; - xor.b32 %r3215, %r3203, %r3213; - and.b32 %r3216, %r3202, %r3215; - and.b32 %r3217, %r3203, %r3213; - xor.b32 %r3218, %r3216, %r3217; - add.s32 %r3219, %r3188, %r3192; - add.s32 %r3220, %r3219, %r3218; - add.s32 %r3221, %r3220, %r3214; - add.s32 %r3222, %r3221, -1894007588; - shf.l.wrap.b32 %r3223, %r3202, %r3202, 30; - shf.l.wrap.b32 %r3224, %r3222, %r3222, 5; - xor.b32 %r3225, %r3223, %r3213; - and.b32 %r3226, %r3212, %r3225; - and.b32 %r3227, %r3223, %r3213; - xor.b32 %r3228, %r3226, %r3227; - add.s32 %r3229, %r3189, %r3203; - add.s32 %r3230, %r3229, %r3228; - add.s32 %r3231, %r3230, %r3224; - add.s32 %r3232, %r3231, -1894007588; - shf.l.wrap.b32 %r3233, %r3212, %r3212, 30; - xor.b32 %r3234, %r3001, %r2999; - xor.b32 %r3235, %r3062, %r3000; - xor.b32 %r3236, %r3063, %r3001; - cvt.u64.u32 %rd2898, %r3236; - cvt.u64.u32 %rd2899, %r3234; - xor.b32 %r3237, %r3000, %r2998; - cvt.u64.u32 %rd2900, %r3237; - cvt.u64.u32 %rd2901, %r3235; - bfi.b64 %rd2902, %rd2898, 
%rd2901, 32, 32; - bfi.b64 %rd2903, %rd2899, %rd2900, 32, 32; - mov.b64 {%r3238, %r3239}, %rd2903; - mov.b64 {%r3240, %r3241}, %rd2902; - xor.b32 %r3242, %r3119, %r3237; - xor.b32 %r3243, %r3123, %r3239; - xor.b32 %r3244, %r3124, %r3240; - xor.b32 %r3245, %r3125, %r3241; - xor.b32 %r3246, %r3187, %r3242; - xor.b32 %r3247, %r3243, %r3188; - shf.l.wrap.b32 %r3248, %r3247, %r3247, 1; - xor.b32 %r3249, %r3244, %r3189; - shf.l.wrap.b32 %r3250, %r3249, %r3249, 1; - shf.l.wrap.b32 %r3251, %r3246, %r3246, 1; - xor.b32 %r3252, %r3245, %r3251; - shf.l.wrap.b32 %r3253, %r3252, %r3252, 1; - cvt.u64.u32 %rd2904, %r3253; - cvt.u64.u32 %rd2905, %r3248; - cvt.u64.u32 %rd2906, %r3250; - bfi.b64 %rd2907, %rd2904, %rd2906, 32, 32; - cvt.u64.u32 %rd2908, %r3251; - bfi.b64 %rd2909, %rd2905, %rd2908, 32, 32; - mov.b64 {%r3254, %r3255}, %rd2909; - mov.b64 {%r3256, %r3257}, %rd2907; - cvt.u64.u32 %rd2910, %r3257; - cvt.u64.u32 %rd2911, %r3255; - cvt.u64.u32 %rd2912, %r3256; - bfi.b64 %rd2913, %rd2910, %rd2912, 32, 32; - bfi.b64 %rd2914, %rd2911, %rd2908, 32, 32; - mov.b64 {%r3258, %r3259}, %rd2914; - mov.b64 {%r3260, %r3261}, %rd2913; - shf.l.wrap.b32 %r3262, %r3232, %r3232, 5; - xor.b32 %r3263, %r3233, %r3223; - and.b32 %r3264, %r3263, %r3222; - and.b32 %r3265, %r3233, %r3223; - xor.b32 %r3266, %r3264, %r3265; - add.s32 %r3267, %r3258, %r3213; - add.s32 %r3268, %r3267, %r3266; - add.s32 %r3269, %r3268, %r3262; - add.s32 %r3270, %r3269, -1894007588; - shf.l.wrap.b32 %r3271, %r3222, %r3222, 30; - shf.l.wrap.b32 %r3272, %r3270, %r3270, 5; - xor.b32 %r3273, %r3271, %r3233; - and.b32 %r3274, %r3273, %r3232; - and.b32 %r3275, %r3271, %r3233; - xor.b32 %r3276, %r3274, %r3275; - add.s32 %r3277, %r3259, %r3223; - add.s32 %r3278, %r3277, %r3276; - add.s32 %r3279, %r3278, %r3272; - add.s32 %r3280, %r3279, -1894007588; - shf.l.wrap.b32 %r3281, %r3232, %r3232, 30; - shf.l.wrap.b32 %r3282, %r3280, %r3280, 5; - xor.b32 %r3283, %r3281, %r3271; - and.b32 %r3284, %r3270, %r3283; - and.b32 %r3285, %r3281, 
%r3271; - xor.b32 %r3286, %r3284, %r3285; - add.s32 %r3287, %r3260, %r3233; - add.s32 %r3288, %r3287, %r3286; - add.s32 %r3289, %r3288, %r3282; - add.s32 %r3290, %r3289, -1894007588; - shf.l.wrap.b32 %r3291, %r3270, %r3270, 30; - shf.l.wrap.b32 %r3292, %r3290, %r3290, 5; - xor.b32 %r3293, %r3291, %r3281; - and.b32 %r3294, %r3280, %r3293; - and.b32 %r3295, %r3291, %r3281; - xor.b32 %r3296, %r3294, %r3295; - add.s32 %r3297, %r3261, %r3271; - add.s32 %r3298, %r3297, %r3296; - add.s32 %r3299, %r3298, %r3292; - add.s32 %r3300, %r3299, -1894007588; - shf.l.wrap.b32 %r3301, %r3280, %r3280, 30; - cvt.u64.u32 %rd2915, %r3291; - cvt.u64.u32 %rd2916, %r3301; - cvt.u64.u32 %rd2917, %r3290; - cvt.u64.u32 %rd2918, %r3300; - bfi.b64 %rd2919, %rd2917, %rd2918, 32, 32; - bfi.b64 %rd2920, %rd2915, %rd2916, 32, 32; - mov.b64 {%r3302, %r3303}, %rd2919; - mov.b64 {%r3304, %r3305}, %rd2920; - xor.b32 %r3306, %r3065, %r3063; - xor.b32 %r3307, %r3122, %r3064; - xor.b32 %r3308, %r3123, %r3065; - cvt.u64.u32 %rd2921, %r3308; - cvt.u64.u32 %rd2922, %r3306; - xor.b32 %r3309, %r3064, %r3062; - cvt.u64.u32 %rd2923, %r3309; - cvt.u64.u32 %rd2924, %r3307; - bfi.b64 %rd2925, %rd2921, %rd2924, 32, 32; - bfi.b64 %rd2926, %rd2922, %rd2923, 32, 32; - mov.b64 {%r3310, %r3311}, %rd2926; - mov.b64 {%r3312, %r3313}, %rd2925; - xor.b32 %r3314, %r3179, %r3309; - xor.b32 %r3315, %r3187, %r3311; - xor.b32 %r3316, %r3188, %r3312; - xor.b32 %r3317, %r3189, %r3313; - xor.b32 %r3318, %r3259, %r3314; - xor.b32 %r3319, %r3315, %r3260; - shf.l.wrap.b32 %r3320, %r3319, %r3319, 1; - xor.b32 %r3321, %r3316, %r3261; - shf.l.wrap.b32 %r3322, %r3321, %r3321, 1; - shf.l.wrap.b32 %r3323, %r3318, %r3318, 1; - xor.b32 %r3324, %r3317, %r3323; - shf.l.wrap.b32 %r3325, %r3324, %r3324, 1; - cvt.u64.u32 %rd2927, %r3325; - cvt.u64.u32 %rd2928, %r3320; - cvt.u64.u32 %rd2929, %r3322; - bfi.b64 %rd2930, %rd2927, %rd2929, 32, 32; - cvt.u64.u32 %rd2931, %r3323; - bfi.b64 %rd2932, %rd2928, %rd2931, 32, 32; - mov.b64 {%r3326, %r3327}, 
%rd2932; - mov.b64 {%r3328, %r3329}, %rd2930; - cvt.u64.u32 %rd2933, %r3329; - cvt.u64.u32 %rd2934, %r3327; - cvt.u64.u32 %rd2935, %r3328; - bfi.b64 %rd2936, %rd2933, %rd2935, 32, 32; - bfi.b64 %rd2937, %rd2934, %rd2931, 32, 32; - mov.b64 {%r3330, %r3331}, %rd2937; - mov.b64 {%r3332, %r3333}, %rd2936; - cvt.u64.u32 %rd2938, %r3305; - cvt.u64.u32 %rd2939, %r3303; - cvt.u64.u32 %rd2940, %r3304; - bfi.b64 %rd2941, %rd2939, %rd2918, 32, 32; - bfi.b64 %rd2942, %rd2938, %rd2940, 32, 32; - mov.b64 {%r3334, %r3335}, %rd2941; - mov.b64 {%r3336, %r3337}, %rd2942; - shf.l.wrap.b32 %r3338, %r3334, %r3334, 5; - xor.b32 %r3339, %r3337, %r3336; - and.b32 %r3340, %r3339, %r3335; - and.b32 %r3341, %r3337, %r3336; - xor.b32 %r3342, %r3340, %r3341; - add.s32 %r3343, %r3330, %r3281; - add.s32 %r3344, %r3343, %r3338; - add.s32 %r3345, %r3344, %r3342; - add.s32 %r3346, %r3345, -1894007588; - shf.l.wrap.b32 %r3347, %r3335, %r3335, 30; - shf.l.wrap.b32 %r3348, %r3346, %r3346, 5; - xor.b32 %r3349, %r3347, %r3336; - and.b32 %r3350, %r3349, %r3334; - and.b32 %r3351, %r3347, %r3336; - xor.b32 %r3352, %r3350, %r3351; - add.s32 %r3353, %r3331, %r3337; - add.s32 %r3354, %r3353, %r3352; - add.s32 %r3355, %r3354, %r3348; - add.s32 %r3356, %r3355, -1894007588; - shf.l.wrap.b32 %r3357, %r3334, %r3334, 30; - shf.l.wrap.b32 %r3358, %r3356, %r3356, 5; - xor.b32 %r3359, %r3347, %r3357; - and.b32 %r3360, %r3346, %r3359; - and.b32 %r3361, %r3347, %r3357; - xor.b32 %r3362, %r3360, %r3361; - add.s32 %r3363, %r3332, %r3336; - add.s32 %r3364, %r3363, %r3362; - add.s32 %r3365, %r3364, %r3358; - add.s32 %r3366, %r3365, -1894007588; - shf.l.wrap.b32 %r3367, %r3346, %r3346, 30; - shf.l.wrap.b32 %r3368, %r3366, %r3366, 5; - xor.b32 %r3369, %r3367, %r3357; - and.b32 %r3370, %r3356, %r3369; - and.b32 %r3371, %r3367, %r3357; - xor.b32 %r3372, %r3370, %r3371; - add.s32 %r3373, %r3333, %r3347; - add.s32 %r3374, %r3373, %r3372; - add.s32 %r3375, %r3374, %r3368; - add.s32 %r3376, %r3375, -1894007588; - shf.l.wrap.b32 
%r3377, %r3356, %r3356, 30; - xor.b32 %r3378, %r3125, %r3123; - xor.b32 %r3379, %r3186, %r3124; - xor.b32 %r3380, %r3187, %r3125; - cvt.u64.u32 %rd2943, %r3380; - cvt.u64.u32 %rd2944, %r3378; - xor.b32 %r3381, %r3124, %r3122; - cvt.u64.u32 %rd2945, %r3381; - cvt.u64.u32 %rd2946, %r3379; - bfi.b64 %rd2947, %rd2943, %rd2946, 32, 32; - bfi.b64 %rd2948, %rd2944, %rd2945, 32, 32; - mov.b64 {%r3382, %r3383}, %rd2948; - mov.b64 {%r3384, %r3385}, %rd2947; - xor.b32 %r3386, %r3251, %r3381; - xor.b32 %r3387, %r3259, %r3383; - xor.b32 %r3388, %r3260, %r3384; - xor.b32 %r3389, %r3261, %r3385; - xor.b32 %r3390, %r3331, %r3386; - xor.b32 %r3391, %r3387, %r3332; - shf.l.wrap.b32 %r3392, %r3391, %r3391, 1; - xor.b32 %r3393, %r3388, %r3333; - shf.l.wrap.b32 %r3394, %r3393, %r3393, 1; - shf.l.wrap.b32 %r3395, %r3390, %r3390, 1; - xor.b32 %r3396, %r3389, %r3395; - shf.l.wrap.b32 %r3397, %r3396, %r3396, 1; - cvt.u64.u32 %rd2949, %r3397; - cvt.u64.u32 %rd2950, %r3392; - cvt.u64.u32 %rd2951, %r3394; - bfi.b64 %rd2952, %rd2949, %rd2951, 32, 32; - cvt.u64.u32 %rd2953, %r3395; - bfi.b64 %rd2954, %rd2950, %rd2953, 32, 32; - mov.b64 {%r3398, %r3399}, %rd2954; - mov.b64 {%r3400, %r3401}, %rd2952; - cvt.u64.u32 %rd2955, %r3401; - cvt.u64.u32 %rd2956, %r3399; - cvt.u64.u32 %rd2957, %r3400; - bfi.b64 %rd2958, %rd2955, %rd2957, 32, 32; - bfi.b64 %rd2959, %rd2956, %rd2953, 32, 32; - mov.b64 {%r3402, %r3403}, %rd2959; - mov.b64 {%r3404, %r3405}, %rd2958; - shf.l.wrap.b32 %r3406, %r3376, %r3376, 5; - xor.b32 %r3407, %r3377, %r3367; - and.b32 %r3408, %r3407, %r3366; - and.b32 %r3409, %r3377, %r3367; - xor.b32 %r3410, %r3408, %r3409; - add.s32 %r3411, %r3402, %r3357; - add.s32 %r3412, %r3411, %r3410; - add.s32 %r3413, %r3412, %r3406; - add.s32 %r3414, %r3413, -1894007588; - shf.l.wrap.b32 %r3415, %r3366, %r3366, 30; - shf.l.wrap.b32 %r3416, %r3414, %r3414, 5; - xor.b32 %r3417, %r3415, %r3377; - and.b32 %r3418, %r3417, %r3376; - and.b32 %r3419, %r3415, %r3377; - xor.b32 %r3420, %r3418, %r3419; - 
add.s32 %r3421, %r3403, %r3367; - add.s32 %r3422, %r3421, %r3420; - add.s32 %r3423, %r3422, %r3416; - add.s32 %r3424, %r3423, -1894007588; - shf.l.wrap.b32 %r3425, %r3376, %r3376, 30; - shf.l.wrap.b32 %r3426, %r3424, %r3424, 5; - xor.b32 %r3427, %r3425, %r3415; - and.b32 %r3428, %r3414, %r3427; - and.b32 %r3429, %r3425, %r3415; - xor.b32 %r3430, %r3428, %r3429; - add.s32 %r3431, %r3404, %r3377; - add.s32 %r3432, %r3431, %r3430; - add.s32 %r3433, %r3432, %r3426; - add.s32 %r3434, %r3433, -1894007588; - shf.l.wrap.b32 %r3435, %r3414, %r3414, 30; - shf.l.wrap.b32 %r3436, %r3434, %r3434, 5; - xor.b32 %r3437, %r3435, %r3425; - and.b32 %r3438, %r3424, %r3437; - and.b32 %r3439, %r3435, %r3425; - xor.b32 %r3440, %r3438, %r3439; - add.s32 %r3441, %r3405, %r3415; - add.s32 %r3442, %r3441, %r3440; - add.s32 %r3443, %r3442, %r3436; - add.s32 %r3444, %r3443, -1894007588; - shf.l.wrap.b32 %r3445, %r3424, %r3424, 30; - cvt.u64.u32 %rd2960, %r3435; - cvt.u64.u32 %rd2961, %r3445; - cvt.u64.u32 %rd2962, %r3434; - cvt.u64.u32 %rd2963, %r3444; - bfi.b64 %rd2964, %rd2962, %rd2963, 32, 32; - bfi.b64 %rd2965, %rd2960, %rd2961, 32, 32; - mov.b64 {%r3446, %r3447}, %rd2964; - mov.b64 {%r3448, %r3449}, %rd2965; - xor.b32 %r3450, %r3189, %r3187; - xor.b32 %r3451, %r3258, %r3188; - xor.b32 %r3452, %r3259, %r3189; - cvt.u64.u32 %rd2966, %r3452; - cvt.u64.u32 %rd2967, %r3450; - xor.b32 %r3453, %r3188, %r3186; - cvt.u64.u32 %rd2968, %r3453; - cvt.u64.u32 %rd2969, %r3451; - bfi.b64 %rd2970, %rd2966, %rd2969, 32, 32; - bfi.b64 %rd2971, %rd2967, %rd2968, 32, 32; - mov.b64 {%r3454, %r3455}, %rd2971; - mov.b64 {%r3456, %r3457}, %rd2970; - xor.b32 %r3458, %r3323, %r3453; - xor.b32 %r3459, %r3331, %r3455; - xor.b32 %r3460, %r3332, %r3456; - xor.b32 %r3461, %r3333, %r3457; - xor.b32 %r3462, %r3403, %r3458; - xor.b32 %r3463, %r3459, %r3404; - shf.l.wrap.b32 %r3464, %r3463, %r3463, 1; - xor.b32 %r3465, %r3460, %r3405; - shf.l.wrap.b32 %r3466, %r3465, %r3465, 1; - shf.l.wrap.b32 %r3467, %r3462, %r3462, 1; - 
xor.b32 %r3468, %r3461, %r3467; - shf.l.wrap.b32 %r3469, %r3468, %r3468, 1; - cvt.u64.u32 %rd2972, %r3469; - cvt.u64.u32 %rd2973, %r3464; - cvt.u64.u32 %rd2974, %r3467; - cvt.u64.u32 %rd2975, %r3466; - bfi.b64 %rd2976, %rd2972, %rd2975, 32, 32; - bfi.b64 %rd2977, %rd2973, %rd2974, 32, 32; - mov.b64 {%r3470, %r3471}, %rd2977; - mov.b64 {%r3472, %r3473}, %rd2976; - cvt.u64.u32 %rd2978, %r3449; - cvt.u64.u32 %rd2979, %r3447; - cvt.u64.u32 %rd2980, %r3448; - bfi.b64 %rd2981, %rd2979, %rd2963, 32, 32; - bfi.b64 %rd2982, %rd2978, %rd2980, 32, 32; - mov.b64 {%r3474, %r3475}, %rd2981; - mov.b64 {%r3476, %r3477}, %rd2982; - shf.l.wrap.b32 %r3478, %r3474, %r3474, 5; - xor.b32 %r3479, %r3477, %r3476; - and.b32 %r3480, %r3479, %r3475; - and.b32 %r3481, %r3477, %r3476; - xor.b32 %r3482, %r3480, %r3481; - add.s32 %r3483, %r3470, %r3425; - add.s32 %r3484, %r3483, %r3478; - add.s32 %r3485, %r3484, %r3482; - add.s32 %r3486, %r3485, -1894007588; - shf.l.wrap.b32 %r3487, %r3475, %r3475, 30; - shf.l.wrap.b32 %r3488, %r3486, %r3486, 5; - xor.b32 %r3489, %r3487, %r3476; - and.b32 %r3490, %r3489, %r3474; - and.b32 %r3491, %r3487, %r3476; - xor.b32 %r3492, %r3490, %r3491; - add.s32 %r3493, %r3471, %r3477; - add.s32 %r3494, %r3493, %r3492; - add.s32 %r3495, %r3494, %r3488; - add.s32 %r3496, %r3495, -1894007588; - shf.l.wrap.b32 %r3497, %r3474, %r3474, 30; - shf.l.wrap.b32 %r3498, %r3496, %r3496, 5; - xor.b32 %r3499, %r3487, %r3497; - and.b32 %r3500, %r3486, %r3499; - and.b32 %r3501, %r3487, %r3497; - xor.b32 %r3502, %r3500, %r3501; - add.s32 %r3503, %r3472, %r3476; - add.s32 %r3504, %r3503, %r3502; - add.s32 %r3505, %r3504, %r3498; - add.s32 %r3506, %r3505, -1894007588; - shf.l.wrap.b32 %r3507, %r3486, %r3486, 30; - shf.l.wrap.b32 %r3508, %r3506, %r3506, 5; - xor.b32 %r3509, %r3507, %r3497; - and.b32 %r3510, %r3496, %r3509; - and.b32 %r3511, %r3507, %r3497; - xor.b32 %r3512, %r3510, %r3511; - add.s32 %r3513, %r3473, %r3487; - add.s32 %r3514, %r3513, %r3512; - add.s32 %r3515, %r3514, 
%r3508; - add.s32 %r3516, %r3515, -1894007588; - shf.l.wrap.b32 %r3517, %r3496, %r3496, 30; - xor.b32 %r3518, %r3261, %r3259; - xor.b32 %r3519, %r3330, %r3260; - xor.b32 %r3520, %r3331, %r3261; - cvt.u64.u32 %rd2983, %r3520; - cvt.u64.u32 %rd2984, %r3518; - xor.b32 %r3521, %r3260, %r3258; - cvt.u64.u32 %rd2985, %r3521; - cvt.u64.u32 %rd2986, %r3519; - bfi.b64 %rd2987, %rd2983, %rd2986, 32, 32; - bfi.b64 %rd2988, %rd2984, %rd2985, 32, 32; - mov.b64 {%r3522, %r3523}, %rd2988; - mov.b64 {%r3524, %r3525}, %rd2987; - xor.b32 %r3526, %r3395, %r3521; - xor.b32 %r3527, %r3403, %r3523; - xor.b32 %r3528, %r3404, %r3524; - xor.b32 %r3529, %r3405, %r3525; - xor.b32 %r3530, %r3471, %r3526; - xor.b32 %r3531, %r3527, %r3472; - shf.l.wrap.b32 %r3532, %r3531, %r3531, 1; - xor.b32 %r3533, %r3528, %r3473; - shf.l.wrap.b32 %r3534, %r3533, %r3533, 1; - shf.l.wrap.b32 %r3535, %r3530, %r3530, 1; - xor.b32 %r3536, %r3529, %r3535; - shf.l.wrap.b32 %r3537, %r3536, %r3536, 1; - cvt.u64.u32 %rd2989, %r3537; - cvt.u64.u32 %rd2990, %r3532; - cvt.u64.u32 %rd2991, %r3534; - bfi.b64 %rd2992, %rd2989, %rd2991, 32, 32; - cvt.u64.u32 %rd2993, %r3535; - bfi.b64 %rd2994, %rd2990, %rd2993, 32, 32; - mov.b64 {%r3538, %r3539}, %rd2994; - mov.b64 {%r3540, %r3541}, %rd2992; - cvt.u64.u32 %rd2995, %r3541; - cvt.u64.u32 %rd2996, %r3539; - cvt.u64.u32 %rd2997, %r3540; - bfi.b64 %rd2998, %rd2995, %rd2997, 32, 32; - bfi.b64 %rd2999, %rd2996, %rd2993, 32, 32; - mov.b64 {%r3542, %r3543}, %rd2999; - mov.b64 {%r3544, %r3545}, %rd2998; - shf.l.wrap.b32 %r3546, %r3516, %r3516, 5; - xor.b32 %r3547, %r3517, %r3507; - xor.b32 %r3548, %r3547, %r3506; - add.s32 %r3549, %r3542, %r3497; - add.s32 %r3550, %r3549, %r3548; - add.s32 %r3551, %r3550, %r3546; - add.s32 %r3552, %r3551, -899497514; - shf.l.wrap.b32 %r3553, %r3506, %r3506, 30; - shf.l.wrap.b32 %r3554, %r3552, %r3552, 5; - xor.b32 %r3555, %r3553, %r3517; - xor.b32 %r3556, %r3555, %r3516; - add.s32 %r3557, %r3543, %r3507; - add.s32 %r3558, %r3557, %r3556; - add.s32 
%r3559, %r3558, %r3554; - add.s32 %r3560, %r3559, -899497514; - shf.l.wrap.b32 %r3561, %r3516, %r3516, 30; - shf.l.wrap.b32 %r3562, %r3560, %r3560, 5; - xor.b32 %r3563, %r3561, %r3553; - xor.b32 %r3564, %r3563, %r3552; - add.s32 %r3565, %r3544, %r3517; - add.s32 %r3566, %r3565, %r3564; - add.s32 %r3567, %r3566, %r3562; - add.s32 %r3568, %r3567, -899497514; - shf.l.wrap.b32 %r3569, %r3552, %r3552, 30; - shf.l.wrap.b32 %r3570, %r3568, %r3568, 5; - xor.b32 %r3571, %r3569, %r3561; - xor.b32 %r3572, %r3571, %r3560; - add.s32 %r3573, %r3545, %r3553; - add.s32 %r3574, %r3573, %r3572; - add.s32 %r3575, %r3574, %r3570; - add.s32 %r3576, %r3575, -899497514; - shf.l.wrap.b32 %r3577, %r3560, %r3560, 30; - cvt.u64.u32 %rd3000, %r3569; - cvt.u64.u32 %rd3001, %r3577; - cvt.u64.u32 %rd3002, %r3568; - cvt.u64.u32 %rd3003, %r3576; - bfi.b64 %rd3004, %rd3002, %rd3003, 32, 32; - bfi.b64 %rd3005, %rd3000, %rd3001, 32, 32; - mov.b64 {%r3578, %r3579}, %rd3004; - mov.b64 {%r3580, %r3581}, %rd3005; - xor.b32 %r3582, %r3333, %r3331; - xor.b32 %r3583, %r3402, %r3332; - xor.b32 %r3584, %r3403, %r3333; - cvt.u64.u32 %rd3006, %r3584; - cvt.u64.u32 %rd3007, %r3582; - xor.b32 %r3585, %r3332, %r3330; - cvt.u64.u32 %rd3008, %r3585; - cvt.u64.u32 %rd3009, %r3583; - bfi.b64 %rd3010, %rd3006, %rd3009, 32, 32; - bfi.b64 %rd3011, %rd3007, %rd3008, 32, 32; - mov.b64 {%r3586, %r3587}, %rd3011; - mov.b64 {%r3588, %r3589}, %rd3010; - xor.b32 %r3590, %r3467, %r3585; - xor.b32 %r3591, %r3471, %r3587; - xor.b32 %r3592, %r3472, %r3588; - xor.b32 %r3593, %r3473, %r3589; - xor.b32 %r3594, %r3543, %r3590; - xor.b32 %r3595, %r3591, %r3544; - shf.l.wrap.b32 %r3596, %r3595, %r3595, 1; - xor.b32 %r3597, %r3592, %r3545; - shf.l.wrap.b32 %r3598, %r3597, %r3597, 1; - shf.l.wrap.b32 %r3599, %r3594, %r3594, 1; - xor.b32 %r3600, %r3593, %r3599; - shf.l.wrap.b32 %r3601, %r3600, %r3600, 1; - cvt.u64.u32 %rd3012, %r3601; - cvt.u64.u32 %rd3013, %r3596; - cvt.u64.u32 %rd3014, %r3598; - bfi.b64 %rd3015, %rd3012, %rd3014, 32, 32; 
- cvt.u64.u32 %rd3016, %r3599; - bfi.b64 %rd3017, %rd3013, %rd3016, 32, 32; - mov.b64 {%r3602, %r3603}, %rd3017; - mov.b64 {%r3604, %r3605}, %rd3015; - cvt.u64.u32 %rd3018, %r3605; - cvt.u64.u32 %rd3019, %r3603; - cvt.u64.u32 %rd3020, %r3604; - bfi.b64 %rd3021, %rd3018, %rd3020, 32, 32; - bfi.b64 %rd3022, %rd3019, %rd3016, 32, 32; - mov.b64 {%r3606, %r3607}, %rd3022; - mov.b64 {%r3608, %r3609}, %rd3021; - cvt.u64.u32 %rd3023, %r3581; - cvt.u64.u32 %rd3024, %r3579; - cvt.u64.u32 %rd3025, %r3580; - bfi.b64 %rd3026, %rd3024, %rd3003, 32, 32; - bfi.b64 %rd3027, %rd3023, %rd3025, 32, 32; - mov.b64 {%r3610, %r3611}, %rd3026; - mov.b64 {%r3612, %r3613}, %rd3027; - shf.l.wrap.b32 %r3614, %r3610, %r3610, 5; - xor.b32 %r3615, %r3612, %r3611; - xor.b32 %r3616, %r3615, %r3613; - add.s32 %r3617, %r3606, %r3561; - add.s32 %r3618, %r3617, %r3614; - add.s32 %r3619, %r3618, %r3616; - add.s32 %r3620, %r3619, -899497514; - shf.l.wrap.b32 %r3621, %r3611, %r3611, 30; - shf.l.wrap.b32 %r3622, %r3620, %r3620, 5; - xor.b32 %r3623, %r3612, %r3610; - xor.b32 %r3624, %r3623, %r3621; - add.s32 %r3625, %r3607, %r3613; - add.s32 %r3626, %r3625, %r3624; - add.s32 %r3627, %r3626, %r3622; - add.s32 %r3628, %r3627, -899497514; - shf.l.wrap.b32 %r3629, %r3610, %r3610, 30; - shf.l.wrap.b32 %r3630, %r3628, %r3628, 5; - xor.b32 %r3631, %r3621, %r3629; - xor.b32 %r3632, %r3631, %r3620; - add.s32 %r3633, %r3608, %r3612; - add.s32 %r3634, %r3633, %r3632; - add.s32 %r3635, %r3634, %r3630; - add.s32 %r3636, %r3635, -899497514; - shf.l.wrap.b32 %r3637, %r3620, %r3620, 30; - shf.l.wrap.b32 %r3638, %r3636, %r3636, 5; - xor.b32 %r3639, %r3637, %r3629; - xor.b32 %r3640, %r3639, %r3628; - add.s32 %r3641, %r3609, %r3621; - add.s32 %r3642, %r3641, %r3640; - add.s32 %r3643, %r3642, %r3638; - add.s32 %r3644, %r3643, -899497514; - shf.l.wrap.b32 %r3645, %r3628, %r3628, 30; - xor.b32 %r3646, %r3405, %r3403; - xor.b32 %r3647, %r3470, %r3404; - xor.b32 %r3648, %r3471, %r3405; - cvt.u64.u32 %rd3028, %r3648; - cvt.u64.u32 
%rd3029, %r3646; - xor.b32 %r3649, %r3404, %r3402; - cvt.u64.u32 %rd3030, %r3649; - cvt.u64.u32 %rd3031, %r3647; - bfi.b64 %rd3032, %rd3028, %rd3031, 32, 32; - bfi.b64 %rd3033, %rd3029, %rd3030, 32, 32; - mov.b64 {%r3650, %r3651}, %rd3033; - mov.b64 {%r3652, %r3653}, %rd3032; - xor.b32 %r3654, %r3535, %r3649; - xor.b32 %r3655, %r3543, %r3651; - xor.b32 %r3656, %r3544, %r3652; - xor.b32 %r3657, %r3545, %r3653; - xor.b32 %r3658, %r3607, %r3654; - xor.b32 %r3659, %r3655, %r3608; - shf.l.wrap.b32 %r3660, %r3659, %r3659, 1; - xor.b32 %r3661, %r3656, %r3609; - shf.l.wrap.b32 %r3662, %r3661, %r3661, 1; - shf.l.wrap.b32 %r3663, %r3658, %r3658, 1; - xor.b32 %r3664, %r3657, %r3663; - shf.l.wrap.b32 %r3665, %r3664, %r3664, 1; - cvt.u64.u32 %rd3034, %r3665; - cvt.u64.u32 %rd3035, %r3660; - cvt.u64.u32 %rd3036, %r3662; - bfi.b64 %rd3037, %rd3034, %rd3036, 32, 32; - cvt.u64.u32 %rd3038, %r3663; - bfi.b64 %rd3039, %rd3035, %rd3038, 32, 32; - mov.b64 {%r3666, %r3667}, %rd3039; - mov.b64 {%r3668, %r3669}, %rd3037; - cvt.u64.u32 %rd3040, %r3669; - cvt.u64.u32 %rd3041, %r3667; - cvt.u64.u32 %rd3042, %r3668; - bfi.b64 %rd3043, %rd3040, %rd3042, 32, 32; - bfi.b64 %rd3044, %rd3041, %rd3038, 32, 32; - mov.b64 {%r3670, %r3671}, %rd3044; - mov.b64 {%r3672, %r3673}, %rd3043; - shf.l.wrap.b32 %r3674, %r3644, %r3644, 5; - xor.b32 %r3675, %r3645, %r3637; - xor.b32 %r3676, %r3675, %r3636; - add.s32 %r3677, %r3670, %r3629; - add.s32 %r3678, %r3677, %r3676; - add.s32 %r3679, %r3678, %r3674; - add.s32 %r3680, %r3679, -899497514; - shf.l.wrap.b32 %r3681, %r3636, %r3636, 30; - shf.l.wrap.b32 %r3682, %r3680, %r3680, 5; - xor.b32 %r3683, %r3681, %r3645; - xor.b32 %r3684, %r3683, %r3644; - add.s32 %r3685, %r3671, %r3637; - add.s32 %r3686, %r3685, %r3684; - add.s32 %r3687, %r3686, %r3682; - add.s32 %r3688, %r3687, -899497514; - shf.l.wrap.b32 %r3689, %r3644, %r3644, 30; - shf.l.wrap.b32 %r3690, %r3688, %r3688, 5; - xor.b32 %r3691, %r3689, %r3681; - xor.b32 %r3692, %r3691, %r3680; - add.s32 %r3693, 
%r3672, %r3645; - add.s32 %r3694, %r3693, %r3692; - add.s32 %r3695, %r3694, %r3690; - add.s32 %r3696, %r3695, -899497514; - shf.l.wrap.b32 %r3697, %r3680, %r3680, 30; - shf.l.wrap.b32 %r3698, %r3696, %r3696, 5; - xor.b32 %r3699, %r3697, %r3689; - xor.b32 %r3700, %r3699, %r3688; - add.s32 %r3701, %r3673, %r3681; - add.s32 %r3702, %r3701, %r3700; - add.s32 %r3703, %r3702, %r3698; - add.s32 %r3704, %r3703, -899497514; - shf.l.wrap.b32 %r3705, %r3688, %r3688, 30; - cvt.u64.u32 %rd3045, %r3697; - cvt.u64.u32 %rd3046, %r3705; - cvt.u64.u32 %rd3047, %r3696; - cvt.u64.u32 %rd3048, %r3704; - bfi.b64 %rd3049, %rd3047, %rd3048, 32, 32; - bfi.b64 %rd3050, %rd3045, %rd3046, 32, 32; - mov.b64 {%r3706, %r3707}, %rd3049; - mov.b64 {%r3708, %r3709}, %rd3050; - xor.b32 %r3710, %r3473, %r3471; - xor.b32 %r3711, %r3542, %r3472; - xor.b32 %r3712, %r3543, %r3473; - cvt.u64.u32 %rd3051, %r3712; - cvt.u64.u32 %rd3052, %r3710; - xor.b32 %r3713, %r3472, %r3470; - cvt.u64.u32 %rd3053, %r3713; - cvt.u64.u32 %rd3054, %r3711; - bfi.b64 %rd3055, %rd3051, %rd3054, 32, 32; - bfi.b64 %rd3056, %rd3052, %rd3053, 32, 32; - mov.b64 {%r3714, %r3715}, %rd3056; - mov.b64 {%r3716, %r3717}, %rd3055; - xor.b32 %r3718, %r3599, %r3713; - xor.b32 %r3719, %r3607, %r3715; - xor.b32 %r3720, %r3608, %r3716; - xor.b32 %r3721, %r3609, %r3717; - xor.b32 %r3722, %r3671, %r3718; - shf.l.wrap.b32 %r3723, %r3722, %r3722, 1; - xor.b32 %r3724, %r3719, %r3672; - shf.l.wrap.b32 %r3725, %r3724, %r3724, 1; - xor.b32 %r3726, %r3720, %r3673; - shf.l.wrap.b32 %r3727, %r3726, %r3726, 1; - xor.b32 %r3728, %r3721, %r3723; - shf.l.wrap.b32 %r3729, %r3728, %r3728, 1; - cvt.u64.u32 %rd3057, %r3729; - cvt.u64.u32 %rd3058, %r3725; - cvt.u64.u32 %rd3059, %r3727; - bfi.b64 %rd3060, %rd3057, %rd3059, 32, 32; - cvt.u64.u32 %rd3061, %r3723; - bfi.b64 %rd3062, %rd3058, %rd3061, 32, 32; - mov.b64 {%r3730, %r3731}, %rd3062; - mov.b64 {%r3732, %r3733}, %rd3060; - cvt.u64.u32 %rd3063, %r3733; - cvt.u64.u32 %rd3064, %r3731; - cvt.u64.u32 %rd3065, 
%r3732; - bfi.b64 %rd3066, %rd3063, %rd3065, 32, 32; - bfi.b64 %rd3067, %rd3064, %rd3061, 32, 32; - mov.b64 {%r3734, %r3735}, %rd3067; - mov.b64 {%r3736, %r3737}, %rd3066; - cvt.u64.u32 %rd3068, %r3709; - cvt.u64.u32 %rd3069, %r3707; - cvt.u64.u32 %rd3070, %r3708; - bfi.b64 %rd3071, %rd3069, %rd3048, 32, 32; - bfi.b64 %rd3072, %rd3068, %rd3070, 32, 32; - mov.b64 {%r3738, %r3739}, %rd3071; - mov.b64 {%r3740, %r3741}, %rd3072; - shf.l.wrap.b32 %r3742, %r3738, %r3738, 5; - xor.b32 %r3743, %r3740, %r3739; - xor.b32 %r3744, %r3743, %r3741; - add.s32 %r3745, %r3689, %r3734; - add.s32 %r3746, %r3745, %r3742; - add.s32 %r3747, %r3746, %r3744; - add.s32 %r3748, %r3747, -899497514; - shf.l.wrap.b32 %r3749, %r3739, %r3739, 30; - shf.l.wrap.b32 %r3750, %r3748, %r3748, 5; - xor.b32 %r3751, %r3740, %r3738; - xor.b32 %r3752, %r3751, %r3749; - add.s32 %r3753, %r3735, %r3741; - add.s32 %r3754, %r3753, %r3752; - add.s32 %r3755, %r3754, %r3750; - add.s32 %r3756, %r3755, -899497514; - shf.l.wrap.b32 %r3757, %r3738, %r3738, 30; - shf.l.wrap.b32 %r3758, %r3756, %r3756, 5; - xor.b32 %r3759, %r3749, %r3757; - xor.b32 %r3760, %r3759, %r3748; - add.s32 %r3761, %r3736, %r3740; - add.s32 %r3762, %r3761, %r3760; - add.s32 %r3763, %r3762, %r3758; - add.s32 %r3764, %r3763, -899497514; - shf.l.wrap.b32 %r3765, %r3748, %r3748, 30; - shf.l.wrap.b32 %r3766, %r3764, %r3764, 5; - xor.b32 %r3767, %r3765, %r3757; - xor.b32 %r3768, %r3767, %r3756; - add.s32 %r3769, %r3737, %r3749; - add.s32 %r3770, %r3769, %r3768; - add.s32 %r3771, %r3770, %r3766; - add.s32 %r3772, %r3771, -899497514; - shf.l.wrap.b32 %r3773, %r3756, %r3756, 30; - xor.b32 %r3774, %r3545, %r3543; - xor.b32 %r3775, %r3606, %r3544; - xor.b32 %r3776, %r3607, %r3545; - cvt.u64.u32 %rd3073, %r3776; - cvt.u64.u32 %rd3074, %r3774; - xor.b32 %r3777, %r3544, %r3542; - cvt.u64.u32 %rd3075, %r3777; - cvt.u64.u32 %rd3076, %r3775; - bfi.b64 %rd3077, %rd3073, %rd3076, 32, 32; - bfi.b64 %rd3078, %rd3074, %rd3075, 32, 32; - mov.b64 {%r3778, %r3779}, 
%rd3078; - mov.b64 {%r3780, %r3781}, %rd3077; - xor.b32 %r3782, %r3663, %r3777; - xor.b32 %r3783, %r3671, %r3779; - xor.b32 %r3784, %r3672, %r3780; - xor.b32 %r3785, %r3673, %r3781; - xor.b32 %r3786, %r3735, %r3782; - shf.l.wrap.b32 %r3787, %r3786, %r3786, 1; - xor.b32 %r3788, %r3783, %r3736; - shf.l.wrap.b32 %r3789, %r3788, %r3788, 1; - xor.b32 %r3790, %r3784, %r3737; - shf.l.wrap.b32 %r3791, %r3790, %r3790, 1; - xor.b32 %r3792, %r3785, %r3787; - shf.l.wrap.b32 %r3793, %r3792, %r3792, 1; - shf.l.wrap.b32 %r3794, %r3772, %r3772, 5; - xor.b32 %r3795, %r3773, %r3765; - xor.b32 %r3796, %r3795, %r3764; - add.s32 %r3797, %r3787, %r3757; - add.s32 %r3798, %r3797, %r3796; - add.s32 %r3799, %r3798, %r3794; - add.s32 %r3800, %r3799, -899497514; - shf.l.wrap.b32 %r3801, %r3764, %r3764, 30; - shf.l.wrap.b32 %r3802, %r3800, %r3800, 5; - xor.b32 %r3803, %r3801, %r3773; - xor.b32 %r3804, %r3803, %r3772; - add.s32 %r3805, %r3789, %r3765; - add.s32 %r3806, %r3805, %r3804; - add.s32 %r3807, %r3806, %r3802; - add.s32 %r3808, %r3807, -899497514; - shf.l.wrap.b32 %r3809, %r3772, %r3772, 30; - shf.l.wrap.b32 %r3810, %r3808, %r3808, 5; - xor.b32 %r3811, %r3809, %r3801; - xor.b32 %r3812, %r3811, %r3800; - add.s32 %r3813, %r3791, %r3773; - add.s32 %r3814, %r3813, %r3812; - add.s32 %r3815, %r3814, %r3810; - add.s32 %r3816, %r3815, -899497514; - shf.l.wrap.b32 %r3817, %r3800, %r3800, 30; - shf.l.wrap.b32 %r3818, %r3816, %r3816, 5; - xor.b32 %r3819, %r3817, %r3809; - xor.b32 %r3820, %r3819, %r3808; - shf.l.wrap.b32 %r3821, %r3808, %r3808, 30; - add.s32 %r3822, %r9085, %r3793; - add.s32 %r3823, %r3822, %r3801; - add.s32 %r3824, %r3823, %r3820; - add.s32 %r3825, %r3824, %r3818; - add.s32 %r9085, %r3825, -899497514; - add.s32 %r9086, %r3816, %r9086; - add.s32 %r9087, %r3821, %r9087; - add.s32 %r9088, %r3817, %r9088; - add.s32 %r9089, %r3809, %r9089; - setp.ne.s64 %p211, %rd4243, %rd793; - add.s64 %rd4246, %rd4246, 64; - @%p211 bra $L__BB1_288; - - add.u64 %rd4247, %SPL, 504; - mov.u16 %rs4344, 
0; - st.local.u8 [%rd4247], %rs4344; - st.local.u8 [%rd4247+1], %rs4344; - st.local.u8 [%rd4247+2], %rs4344; - st.local.u8 [%rd4247+3], %rs4344; - st.local.u8 [%rd4247+4], %rs4344; - st.local.u8 [%rd4247+5], %rs4344; - st.local.u8 [%rd4247+6], %rs4344; - st.local.u8 [%rd4247+7], %rs4344; - st.local.u8 [%rd4247+8], %rs4344; - st.local.u8 [%rd4247+9], %rs4344; - st.local.u8 [%rd4247+10], %rs4344; - st.local.u8 [%rd4247+11], %rs4344; - st.local.u8 [%rd4247+12], %rs4344; - st.local.u8 [%rd4247+13], %rs4344; - st.local.u8 [%rd4247+14], %rs4344; - st.local.u8 [%rd4247+15], %rs4344; - st.local.u8 [%rd4247+16], %rs4344; - st.local.u8 [%rd4247+17], %rs4344; - st.local.u8 [%rd4247+18], %rs4344; - st.local.u8 [%rd4247+19], %rs4344; - st.local.u8 [%rd4247+20], %rs4344; - st.local.u8 [%rd4247+21], %rs4344; - st.local.u8 [%rd4247+22], %rs4344; - st.local.u8 [%rd4247+23], %rs4344; - st.local.u8 [%rd4247+24], %rs4344; - st.local.u8 [%rd4247+25], %rs4344; - st.local.u8 [%rd4247+26], %rs4344; - st.local.u8 [%rd4247+27], %rs4344; - st.local.u8 [%rd4247+28], %rs4344; - st.local.u8 [%rd4247+29], %rs4344; - st.local.u8 [%rd4247+30], %rs4344; - st.local.u8 [%rd4247+31], %rs4344; - st.local.u8 [%rd4247+32], %rs4344; - st.local.u8 [%rd4247+33], %rs4344; - st.local.u8 [%rd4247+34], %rs4344; - st.local.u8 [%rd4247+35], %rs4344; - st.local.u8 [%rd4247+36], %rs4344; - st.local.u8 [%rd4247+37], %rs4344; - st.local.u8 [%rd4247+38], %rs4344; - st.local.u8 [%rd4247+39], %rs4344; - st.local.u8 [%rd4247+40], %rs4344; - st.local.u8 [%rd4247+41], %rs4344; - st.local.u8 [%rd4247+42], %rs4344; - st.local.u8 [%rd4247+43], %rs4344; - st.local.u8 [%rd4247+44], %rs4344; - st.local.u8 [%rd4247+45], %rs4344; - st.local.u8 [%rd4247+46], %rs4344; - st.local.u8 [%rd4247+47], %rs4344; - st.local.u8 [%rd4247+48], %rs4344; - st.local.u8 [%rd4247+49], %rs4344; - st.local.u8 [%rd4247+50], %rs4344; - st.local.u8 [%rd4247+51], %rs4344; - st.local.u8 [%rd4247+52], %rs4344; - st.local.u8 [%rd4247+53], %rs4344; - 
st.local.u8 [%rd4247+54], %rs4344; - st.local.u8 [%rd4247+55], %rs4344; - shr.u64 %rd3079, %rd792, 56; - st.local.u8 [%rd4247+63], %rd3079; - shr.u64 %rd3080, %rd792, 48; - st.local.u8 [%rd4247+62], %rd3080; - shr.u64 %rd3081, %rd792, 40; - st.local.u8 [%rd4247+61], %rd3081; - shr.u64 %rd3082, %rd792, 32; - st.local.u8 [%rd4247+60], %rd3082; - shr.u64 %rd3083, %rd792, 24; - st.local.u8 [%rd4247+59], %rd3083; - shr.u64 %rd3084, %rd792, 16; - st.local.u8 [%rd4247+58], %rd3084; - shr.u64 %rd3085, %rd792, 8; - st.local.u8 [%rd4247+57], %rd3085; - st.local.u8 [%rd4247+56], %rd792; - add.s64 %rd821, %rd4247, 64; - mov.u64 %rd4248, %rd4247; - -$L__BB1_307: - ld.local.u8 %rd3086, [%rd4248]; - ld.local.u8 %rd3087, [%rd4248+1]; - bfi.b64 %rd3088, %rd3087, %rd3086, 8, 8; - ld.local.u8 %rd3089, [%rd4248+2]; - ld.local.u8 %rd3090, [%rd4248+3]; - bfi.b64 %rd3091, %rd3090, %rd3089, 8, 56; - bfi.b64 %rd3092, %rd3091, %rd3088, 16, 48; - shl.b64 %rd3093, %rd3092, 8; - mov.b64 {%r3826, %r3827}, %rd3093; - mov.b32 {%rs708, %rs3277}, %r3827; - mov.b32 {%rs704, %rs706}, %r3826; - shr.u16 %rs707, %rs706, 8; - shr.u16 %rs705, %rs704, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3094, [%rd4248+4]; - ld.local.u8 %rd3095, [%rd4248+5]; - bfi.b64 %rd3096, %rd3095, %rd3094, 8, 8; - ld.local.u8 %rd3097, [%rd4248+6]; - ld.local.u8 %rd3098, [%rd4248+7]; - bfi.b64 %rd3099, %rd3098, %rd3097, 8, 56; - bfi.b64 %rd3100, %rd3099, %rd3096, 16, 48; - shl.b64 %rd3101, %rd3100, 8; - mov.b64 {%r3828, %r3829}, %rd3101; - mov.b32 {%rs713, %rs3278}, %r3829; - mov.b32 {%rs709, %rs711}, %r3828; - shr.u16 %rs712, %rs711, 8; - shr.u16 %rs710, %rs709, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3102, [%rd4248+8]; - ld.local.u8 %rd3103, [%rd4248+9]; - bfi.b64 %rd3104, %rd3103, %rd3102, 8, 8; - ld.local.u8 %rd3105, [%rd4248+10]; - ld.local.u8 %rd3106, [%rd4248+11]; - bfi.b64 %rd3107, %rd3106, %rd3105, 8, 56; - bfi.b64 %rd3108, %rd3107, %rd3104, 16, 48; - shl.b64 %rd3109, %rd3108, 8; - mov.b64 {%r3830, %r3831}, 
%rd3109; - mov.b32 {%rs718, %rs3279}, %r3831; - mov.b32 {%rs714, %rs716}, %r3830; - shr.u16 %rs717, %rs716, 8; - shr.u16 %rs715, %rs714, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3110, [%rd4248+12]; - ld.local.u8 %rd3111, [%rd4248+13]; - bfi.b64 %rd3112, %rd3111, %rd3110, 8, 8; - ld.local.u8 %rd3113, [%rd4248+14]; - ld.local.u8 %rd3114, [%rd4248+15]; - bfi.b64 %rd3115, %rd3114, %rd3113, 8, 56; - bfi.b64 %rd3116, %rd3115, %rd3112, 16, 48; - shl.b64 %rd3117, %rd3116, 8; - mov.b64 {%r3832, %r3833}, %rd3117; - mov.b32 {%rs723, %rs3280}, %r3833; - mov.b32 {%rs719, %rs721}, %r3832; - shr.u16 %rs722, %rs721, 8; - shr.u16 %rs720, %rs719, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3118, [%rd4248+16]; - ld.local.u8 %rd3119, [%rd4248+17]; - bfi.b64 %rd3120, %rd3119, %rd3118, 8, 8; - ld.local.u8 %rd3121, [%rd4248+18]; - ld.local.u8 %rd3122, [%rd4248+19]; - bfi.b64 %rd3123, %rd3122, %rd3121, 8, 56; - bfi.b64 %rd3124, %rd3123, %rd3120, 16, 48; - shl.b64 %rd3125, %rd3124, 8; - mov.b64 {%r3834, %r3835}, %rd3125; - mov.b32 {%rs728, %rs3281}, %r3835; - mov.b32 {%rs724, %rs726}, %r3834; - shr.u16 %rs727, %rs726, 8; - shr.u16 %rs725, %rs724, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3126, [%rd4248+20]; - ld.local.u8 %rd3127, [%rd4248+21]; - bfi.b64 %rd3128, %rd3127, %rd3126, 8, 8; - ld.local.u8 %rd3129, [%rd4248+22]; - ld.local.u8 %rd3130, [%rd4248+23]; - bfi.b64 %rd3131, %rd3130, %rd3129, 8, 56; - bfi.b64 %rd3132, %rd3131, %rd3128, 16, 48; - shl.b64 %rd3133, %rd3132, 8; - mov.b64 {%r3836, %r3837}, %rd3133; - mov.b32 {%rs733, %rs3282}, %r3837; - mov.b32 {%rs729, %rs731}, %r3836; - shr.u16 %rs732, %rs731, 8; - shr.u16 %rs730, %rs729, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3134, [%rd4248+24]; - ld.local.u8 %rd3135, [%rd4248+25]; - bfi.b64 %rd3136, %rd3135, %rd3134, 8, 8; - ld.local.u8 %rd3137, [%rd4248+26]; - ld.local.u8 %rd3138, [%rd4248+27]; - bfi.b64 %rd3139, %rd3138, %rd3137, 8, 56; - bfi.b64 %rd3140, %rd3139, %rd3136, 16, 48; - shl.b64 %rd3141, %rd3140, 8; 
- mov.b64 {%r3838, %r3839}, %rd3141; - mov.b32 {%rs738, %rs3283}, %r3839; - mov.b32 {%rs734, %rs736}, %r3838; - shr.u16 %rs737, %rs736, 8; - shr.u16 %rs735, %rs734, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3142, [%rd4248+28]; - ld.local.u8 %rd3143, [%rd4248+29]; - bfi.b64 %rd3144, %rd3143, %rd3142, 8, 8; - ld.local.u8 %rd3145, [%rd4248+30]; - ld.local.u8 %rd3146, [%rd4248+31]; - bfi.b64 %rd3147, %rd3146, %rd3145, 8, 56; - bfi.b64 %rd3148, %rd3147, %rd3144, 16, 48; - shl.b64 %rd3149, %rd3148, 8; - mov.b64 {%r3840, %r3841}, %rd3149; - mov.b32 {%rs743, %rs3284}, %r3841; - mov.b32 {%rs739, %rs741}, %r3840; - shr.u16 %rs742, %rs741, 8; - shr.u16 %rs740, %rs739, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3150, [%rd4248+32]; - ld.local.u8 %rd3151, [%rd4248+33]; - bfi.b64 %rd3152, %rd3151, %rd3150, 8, 8; - ld.local.u8 %rd3153, [%rd4248+34]; - ld.local.u8 %rd3154, [%rd4248+35]; - bfi.b64 %rd3155, %rd3154, %rd3153, 8, 56; - bfi.b64 %rd3156, %rd3155, %rd3152, 16, 48; - shl.b64 %rd3157, %rd3156, 8; - mov.b64 {%r3842, %r3843}, %rd3157; - mov.b32 {%rs748, %rs3285}, %r3843; - mov.b32 {%rs744, %rs746}, %r3842; - shr.u16 %rs747, %rs746, 8; - shr.u16 %rs745, %rs744, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3158, [%rd4248+36]; - ld.local.u8 %rd3159, [%rd4248+37]; - bfi.b64 %rd3160, %rd3159, %rd3158, 8, 8; - ld.local.u8 %rd3161, [%rd4248+38]; - ld.local.u8 %rd3162, [%rd4248+39]; - bfi.b64 %rd3163, %rd3162, %rd3161, 8, 56; - bfi.b64 %rd3164, %rd3163, %rd3160, 16, 48; - shl.b64 %rd3165, %rd3164, 8; - mov.b64 {%r3844, %r3845}, %rd3165; - mov.b32 {%rs753, %rs3286}, %r3845; - mov.b32 {%rs749, %rs751}, %r3844; - shr.u16 %rs752, %rs751, 8; - shr.u16 %rs750, %rs749, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3166, [%rd4248+40]; - ld.local.u8 %rd3167, [%rd4248+41]; - bfi.b64 %rd3168, %rd3167, %rd3166, 8, 8; - ld.local.u8 %rd3169, [%rd4248+42]; - ld.local.u8 %rd3170, [%rd4248+43]; - bfi.b64 %rd3171, %rd3170, %rd3169, 8, 56; - bfi.b64 %rd3172, %rd3171, %rd3168, 16, 48; - 
shl.b64 %rd3173, %rd3172, 8; - mov.b64 {%r3846, %r3847}, %rd3173; - mov.b32 {%rs758, %rs3287}, %r3847; - mov.b32 {%rs754, %rs756}, %r3846; - shr.u16 %rs757, %rs756, 8; - shr.u16 %rs755, %rs754, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3174, [%rd4248+44]; - ld.local.u8 %rd3175, [%rd4248+45]; - bfi.b64 %rd3176, %rd3175, %rd3174, 8, 8; - ld.local.u8 %rd3177, [%rd4248+46]; - ld.local.u8 %rd3178, [%rd4248+47]; - bfi.b64 %rd3179, %rd3178, %rd3177, 8, 56; - bfi.b64 %rd3180, %rd3179, %rd3176, 16, 48; - shl.b64 %rd3181, %rd3180, 8; - mov.b64 {%r3848, %r3849}, %rd3181; - mov.b32 {%rs763, %rs3288}, %r3849; - mov.b32 {%rs759, %rs761}, %r3848; - shr.u16 %rs762, %rs761, 8; - shr.u16 %rs760, %rs759, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3182, [%rd4248+48]; - ld.local.u8 %rd3183, [%rd4248+49]; - bfi.b64 %rd3184, %rd3183, %rd3182, 8, 8; - ld.local.u8 %rd3185, [%rd4248+50]; - ld.local.u8 %rd3186, [%rd4248+51]; - bfi.b64 %rd3187, %rd3186, %rd3185, 8, 56; - bfi.b64 %rd3188, %rd3187, %rd3184, 16, 48; - shl.b64 %rd3189, %rd3188, 8; - mov.b64 {%r3850, %r3851}, %rd3189; - mov.b32 {%rs768, %rs3289}, %r3851; - mov.b32 {%rs764, %rs766}, %r3850; - shr.u16 %rs767, %rs766, 8; - shr.u16 %rs765, %rs764, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3190, [%rd4248+52]; - ld.local.u8 %rd3191, [%rd4248+53]; - bfi.b64 %rd3192, %rd3191, %rd3190, 8, 8; - ld.local.u8 %rd3193, [%rd4248+54]; - ld.local.u8 %rd3194, [%rd4248+55]; - bfi.b64 %rd3195, %rd3194, %rd3193, 8, 56; - bfi.b64 %rd3196, %rd3195, %rd3192, 16, 48; - shl.b64 %rd3197, %rd3196, 8; - mov.b64 {%r3852, %r3853}, %rd3197; - mov.b32 {%rs773, %rs3290}, %r3853; - mov.b32 {%rs769, %rs771}, %r3852; - shr.u16 %rs772, %rs771, 8; - shr.u16 %rs770, %rs769, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3198, [%rd4248+56]; - ld.local.u8 %rd3199, [%rd4248+57]; - bfi.b64 %rd3200, %rd3199, %rd3198, 8, 8; - ld.local.u8 %rd3201, [%rd4248+58]; - ld.local.u8 %rd3202, [%rd4248+59]; - bfi.b64 %rd3203, %rd3202, %rd3201, 8, 56; - bfi.b64 %rd3204, 
%rd3203, %rd3200, 16, 48; - shl.b64 %rd3205, %rd3204, 8; - mov.b64 {%r3854, %r3855}, %rd3205; - mov.b32 {%rs778, %rs3291}, %r3855; - mov.b32 {%rs774, %rs776}, %r3854; - shr.u16 %rs777, %rs776, 8; - shr.u16 %rs775, %rs774, 8; - @%p195 bra $L__BB1_323; - - ld.local.u8 %rd3206, [%rd4248+60]; - ld.local.u8 %rd3207, [%rd4248+61]; - bfi.b64 %rd3208, %rd3207, %rd3206, 8, 8; - ld.local.u8 %rd3209, [%rd4248+62]; - ld.local.u8 %rd3210, [%rd4248+63]; - bfi.b64 %rd3211, %rd3210, %rd3209, 8, 56; - bfi.b64 %rd3212, %rd3211, %rd3208, 16, 48; - shl.b64 %rd3213, %rd3212, 8; - mov.b64 {%r3856, %r3857}, %rd3213; - mov.b32 {%rs783, %rs3292}, %r3857; - mov.b32 {%rs779, %rs781}, %r3856; - shr.u16 %rs782, %rs781, 8; - shr.u16 %rs780, %rs779, 8; - @%p210 bra $L__BB1_324; - bra.uni $L__BB1_323; - -$L__BB1_324: - add.s64 %rd4247, %rd4247, 64; - shl.b16 %rs3293, %rs706, 8; - or.b16 %rs3294, %rs705, %rs3293; - shl.b16 %rs3295, %rs708, 8; - or.b16 %rs3296, %rs707, %rs3295; - mov.b32 %r3858, {%rs3294, %rs3296}; - shr.u32 %r3859, %r3858, 24; - shr.u32 %r3860, %r3858, 8; - and.b32 %r3861, %r3860, 65280; - or.b32 %r3862, %r3861, %r3859; - shl.b32 %r3863, %r3858, 24; - shl.b32 %r3864, %r3858, 8; - and.b32 %r3865, %r3864, 16711680; - or.b32 %r3866, %r3863, %r3865; - or.b32 %r3867, %r3866, %r3862; - shl.b16 %rs3297, %rs711, 8; - or.b16 %rs3298, %rs710, %rs3297; - shl.b16 %rs3299, %rs713, 8; - or.b16 %rs3300, %rs712, %rs3299; - mov.b32 %r3868, {%rs3298, %rs3300}; - shr.u32 %r3869, %r3868, 24; - shr.u32 %r3870, %r3868, 8; - and.b32 %r3871, %r3870, 65280; - or.b32 %r3872, %r3871, %r3869; - shl.b32 %r3873, %r3868, 24; - shl.b32 %r3874, %r3868, 8; - and.b32 %r3875, %r3874, 16711680; - or.b32 %r3876, %r3873, %r3875; - or.b32 %r3877, %r3876, %r3872; - shl.b16 %rs3301, %rs716, 8; - or.b16 %rs3302, %rs715, %rs3301; - shl.b16 %rs3303, %rs718, 8; - or.b16 %rs3304, %rs717, %rs3303; - mov.b32 %r3878, {%rs3302, %rs3304}; - shr.u32 %r3879, %r3878, 24; - shr.u32 %r3880, %r3878, 8; - and.b32 %r3881, %r3880, 65280; - 
or.b32 %r3882, %r3881, %r3879; - shl.b32 %r3883, %r3878, 24; - shl.b32 %r3884, %r3878, 8; - and.b32 %r3885, %r3884, 16711680; - or.b32 %r3886, %r3883, %r3885; - or.b32 %r3887, %r3886, %r3882; - xor.b16 %rs3305, %rs715, %rs705; - xor.b16 %rs3306, %rs716, %rs706; - shl.b16 %rs3307, %rs3306, 8; - or.b16 %rs3308, %rs3305, %rs3307; - xor.b16 %rs3309, %rs717, %rs707; - xor.b16 %rs3310, %rs718, %rs708; - shl.b16 %rs3311, %rs3310, 8; - or.b16 %rs3312, %rs3309, %rs3311; - mov.b32 %r3888, {%rs3308, %rs3312}; - shl.b16 %rs3313, %rs721, 8; - or.b16 %rs3314, %rs720, %rs3313; - shl.b16 %rs3315, %rs723, 8; - or.b16 %rs3316, %rs722, %rs3315; - mov.b32 %r3889, {%rs3314, %rs3316}; - shr.u32 %r3890, %r3889, 24; - shr.u32 %r3891, %r3889, 8; - and.b32 %r3892, %r3891, 65280; - or.b32 %r3893, %r3892, %r3890; - shl.b32 %r3894, %r3889, 24; - shl.b32 %r3895, %r3889, 8; - and.b32 %r3896, %r3895, 16711680; - or.b32 %r3897, %r3894, %r3896; - or.b32 %r3898, %r3897, %r3893; - xor.b16 %rs3317, %rs720, %rs710; - xor.b16 %rs3318, %rs721, %rs711; - shl.b16 %rs3319, %rs3318, 8; - or.b16 %rs3320, %rs3317, %rs3319; - xor.b16 %rs3321, %rs722, %rs712; - xor.b16 %rs3322, %rs723, %rs713; - shl.b16 %rs3323, %rs3322, 8; - or.b16 %rs3324, %rs3321, %rs3323; - mov.b32 %r3899, {%rs3320, %rs3324}; - shl.b16 %rs3325, %rs726, 8; - or.b16 %rs3326, %rs725, %rs3325; - shl.b16 %rs3327, %rs728, 8; - or.b16 %rs3328, %rs727, %rs3327; - mov.b32 %r3900, {%rs3326, %rs3328}; - shr.u32 %r3901, %r3900, 24; - shr.u32 %r3902, %r3900, 8; - and.b32 %r3903, %r3902, 65280; - or.b32 %r3904, %r3903, %r3901; - shl.b32 %r3905, %r3900, 24; - shl.b32 %r3906, %r3900, 8; - and.b32 %r3907, %r3906, 16711680; - or.b32 %r3908, %r3905, %r3907; - or.b32 %r3909, %r3908, %r3904; - xor.b16 %rs3329, %rs725, %rs715; - xor.b16 %rs3330, %rs726, %rs716; - shl.b16 %rs3331, %rs3330, 8; - or.b16 %rs3332, %rs3329, %rs3331; - xor.b16 %rs3333, %rs727, %rs717; - xor.b16 %rs3334, %rs728, %rs718; - shl.b16 %rs3335, %rs3334, 8; - or.b16 %rs3336, %rs3333, %rs3335; - 
mov.b32 %r3910, {%rs3332, %rs3336}; - shl.b16 %rs3337, %rs731, 8; - or.b16 %rs3338, %rs730, %rs3337; - shl.b16 %rs3339, %rs733, 8; - or.b16 %rs3340, %rs732, %rs3339; - mov.b32 %r3911, {%rs3338, %rs3340}; - shr.u32 %r3912, %r3911, 24; - shr.u32 %r3913, %r3911, 8; - and.b32 %r3914, %r3913, 65280; - or.b32 %r3915, %r3914, %r3912; - shl.b32 %r3916, %r3911, 24; - shl.b32 %r3917, %r3911, 8; - and.b32 %r3918, %r3917, 16711680; - or.b32 %r3919, %r3916, %r3918; - or.b32 %r3920, %r3919, %r3915; - xor.b16 %rs3341, %rs730, %rs720; - xor.b16 %rs3342, %rs731, %rs721; - shl.b16 %rs3343, %rs3342, 8; - or.b16 %rs3344, %rs3341, %rs3343; - xor.b16 %rs3345, %rs732, %rs722; - xor.b16 %rs3346, %rs733, %rs723; - shl.b16 %rs3347, %rs3346, 8; - or.b16 %rs3348, %rs3345, %rs3347; - mov.b32 %r3921, {%rs3344, %rs3348}; - shl.b16 %rs3349, %rs736, 8; - or.b16 %rs3350, %rs735, %rs3349; - shl.b16 %rs3351, %rs738, 8; - or.b16 %rs3352, %rs737, %rs3351; - mov.b32 %r3922, {%rs3350, %rs3352}; - shr.u32 %r3923, %r3922, 24; - shr.u32 %r3924, %r3922, 8; - and.b32 %r3925, %r3924, 65280; - or.b32 %r3926, %r3925, %r3923; - shl.b32 %r3927, %r3922, 24; - shl.b32 %r3928, %r3922, 8; - and.b32 %r3929, %r3928, 16711680; - or.b32 %r3930, %r3927, %r3929; - or.b32 %r3931, %r3930, %r3926; - xor.b16 %rs3353, %rs735, %rs725; - xor.b16 %rs3354, %rs736, %rs726; - shl.b16 %rs3355, %rs3354, 8; - or.b16 %rs3356, %rs3353, %rs3355; - xor.b16 %rs3357, %rs737, %rs727; - xor.b16 %rs3358, %rs738, %rs728; - shl.b16 %rs3359, %rs3358, 8; - or.b16 %rs3360, %rs3357, %rs3359; - mov.b32 %r3932, {%rs3356, %rs3360}; - shl.b16 %rs3361, %rs741, 8; - or.b16 %rs3362, %rs740, %rs3361; - shl.b16 %rs3363, %rs743, 8; - or.b16 %rs3364, %rs742, %rs3363; - mov.b32 %r3933, {%rs3362, %rs3364}; - shr.u32 %r3934, %r3933, 24; - shr.u32 %r3935, %r3933, 8; - and.b32 %r3936, %r3935, 65280; - or.b32 %r3937, %r3936, %r3934; - shl.b32 %r3938, %r3933, 24; - shl.b32 %r3939, %r3933, 8; - and.b32 %r3940, %r3939, 16711680; - or.b32 %r3941, %r3938, %r3940; - or.b32 
%r3942, %r3941, %r3937; - xor.b16 %rs3365, %rs740, %rs730; - xor.b16 %rs3366, %rs741, %rs731; - shl.b16 %rs3367, %rs3366, 8; - or.b16 %rs3368, %rs3365, %rs3367; - xor.b16 %rs3369, %rs742, %rs732; - xor.b16 %rs3370, %rs743, %rs733; - shl.b16 %rs3371, %rs3370, 8; - or.b16 %rs3372, %rs3369, %rs3371; - mov.b32 %r3943, {%rs3368, %rs3372}; - shl.b16 %rs3373, %rs776, 8; - or.b16 %rs3374, %rs775, %rs3373; - shl.b16 %rs3375, %rs778, 8; - or.b16 %rs3376, %rs777, %rs3375; - mov.b32 %r3944, {%rs3374, %rs3376}; - shr.u32 %r3945, %r3944, 24; - shr.u32 %r3946, %r3944, 8; - and.b32 %r3947, %r3946, 65280; - or.b32 %r3948, %r3947, %r3945; - shl.b32 %r3949, %r3944, 24; - shl.b32 %r3950, %r3944, 8; - and.b32 %r3951, %r3950, 16711680; - or.b32 %r3952, %r3949, %r3951; - or.b32 %r3953, %r3952, %r3948; - shl.b16 %rs3377, %rs781, 8; - or.b16 %rs3378, %rs780, %rs3377; - shl.b16 %rs3379, %rs783, 8; - or.b16 %rs3380, %rs782, %rs3379; - mov.b32 %r3954, {%rs3378, %rs3380}; - shr.u32 %r3955, %r3954, 24; - shr.u32 %r3956, %r3954, 8; - and.b32 %r3957, %r3956, 65280; - or.b32 %r3958, %r3957, %r3955; - shl.b32 %r3959, %r3954, 24; - shl.b32 %r3960, %r3954, 8; - and.b32 %r3961, %r3960, 16711680; - or.b32 %r3962, %r3959, %r3961; - or.b32 %r3963, %r3962, %r3958; - xor.b32 %r3964, %r9088, %r9087; - and.b32 %r3965, %r3964, %r9086; - xor.b32 %r3966, %r3965, %r9088; - shf.l.wrap.b32 %r3967, %r9085, %r9085, 5; - add.s32 %r3968, %r3967, %r9089; - add.s32 %r3969, %r3968, %r3966; - add.s32 %r3970, %r3969, %r3867; - add.s32 %r3971, %r3970, 1518500249; - shf.l.wrap.b32 %r3972, %r3971, %r3971, 5; - shf.l.wrap.b32 %r3973, %r9086, %r9086, 30; - xor.b32 %r3974, %r3973, %r9087; - and.b32 %r3975, %r3974, %r9085; - xor.b32 %r3976, %r3975, %r9087; - add.s32 %r3977, %r9088, %r3976; - add.s32 %r3978, %r3977, %r3877; - add.s32 %r3979, %r3978, %r3972; - add.s32 %r3980, %r3979, 1518500249; - shf.l.wrap.b32 %r3981, %r3980, %r3980, 5; - shf.l.wrap.b32 %r3982, %r9085, %r9085, 30; - xor.b32 %r3983, %r3973, %r3982; - and.b32 
%r3984, %r3971, %r3983; - xor.b32 %r3985, %r3984, %r3973; - add.s32 %r3986, %r9087, %r3887; - add.s32 %r3987, %r3986, %r3985; - add.s32 %r3988, %r3987, %r3981; - add.s32 %r3989, %r3988, 1518500249; - shf.l.wrap.b32 %r3990, %r3971, %r3971, 30; - shf.l.wrap.b32 %r3991, %r3989, %r3989, 5; - xor.b32 %r3992, %r3990, %r3982; - and.b32 %r3993, %r3980, %r3992; - xor.b32 %r3994, %r3993, %r3982; - add.s32 %r3995, %r3973, %r3898; - add.s32 %r3996, %r3995, %r3994; - add.s32 %r3997, %r3996, %r3991; - add.s32 %r3998, %r3997, 1518500249; - shf.l.wrap.b32 %r3999, %r3980, %r3980, 30; - shf.l.wrap.b32 %r4000, %r3998, %r3998, 5; - xor.b32 %r4001, %r3999, %r3990; - and.b32 %r4002, %r4001, %r3989; - xor.b32 %r4003, %r4002, %r3990; - add.s32 %r4004, %r3982, %r3909; - add.s32 %r4005, %r4004, %r4003; - add.s32 %r4006, %r4005, %r4000; - add.s32 %r4007, %r4006, 1518500249; - shf.l.wrap.b32 %r4008, %r3989, %r3989, 30; - shf.l.wrap.b32 %r4009, %r4007, %r4007, 5; - xor.b32 %r4010, %r4008, %r3999; - and.b32 %r4011, %r4010, %r3998; - xor.b32 %r4012, %r4011, %r3999; - add.s32 %r4013, %r3990, %r3920; - add.s32 %r4014, %r4013, %r4012; - add.s32 %r4015, %r4014, %r4009; - add.s32 %r4016, %r4015, 1518500249; - shf.l.wrap.b32 %r4017, %r3998, %r3998, 30; - shf.l.wrap.b32 %r4018, %r4016, %r4016, 5; - xor.b32 %r4019, %r4017, %r4008; - and.b32 %r4020, %r4007, %r4019; - xor.b32 %r4021, %r4020, %r4008; - add.s32 %r4022, %r3999, %r3931; - add.s32 %r4023, %r4022, %r4021; - add.s32 %r4024, %r4023, %r4018; - add.s32 %r4025, %r4024, 1518500249; - shf.l.wrap.b32 %r4026, %r4007, %r4007, 30; - shf.l.wrap.b32 %r4027, %r4025, %r4025, 5; - xor.b32 %r4028, %r4026, %r4017; - and.b32 %r4029, %r4016, %r4028; - xor.b32 %r4030, %r4029, %r4017; - add.s32 %r4031, %r4008, %r3942; - add.s32 %r4032, %r4031, %r4030; - add.s32 %r4033, %r4032, %r4027; - add.s32 %r4034, %r4033, 1518500249; - shf.l.wrap.b32 %r4035, %r4016, %r4016, 30; - cvt.u64.u32 %rd3214, %r4026; - cvt.u64.u32 %rd3215, %r4035; - cvt.u64.u32 %rd3216, %r4025; - 
cvt.u64.u32 %rd3217, %r4034; - bfi.b64 %rd3218, %rd3216, %rd3217, 32, 32; - bfi.b64 %rd3219, %rd3214, %rd3215, 32, 32; - mov.b64 {%r4036, %r4037}, %rd3218; - mov.b64 {%r4038, %r4039}, %rd3219; - shl.b16 %rs3381, %rs761, 8; - or.b16 %rs3382, %rs760, %rs3381; - shl.b16 %rs3383, %rs763, 8; - or.b16 %rs3384, %rs762, %rs3383; - mov.b32 %r4040, {%rs3382, %rs3384}; - shr.u32 %r4041, %r4040, 24; - shr.u32 %r4042, %r4040, 8; - and.b32 %r4043, %r4042, 65280; - or.b32 %r4044, %r4043, %r4041; - shl.b32 %r4045, %r4040, 24; - shl.b32 %r4046, %r4040, 8; - and.b32 %r4047, %r4046, 16711680; - or.b32 %r4048, %r4045, %r4047; - or.b32 %r4049, %r4048, %r4044; - cvt.u64.u32 %rd3220, %r4049; - shl.b16 %rs3385, %rs756, 8; - or.b16 %rs3386, %rs755, %rs3385; - shl.b16 %rs3387, %rs758, 8; - or.b16 %rs3388, %rs757, %rs3387; - mov.b32 %r4050, {%rs3386, %rs3388}; - shr.u32 %r4051, %r4050, 24; - shr.u32 %r4052, %r4050, 8; - and.b32 %r4053, %r4052, 65280; - or.b32 %r4054, %r4053, %r4051; - shl.b32 %r4055, %r4050, 24; - shl.b32 %r4056, %r4050, 8; - and.b32 %r4057, %r4056, 16711680; - or.b32 %r4058, %r4055, %r4057; - or.b32 %r4059, %r4058, %r4054; - shl.b16 %rs3389, %rs751, 8; - or.b16 %rs3390, %rs750, %rs3389; - shl.b16 %rs3391, %rs753, 8; - or.b16 %rs3392, %rs752, %rs3391; - mov.b32 %r4060, {%rs3390, %rs3392}; - shr.u32 %r4061, %r4060, 24; - shr.u32 %r4062, %r4060, 8; - and.b32 %r4063, %r4062, 65280; - or.b32 %r4064, %r4063, %r4061; - shl.b32 %r4065, %r4060, 24; - shl.b32 %r4066, %r4060, 8; - and.b32 %r4067, %r4066, 16711680; - or.b32 %r4068, %r4065, %r4067; - or.b32 %r4069, %r4068, %r4064; - cvt.u64.u32 %rd3221, %r4069; - shl.b16 %rs3393, %rs746, 8; - or.b16 %rs3394, %rs745, %rs3393; - shl.b16 %rs3395, %rs748, 8; - or.b16 %rs3396, %rs747, %rs3395; - mov.b32 %r4070, {%rs3394, %rs3396}; - shr.u32 %r4071, %r4070, 24; - shr.u32 %r4072, %r4070, 8; - and.b32 %r4073, %r4072, 65280; - or.b32 %r4074, %r4073, %r4071; - shl.b32 %r4075, %r4070, 24; - shl.b32 %r4076, %r4070, 8; - and.b32 %r4077, %r4076, 
16711680; - or.b32 %r4078, %r4075, %r4077; - or.b32 %r4079, %r4078, %r4074; - cvt.u64.u32 %rd3222, %r4079; - cvt.u64.u32 %rd3223, %r4059; - bfi.b64 %rd3224, %rd3220, %rd3223, 32, 32; - bfi.b64 %rd3225, %rd3221, %rd3222, 32, 32; - mov.b64 {%r4080, %r4081}, %rd3225; - mov.b64 {%r4082, %r4083}, %rd3224; - cvt.u64.u32 %rd3226, %r4039; - cvt.u64.u32 %rd3227, %r4037; - cvt.u64.u32 %rd3228, %r4038; - bfi.b64 %rd3229, %rd3227, %rd3217, 32, 32; - bfi.b64 %rd3230, %rd3226, %rd3228, 32, 32; - mov.b64 {%r4084, %r4085}, %rd3229; - mov.b64 {%r4086, %r4087}, %rd3230; - shf.l.wrap.b32 %r4088, %r4084, %r4084, 5; - xor.b32 %r4089, %r4087, %r4086; - and.b32 %r4090, %r4089, %r4085; - xor.b32 %r4091, %r4090, %r4087; - add.s32 %r4092, %r4017, %r4080; - add.s32 %r4093, %r4092, %r4088; - add.s32 %r4094, %r4093, %r4091; - add.s32 %r4095, %r4094, 1518500249; - shf.l.wrap.b32 %r4096, %r4085, %r4085, 30; - shf.l.wrap.b32 %r4097, %r4095, %r4095, 5; - xor.b32 %r4098, %r4096, %r4086; - and.b32 %r4099, %r4098, %r4084; - xor.b32 %r4100, %r4099, %r4086; - add.s32 %r4101, %r4081, %r4087; - add.s32 %r4102, %r4101, %r4100; - add.s32 %r4103, %r4102, %r4097; - add.s32 %r4104, %r4103, 1518500249; - shf.l.wrap.b32 %r4105, %r4084, %r4084, 30; - shf.l.wrap.b32 %r4106, %r4104, %r4104, 5; - xor.b32 %r4107, %r4096, %r4105; - and.b32 %r4108, %r4095, %r4107; - xor.b32 %r4109, %r4108, %r4096; - add.s32 %r4110, %r4082, %r4086; - add.s32 %r4111, %r4110, %r4109; - add.s32 %r4112, %r4111, %r4106; - add.s32 %r4113, %r4112, 1518500249; - shf.l.wrap.b32 %r4114, %r4095, %r4095, 30; - shf.l.wrap.b32 %r4115, %r4113, %r4113, 5; - xor.b32 %r4116, %r4114, %r4105; - and.b32 %r4117, %r4104, %r4116; - xor.b32 %r4118, %r4117, %r4105; - add.s32 %r4119, %r4083, %r4096; - add.s32 %r4120, %r4119, %r4118; - add.s32 %r4121, %r4120, %r4115; - add.s32 %r4122, %r4121, 1518500249; - shf.l.wrap.b32 %r4123, %r4104, %r4104, 30; - cvt.u64.u32 %rd3231, %r3963; - shl.b16 %rs3397, %rs771, 8; - or.b16 %rs3398, %rs770, %rs3397; - shl.b16 %rs3399, 
%rs773, 8; - or.b16 %rs3400, %rs772, %rs3399; - mov.b32 %r4124, {%rs3398, %rs3400}; - shr.u32 %r4125, %r4124, 24; - shr.u32 %r4126, %r4124, 8; - and.b32 %r4127, %r4126, 65280; - or.b32 %r4128, %r4127, %r4125; - shl.b32 %r4129, %r4124, 24; - shl.b32 %r4130, %r4124, 8; - and.b32 %r4131, %r4130, 16711680; - or.b32 %r4132, %r4129, %r4131; - or.b32 %r4133, %r4132, %r4128; - cvt.u64.u32 %rd3232, %r4133; - shl.b16 %rs3401, %rs766, 8; - or.b16 %rs3402, %rs765, %rs3401; - shl.b16 %rs3403, %rs768, 8; - or.b16 %rs3404, %rs767, %rs3403; - mov.b32 %r4134, {%rs3402, %rs3404}; - shr.u32 %r4135, %r4134, 24; - shr.u32 %r4136, %r4134, 8; - and.b32 %r4137, %r4136, 65280; - or.b32 %r4138, %r4137, %r4135; - shl.b32 %r4139, %r4134, 24; - shl.b32 %r4140, %r4134, 8; - and.b32 %r4141, %r4140, 16711680; - or.b32 %r4142, %r4139, %r4141; - or.b32 %r4143, %r4142, %r4138; - cvt.u64.u32 %rd3233, %r4143; - cvt.u64.u32 %rd3234, %r3953; - bfi.b64 %rd3235, %rd3231, %rd3234, 32, 32; - bfi.b64 %rd3236, %rd3232, %rd3233, 32, 32; - mov.b64 {%r4144, %r4145}, %rd3236; - mov.b64 {%r4146, %r4147}, %rd3235; - shf.l.wrap.b32 %r4148, %r4122, %r4122, 5; - xor.b32 %r4149, %r4123, %r4114; - and.b32 %r4150, %r4149, %r4113; - xor.b32 %r4151, %r4150, %r4114; - add.s32 %r4152, %r4144, %r4105; - add.s32 %r4153, %r4152, %r4151; - add.s32 %r4154, %r4153, %r4148; - add.s32 %r4155, %r4154, 1518500249; - shf.l.wrap.b32 %r4156, %r4113, %r4113, 30; - shf.l.wrap.b32 %r4157, %r4155, %r4155, 5; - xor.b32 %r4158, %r4156, %r4123; - and.b32 %r4159, %r4158, %r4122; - xor.b32 %r4160, %r4159, %r4123; - add.s32 %r4161, %r4145, %r4114; - add.s32 %r4162, %r4161, %r4160; - add.s32 %r4163, %r4162, %r4157; - add.s32 %r4164, %r4163, 1518500249; - shf.l.wrap.b32 %r4165, %r4122, %r4122, 30; - shf.l.wrap.b32 %r4166, %r4164, %r4164, 5; - xor.b32 %r4167, %r4165, %r4156; - and.b32 %r4168, %r4155, %r4167; - xor.b32 %r4169, %r4168, %r4156; - add.s32 %r4170, %r4146, %r4123; - add.s32 %r4171, %r4170, %r4169; - add.s32 %r4172, %r4171, %r4166; - 
add.s32 %r4173, %r4172, 1518500249; - shf.l.wrap.b32 %r4174, %r4155, %r4155, 30; - shf.l.wrap.b32 %r4175, %r4173, %r4173, 5; - xor.b32 %r4176, %r4174, %r4165; - and.b32 %r4177, %r4164, %r4176; - xor.b32 %r4178, %r4177, %r4165; - add.s32 %r4179, %r4147, %r4156; - add.s32 %r4180, %r4179, %r4178; - add.s32 %r4181, %r4180, %r4175; - add.s32 %r4182, %r4181, 1518500249; - shf.l.wrap.b32 %r4183, %r4164, %r4164, 30; - cvt.u64.u32 %rd3237, %r4174; - cvt.u64.u32 %rd3238, %r4183; - cvt.u64.u32 %rd3239, %r4173; - cvt.u64.u32 %rd3240, %r4182; - bfi.b64 %rd3241, %rd3239, %rd3240, 32, 32; - bfi.b64 %rd3242, %rd3237, %rd3238, 32, 32; - mov.b64 {%r4184, %r4185}, %rd3241; - mov.b64 {%r4186, %r4187}, %rd3242; - shr.u32 %r4188, %r3921, 24; - shr.u32 %r4189, %r3921, 8; - and.b32 %r4190, %r4189, 65280; - or.b32 %r4191, %r4190, %r4188; - shl.b32 %r4192, %r3921, 24; - shl.b32 %r4193, %r3921, 8; - and.b32 %r4194, %r4193, 16711680; - or.b32 %r4195, %r4192, %r4194; - or.b32 %r4196, %r4195, %r4191; - cvt.u64.u32 %rd3243, %r4196; - shr.u32 %r4197, %r3910, 24; - shr.u32 %r4198, %r3910, 8; - and.b32 %r4199, %r4198, 65280; - or.b32 %r4200, %r4199, %r4197; - shl.b32 %r4201, %r3910, 24; - shl.b32 %r4202, %r3910, 8; - and.b32 %r4203, %r4202, 16711680; - or.b32 %r4204, %r4201, %r4203; - or.b32 %r4205, %r4204, %r4200; - shr.u32 %r4206, %r3899, 24; - shr.u32 %r4207, %r3899, 8; - and.b32 %r4208, %r4207, 65280; - or.b32 %r4209, %r4208, %r4206; - shl.b32 %r4210, %r3899, 24; - shl.b32 %r4211, %r3899, 8; - and.b32 %r4212, %r4211, 16711680; - or.b32 %r4213, %r4210, %r4212; - or.b32 %r4214, %r4213, %r4209; - cvt.u64.u32 %rd3244, %r4214; - shr.u32 %r4215, %r3888, 24; - shr.u32 %r4216, %r3888, 8; - and.b32 %r4217, %r4216, 65280; - or.b32 %r4218, %r4217, %r4215; - shl.b32 %r4219, %r3888, 24; - shl.b32 %r4220, %r3888, 8; - and.b32 %r4221, %r4220, 16711680; - or.b32 %r4222, %r4219, %r4221; - or.b32 %r4223, %r4222, %r4218; - cvt.u64.u32 %rd3245, %r4223; - cvt.u64.u32 %rd3246, %r4205; - bfi.b64 %rd3247, %rd3243, 
%rd3246, 32, 32; - bfi.b64 %rd3248, %rd3244, %rd3245, 32, 32; - mov.b64 {%r4224, %r4225}, %rd3248; - mov.b64 {%r4226, %r4227}, %rd3247; - xor.b16 %rs3405, %rs745, %rs3305; - xor.b16 %rs3406, %rs746, %rs3306; - shl.b16 %rs3407, %rs3406, 8; - or.b16 %rs3408, %rs3405, %rs3407; - xor.b16 %rs3409, %rs747, %rs3309; - xor.b16 %rs3410, %rs748, %rs3310; - shl.b16 %rs3411, %rs3410, 8; - or.b16 %rs3412, %rs3409, %rs3411; - mov.b32 %r4228, {%rs3408, %rs3412}; - shr.u32 %r4229, %r4228, 24; - shr.u32 %r4230, %r4228, 8; - and.b32 %r4231, %r4230, 65280; - or.b32 %r4232, %r4231, %r4229; - shl.b32 %r4233, %r4228, 24; - shl.b32 %r4234, %r4228, 8; - and.b32 %r4235, %r4234, 16711680; - or.b32 %r4236, %r4233, %r4235; - or.b32 %r4237, %r4236, %r4232; - xor.b32 %r4238, %r4081, %r4225; - xor.b32 %r4239, %r4082, %r4226; - xor.b32 %r4240, %r4083, %r4227; - xor.b32 %r4241, %r4145, %r4237; - xor.b32 %r4242, %r4238, %r4146; - shf.l.wrap.b32 %r4243, %r4242, %r4242, 1; - xor.b32 %r4244, %r4239, %r4147; - shf.l.wrap.b32 %r4245, %r4244, %r4244, 1; - shf.l.wrap.b32 %r4246, %r4241, %r4241, 1; - xor.b32 %r4247, %r4240, %r4246; - shf.l.wrap.b32 %r4248, %r4247, %r4247, 1; - cvt.u64.u32 %rd3249, %r4248; - cvt.u64.u32 %rd3250, %r4243; - cvt.u64.u32 %rd3251, %r4246; - cvt.u64.u32 %rd3252, %r4245; - bfi.b64 %rd3253, %rd3249, %rd3252, 32, 32; - bfi.b64 %rd3254, %rd3250, %rd3251, 32, 32; - mov.b64 {%r4249, %r4250}, %rd3254; - mov.b64 {%r4251, %r4252}, %rd3253; - cvt.u64.u32 %rd3255, %r4187; - cvt.u64.u32 %rd3256, %r4185; - cvt.u64.u32 %rd3257, %r4186; - bfi.b64 %rd3258, %rd3256, %rd3240, 32, 32; - bfi.b64 %rd3259, %rd3255, %rd3257, 32, 32; - mov.b64 {%r4253, %r4254}, %rd3258; - mov.b64 {%r4255, %r4256}, %rd3259; - shf.l.wrap.b32 %r4257, %r4253, %r4253, 5; - xor.b32 %r4258, %r4256, %r4255; - and.b32 %r4259, %r4258, %r4254; - xor.b32 %r4260, %r4259, %r4256; - add.s32 %r4261, %r4249, %r4165; - add.s32 %r4262, %r4261, %r4257; - add.s32 %r4263, %r4262, %r4260; - add.s32 %r4264, %r4263, 1518500249; - shf.l.wrap.b32 
%r4265, %r4254, %r4254, 30; - shf.l.wrap.b32 %r4266, %r4264, %r4264, 5; - xor.b32 %r4267, %r4265, %r4255; - and.b32 %r4268, %r4267, %r4253; - xor.b32 %r4269, %r4268, %r4255; - add.s32 %r4270, %r4250, %r4256; - add.s32 %r4271, %r4270, %r4269; - add.s32 %r4272, %r4271, %r4266; - add.s32 %r4273, %r4272, 1518500249; - shf.l.wrap.b32 %r4274, %r4253, %r4253, 30; - shf.l.wrap.b32 %r4275, %r4273, %r4273, 5; - xor.b32 %r4276, %r4265, %r4274; - and.b32 %r4277, %r4264, %r4276; - xor.b32 %r4278, %r4277, %r4265; - add.s32 %r4279, %r4251, %r4255; - add.s32 %r4280, %r4279, %r4278; - add.s32 %r4281, %r4280, %r4275; - add.s32 %r4282, %r4281, 1518500249; - shf.l.wrap.b32 %r4283, %r4264, %r4264, 30; - shf.l.wrap.b32 %r4284, %r4282, %r4282, 5; - xor.b32 %r4285, %r4283, %r4274; - and.b32 %r4286, %r4273, %r4285; - xor.b32 %r4287, %r4286, %r4274; - add.s32 %r4288, %r4252, %r4265; - add.s32 %r4289, %r4288, %r4287; - add.s32 %r4290, %r4289, %r4284; - add.s32 %r4291, %r4290, 1518500249; - shf.l.wrap.b32 %r4292, %r4273, %r4273, 30; - xor.b32 %r4293, %r4080, %r3931; - xor.b32 %r4294, %r4081, %r3942; - cvt.u64.u32 %rd3260, %r4294; - shr.u32 %r4295, %r3943, 24; - shr.u32 %r4296, %r3943, 8; - and.b32 %r4297, %r4296, 65280; - or.b32 %r4298, %r4297, %r4295; - shl.b32 %r4299, %r3943, 24; - shl.b32 %r4300, %r3943, 8; - and.b32 %r4301, %r4300, 16711680; - or.b32 %r4302, %r4299, %r4301; - or.b32 %r4303, %r4302, %r4298; - cvt.u64.u32 %rd3261, %r4303; - shr.u32 %r4304, %r3932, 24; - shr.u32 %r4305, %r3932, 8; - and.b32 %r4306, %r4305, 65280; - or.b32 %r4307, %r4306, %r4304; - shl.b32 %r4308, %r3932, 24; - shl.b32 %r4309, %r3932, 8; - and.b32 %r4310, %r4309, 16711680; - or.b32 %r4311, %r4308, %r4310; - or.b32 %r4312, %r4311, %r4307; - cvt.u64.u32 %rd3262, %r4312; - cvt.u64.u32 %rd3263, %r4293; - bfi.b64 %rd3264, %rd3260, %rd3263, 32, 32; - bfi.b64 %rd3265, %rd3261, %rd3262, 32, 32; - mov.b64 {%r4313, %r4314}, %rd3265; - mov.b64 {%r4315, %r4316}, %rd3264; - xor.b16 %rs3413, %rs3353, %rs765; - xor.b16 
%rs3414, %rs3354, %rs766; - shl.b16 %rs3415, %rs3414, 8; - or.b16 %rs3416, %rs3413, %rs3415; - xor.b16 %rs3417, %rs3357, %rs767; - xor.b16 %rs3418, %rs3358, %rs768; - shl.b16 %rs3419, %rs3418, 8; - or.b16 %rs3420, %rs3417, %rs3419; - mov.b32 %r4317, {%rs3416, %rs3420}; - shr.u32 %r4318, %r4317, 24; - shr.u32 %r4319, %r4317, 8; - and.b32 %r4320, %r4319, 65280; - or.b32 %r4321, %r4320, %r4318; - shl.b32 %r4322, %r4317, 24; - shl.b32 %r4323, %r4317, 8; - and.b32 %r4324, %r4323, 16711680; - or.b32 %r4325, %r4322, %r4324; - or.b32 %r4326, %r4325, %r4321; - xor.b32 %r4327, %r4314, %r4145; - xor.b32 %r4328, %r4315, %r4146; - xor.b32 %r4329, %r4316, %r4147; - xor.b32 %r4330, %r4250, %r4326; - xor.b32 %r4331, %r4327, %r4251; - shf.l.wrap.b32 %r4332, %r4331, %r4331, 1; - xor.b32 %r4333, %r4328, %r4252; - shf.l.wrap.b32 %r4334, %r4333, %r4333, 1; - shf.l.wrap.b32 %r4335, %r4330, %r4330, 1; - xor.b32 %r4336, %r4329, %r4335; - shf.l.wrap.b32 %r4337, %r4336, %r4336, 1; - cvt.u64.u32 %rd3266, %r4337; - cvt.u64.u32 %rd3267, %r4332; - cvt.u64.u32 %rd3268, %r4334; - bfi.b64 %rd3269, %rd3266, %rd3268, 32, 32; - cvt.u64.u32 %rd3270, %r4335; - bfi.b64 %rd3271, %rd3267, %rd3270, 32, 32; - mov.b64 {%r4338, %r4339}, %rd3271; - mov.b64 {%r4340, %r4341}, %rd3269; - cvt.u64.u32 %rd3272, %r4341; - cvt.u64.u32 %rd3273, %r4339; - cvt.u64.u32 %rd3274, %r4340; - bfi.b64 %rd3275, %rd3272, %rd3274, 32, 32; - bfi.b64 %rd3276, %rd3273, %rd3270, 32, 32; - mov.b64 {%r4342, %r4343}, %rd3276; - mov.b64 {%r4344, %r4345}, %rd3275; - shf.l.wrap.b32 %r4346, %r4291, %r4291, 5; - xor.b32 %r4347, %r4292, %r4283; - xor.b32 %r4348, %r4347, %r4282; - add.s32 %r4349, %r4342, %r4274; - add.s32 %r4350, %r4349, %r4348; - add.s32 %r4351, %r4350, %r4346; - add.s32 %r4352, %r4351, 1859775393; - shf.l.wrap.b32 %r4353, %r4282, %r4282, 30; - shf.l.wrap.b32 %r4354, %r4352, %r4352, 5; - xor.b32 %r4355, %r4353, %r4292; - xor.b32 %r4356, %r4355, %r4291; - add.s32 %r4357, %r4343, %r4283; - add.s32 %r4358, %r4357, %r4356; - 
add.s32 %r4359, %r4358, %r4354; - add.s32 %r4360, %r4359, 1859775393; - shf.l.wrap.b32 %r4361, %r4291, %r4291, 30; - shf.l.wrap.b32 %r4362, %r4360, %r4360, 5; - xor.b32 %r4363, %r4361, %r4353; - xor.b32 %r4364, %r4363, %r4352; - add.s32 %r4365, %r4344, %r4292; - add.s32 %r4366, %r4365, %r4364; - add.s32 %r4367, %r4366, %r4362; - add.s32 %r4368, %r4367, 1859775393; - shf.l.wrap.b32 %r4369, %r4352, %r4352, 30; - shf.l.wrap.b32 %r4370, %r4368, %r4368, 5; - xor.b32 %r4371, %r4369, %r4361; - xor.b32 %r4372, %r4371, %r4360; - add.s32 %r4373, %r4345, %r4353; - add.s32 %r4374, %r4373, %r4372; - add.s32 %r4375, %r4374, %r4370; - add.s32 %r4376, %r4375, 1859775393; - shf.l.wrap.b32 %r4377, %r4360, %r4360, 30; - cvt.u64.u32 %rd3277, %r4369; - cvt.u64.u32 %rd3278, %r4377; - cvt.u64.u32 %rd3279, %r4368; - cvt.u64.u32 %rd3280, %r4376; - bfi.b64 %rd3281, %rd3279, %rd3280, 32, 32; - bfi.b64 %rd3282, %rd3277, %rd3278, 32, 32; - mov.b64 {%r4378, %r4379}, %rd3281; - mov.b64 {%r4380, %r4381}, %rd3282; - xor.b32 %r4382, %r4083, %r4081; - xor.b32 %r4383, %r4144, %r4082; - xor.b32 %r4384, %r4145, %r4083; - cvt.u64.u32 %rd3283, %r4384; - cvt.u64.u32 %rd3284, %r4382; - xor.b32 %r4385, %r4082, %r4080; - cvt.u64.u32 %rd3285, %r4385; - cvt.u64.u32 %rd3286, %r4383; - bfi.b64 %rd3287, %rd3283, %rd3286, 32, 32; - bfi.b64 %rd3288, %rd3284, %rd3285, 32, 32; - mov.b64 {%r4386, %r4387}, %rd3288; - mov.b64 {%r4388, %r4389}, %rd3287; - xor.b32 %r4390, %r4246, %r4385; - xor.b32 %r4391, %r4250, %r4387; - xor.b32 %r4392, %r4251, %r4388; - xor.b32 %r4393, %r4252, %r4389; - xor.b32 %r4394, %r4343, %r4390; - xor.b32 %r4395, %r4391, %r4344; - shf.l.wrap.b32 %r4396, %r4395, %r4395, 1; - xor.b32 %r4397, %r4392, %r4345; - shf.l.wrap.b32 %r4398, %r4397, %r4397, 1; - shf.l.wrap.b32 %r4399, %r4394, %r4394, 1; - xor.b32 %r4400, %r4393, %r4399; - shf.l.wrap.b32 %r4401, %r4400, %r4400, 1; - cvt.u64.u32 %rd3289, %r4401; - cvt.u64.u32 %rd3290, %r4396; - cvt.u64.u32 %rd3291, %r4398; - bfi.b64 %rd3292, %rd3289, %rd3291, 
32, 32; - cvt.u64.u32 %rd3293, %r4399; - bfi.b64 %rd3294, %rd3290, %rd3293, 32, 32; - mov.b64 {%r4402, %r4403}, %rd3294; - mov.b64 {%r4404, %r4405}, %rd3292; - cvt.u64.u32 %rd3295, %r4405; - cvt.u64.u32 %rd3296, %r4403; - cvt.u64.u32 %rd3297, %r4404; - bfi.b64 %rd3298, %rd3295, %rd3297, 32, 32; - bfi.b64 %rd3299, %rd3296, %rd3293, 32, 32; - mov.b64 {%r4406, %r4407}, %rd3299; - mov.b64 {%r4408, %r4409}, %rd3298; - cvt.u64.u32 %rd3300, %r4381; - cvt.u64.u32 %rd3301, %r4379; - cvt.u64.u32 %rd3302, %r4380; - bfi.b64 %rd3303, %rd3301, %rd3280, 32, 32; - bfi.b64 %rd3304, %rd3300, %rd3302, 32, 32; - mov.b64 {%r4410, %r4411}, %rd3303; - mov.b64 {%r4412, %r4413}, %rd3304; - shf.l.wrap.b32 %r4414, %r4410, %r4410, 5; - xor.b32 %r4415, %r4412, %r4411; - xor.b32 %r4416, %r4415, %r4413; - add.s32 %r4417, %r4406, %r4361; - add.s32 %r4418, %r4417, %r4414; - add.s32 %r4419, %r4418, %r4416; - add.s32 %r4420, %r4419, 1859775393; - shf.l.wrap.b32 %r4421, %r4411, %r4411, 30; - shf.l.wrap.b32 %r4422, %r4420, %r4420, 5; - xor.b32 %r4423, %r4412, %r4410; - xor.b32 %r4424, %r4423, %r4421; - add.s32 %r4425, %r4407, %r4413; - add.s32 %r4426, %r4425, %r4424; - add.s32 %r4427, %r4426, %r4422; - add.s32 %r4428, %r4427, 1859775393; - shf.l.wrap.b32 %r4429, %r4410, %r4410, 30; - shf.l.wrap.b32 %r4430, %r4428, %r4428, 5; - xor.b32 %r4431, %r4421, %r4429; - xor.b32 %r4432, %r4431, %r4420; - add.s32 %r4433, %r4408, %r4412; - add.s32 %r4434, %r4433, %r4432; - add.s32 %r4435, %r4434, %r4430; - add.s32 %r4436, %r4435, 1859775393; - shf.l.wrap.b32 %r4437, %r4420, %r4420, 30; - shf.l.wrap.b32 %r4438, %r4436, %r4436, 5; - xor.b32 %r4439, %r4437, %r4429; - xor.b32 %r4440, %r4439, %r4428; - add.s32 %r4441, %r4409, %r4421; - add.s32 %r4442, %r4441, %r4440; - add.s32 %r4443, %r4442, %r4438; - add.s32 %r4444, %r4443, 1859775393; - shf.l.wrap.b32 %r4445, %r4428, %r4428, 30; - xor.b32 %r4446, %r4147, %r4145; - xor.b32 %r4447, %r4249, %r4146; - xor.b32 %r4448, %r4250, %r4147; - cvt.u64.u32 %rd3305, %r4448; - 
cvt.u64.u32 %rd3306, %r4446; - xor.b32 %r4449, %r4146, %r4144; - cvt.u64.u32 %rd3307, %r4449; - cvt.u64.u32 %rd3308, %r4447; - bfi.b64 %rd3309, %rd3305, %rd3308, 32, 32; - bfi.b64 %rd3310, %rd3306, %rd3307, 32, 32; - mov.b64 {%r4450, %r4451}, %rd3310; - mov.b64 {%r4452, %r4453}, %rd3309; - xor.b32 %r4454, %r4335, %r4449; - xor.b32 %r4455, %r4343, %r4451; - xor.b32 %r4456, %r4344, %r4452; - xor.b32 %r4457, %r4345, %r4453; - xor.b32 %r4458, %r4407, %r4454; - xor.b32 %r4459, %r4455, %r4408; - shf.l.wrap.b32 %r4460, %r4459, %r4459, 1; - xor.b32 %r4461, %r4456, %r4409; - shf.l.wrap.b32 %r4462, %r4461, %r4461, 1; - shf.l.wrap.b32 %r4463, %r4458, %r4458, 1; - xor.b32 %r4464, %r4457, %r4463; - shf.l.wrap.b32 %r4465, %r4464, %r4464, 1; - cvt.u64.u32 %rd3311, %r4465; - cvt.u64.u32 %rd3312, %r4460; - cvt.u64.u32 %rd3313, %r4462; - bfi.b64 %rd3314, %rd3311, %rd3313, 32, 32; - cvt.u64.u32 %rd3315, %r4463; - bfi.b64 %rd3316, %rd3312, %rd3315, 32, 32; - mov.b64 {%r4466, %r4467}, %rd3316; - mov.b64 {%r4468, %r4469}, %rd3314; - cvt.u64.u32 %rd3317, %r4469; - cvt.u64.u32 %rd3318, %r4467; - cvt.u64.u32 %rd3319, %r4468; - bfi.b64 %rd3320, %rd3317, %rd3319, 32, 32; - bfi.b64 %rd3321, %rd3318, %rd3315, 32, 32; - mov.b64 {%r4470, %r4471}, %rd3321; - mov.b64 {%r4472, %r4473}, %rd3320; - shf.l.wrap.b32 %r4474, %r4444, %r4444, 5; - xor.b32 %r4475, %r4445, %r4437; - xor.b32 %r4476, %r4475, %r4436; - add.s32 %r4477, %r4470, %r4429; - add.s32 %r4478, %r4477, %r4476; - add.s32 %r4479, %r4478, %r4474; - add.s32 %r4480, %r4479, 1859775393; - shf.l.wrap.b32 %r4481, %r4436, %r4436, 30; - shf.l.wrap.b32 %r4482, %r4480, %r4480, 5; - xor.b32 %r4483, %r4481, %r4445; - xor.b32 %r4484, %r4483, %r4444; - add.s32 %r4485, %r4471, %r4437; - add.s32 %r4486, %r4485, %r4484; - add.s32 %r4487, %r4486, %r4482; - add.s32 %r4488, %r4487, 1859775393; - shf.l.wrap.b32 %r4489, %r4444, %r4444, 30; - shf.l.wrap.b32 %r4490, %r4488, %r4488, 5; - xor.b32 %r4491, %r4489, %r4481; - xor.b32 %r4492, %r4491, %r4480; - add.s32 
%r4493, %r4472, %r4445; - add.s32 %r4494, %r4493, %r4492; - add.s32 %r4495, %r4494, %r4490; - add.s32 %r4496, %r4495, 1859775393; - shf.l.wrap.b32 %r4497, %r4480, %r4480, 30; - shf.l.wrap.b32 %r4498, %r4496, %r4496, 5; - xor.b32 %r4499, %r4497, %r4489; - xor.b32 %r4500, %r4499, %r4488; - add.s32 %r4501, %r4473, %r4481; - add.s32 %r4502, %r4501, %r4500; - add.s32 %r4503, %r4502, %r4498; - add.s32 %r4504, %r4503, 1859775393; - shf.l.wrap.b32 %r4505, %r4488, %r4488, 30; - cvt.u64.u32 %rd3322, %r4497; - cvt.u64.u32 %rd3323, %r4505; - cvt.u64.u32 %rd3324, %r4496; - cvt.u64.u32 %rd3325, %r4504; - bfi.b64 %rd3326, %rd3324, %rd3325, 32, 32; - bfi.b64 %rd3327, %rd3322, %rd3323, 32, 32; - mov.b64 {%r4506, %r4507}, %rd3326; - mov.b64 {%r4508, %r4509}, %rd3327; - xor.b32 %r4510, %r4252, %r4250; - xor.b32 %r4511, %r4342, %r4251; - xor.b32 %r4512, %r4343, %r4252; - cvt.u64.u32 %rd3328, %r4512; - cvt.u64.u32 %rd3329, %r4510; - xor.b32 %r4513, %r4251, %r4249; - cvt.u64.u32 %rd3330, %r4513; - cvt.u64.u32 %rd3331, %r4511; - bfi.b64 %rd3332, %rd3328, %rd3331, 32, 32; - bfi.b64 %rd3333, %rd3329, %rd3330, 32, 32; - mov.b64 {%r4514, %r4515}, %rd3333; - mov.b64 {%r4516, %r4517}, %rd3332; - xor.b32 %r4518, %r4399, %r4513; - xor.b32 %r4519, %r4407, %r4515; - xor.b32 %r4520, %r4408, %r4516; - xor.b32 %r4521, %r4409, %r4517; - xor.b32 %r4522, %r4471, %r4518; - xor.b32 %r4523, %r4519, %r4472; - shf.l.wrap.b32 %r4524, %r4523, %r4523, 1; - xor.b32 %r4525, %r4520, %r4473; - shf.l.wrap.b32 %r4526, %r4525, %r4525, 1; - shf.l.wrap.b32 %r4527, %r4522, %r4522, 1; - xor.b32 %r4528, %r4521, %r4527; - shf.l.wrap.b32 %r4529, %r4528, %r4528, 1; - cvt.u64.u32 %rd3334, %r4529; - cvt.u64.u32 %rd3335, %r4524; - cvt.u64.u32 %rd3336, %r4526; - bfi.b64 %rd3337, %rd3334, %rd3336, 32, 32; - cvt.u64.u32 %rd3338, %r4527; - bfi.b64 %rd3339, %rd3335, %rd3338, 32, 32; - mov.b64 {%r4530, %r4531}, %rd3339; - mov.b64 {%r4532, %r4533}, %rd3337; - cvt.u64.u32 %rd3340, %r4533; - cvt.u64.u32 %rd3341, %r4531; - cvt.u64.u32 
%rd3342, %r4532; - bfi.b64 %rd3343, %rd3340, %rd3342, 32, 32; - bfi.b64 %rd3344, %rd3341, %rd3338, 32, 32; - mov.b64 {%r4534, %r4535}, %rd3344; - mov.b64 {%r4536, %r4537}, %rd3343; - cvt.u64.u32 %rd3345, %r4509; - cvt.u64.u32 %rd3346, %r4507; - cvt.u64.u32 %rd3347, %r4508; - bfi.b64 %rd3348, %rd3346, %rd3325, 32, 32; - bfi.b64 %rd3349, %rd3345, %rd3347, 32, 32; - mov.b64 {%r4538, %r4539}, %rd3348; - mov.b64 {%r4540, %r4541}, %rd3349; - shf.l.wrap.b32 %r4542, %r4538, %r4538, 5; - xor.b32 %r4543, %r4540, %r4539; - xor.b32 %r4544, %r4543, %r4541; - add.s32 %r4545, %r4534, %r4489; - add.s32 %r4546, %r4545, %r4542; - add.s32 %r4547, %r4546, %r4544; - add.s32 %r4548, %r4547, 1859775393; - shf.l.wrap.b32 %r4549, %r4539, %r4539, 30; - shf.l.wrap.b32 %r4550, %r4548, %r4548, 5; - xor.b32 %r4551, %r4540, %r4538; - xor.b32 %r4552, %r4551, %r4549; - add.s32 %r4553, %r4535, %r4541; - add.s32 %r4554, %r4553, %r4552; - add.s32 %r4555, %r4554, %r4550; - add.s32 %r4556, %r4555, 1859775393; - shf.l.wrap.b32 %r4557, %r4538, %r4538, 30; - shf.l.wrap.b32 %r4558, %r4556, %r4556, 5; - xor.b32 %r4559, %r4549, %r4557; - xor.b32 %r4560, %r4559, %r4548; - add.s32 %r4561, %r4536, %r4540; - add.s32 %r4562, %r4561, %r4560; - add.s32 %r4563, %r4562, %r4558; - add.s32 %r4564, %r4563, 1859775393; - shf.l.wrap.b32 %r4565, %r4548, %r4548, 30; - shf.l.wrap.b32 %r4566, %r4564, %r4564, 5; - xor.b32 %r4567, %r4565, %r4557; - xor.b32 %r4568, %r4567, %r4556; - add.s32 %r4569, %r4537, %r4549; - add.s32 %r4570, %r4569, %r4568; - add.s32 %r4571, %r4570, %r4566; - add.s32 %r4572, %r4571, 1859775393; - shf.l.wrap.b32 %r4573, %r4556, %r4556, 30; - xor.b32 %r4574, %r4345, %r4343; - xor.b32 %r4575, %r4406, %r4344; - xor.b32 %r4576, %r4407, %r4345; - cvt.u64.u32 %rd3350, %r4576; - cvt.u64.u32 %rd3351, %r4574; - xor.b32 %r4577, %r4344, %r4342; - cvt.u64.u32 %rd3352, %r4577; - cvt.u64.u32 %rd3353, %r4575; - bfi.b64 %rd3354, %rd3350, %rd3353, 32, 32; - bfi.b64 %rd3355, %rd3351, %rd3352, 32, 32; - mov.b64 {%r4578, 
%r4579}, %rd3355; - mov.b64 {%r4580, %r4581}, %rd3354; - xor.b32 %r4582, %r4463, %r4577; - xor.b32 %r4583, %r4471, %r4579; - xor.b32 %r4584, %r4472, %r4580; - xor.b32 %r4585, %r4473, %r4581; - xor.b32 %r4586, %r4535, %r4582; - xor.b32 %r4587, %r4583, %r4536; - shf.l.wrap.b32 %r4588, %r4587, %r4587, 1; - xor.b32 %r4589, %r4584, %r4537; - shf.l.wrap.b32 %r4590, %r4589, %r4589, 1; - shf.l.wrap.b32 %r4591, %r4586, %r4586, 1; - xor.b32 %r4592, %r4585, %r4591; - shf.l.wrap.b32 %r4593, %r4592, %r4592, 1; - cvt.u64.u32 %rd3356, %r4593; - cvt.u64.u32 %rd3357, %r4588; - cvt.u64.u32 %rd3358, %r4591; - cvt.u64.u32 %rd3359, %r4590; - bfi.b64 %rd3360, %rd3356, %rd3359, 32, 32; - bfi.b64 %rd3361, %rd3357, %rd3358, 32, 32; - mov.b64 {%r4594, %r4595}, %rd3361; - mov.b64 {%r4596, %r4597}, %rd3360; - shf.l.wrap.b32 %r4598, %r4572, %r4572, 5; - xor.b32 %r4599, %r4573, %r4565; - xor.b32 %r4600, %r4599, %r4564; - add.s32 %r4601, %r4594, %r4557; - add.s32 %r4602, %r4601, %r4600; - add.s32 %r4603, %r4602, %r4598; - add.s32 %r4604, %r4603, 1859775393; - shf.l.wrap.b32 %r4605, %r4564, %r4564, 30; - shf.l.wrap.b32 %r4606, %r4604, %r4604, 5; - xor.b32 %r4607, %r4605, %r4573; - xor.b32 %r4608, %r4607, %r4572; - add.s32 %r4609, %r4595, %r4565; - add.s32 %r4610, %r4609, %r4608; - add.s32 %r4611, %r4610, %r4606; - add.s32 %r4612, %r4611, 1859775393; - shf.l.wrap.b32 %r4613, %r4572, %r4572, 30; - shf.l.wrap.b32 %r4614, %r4612, %r4612, 5; - xor.b32 %r4615, %r4613, %r4605; - xor.b32 %r4616, %r4615, %r4604; - add.s32 %r4617, %r4596, %r4573; - add.s32 %r4618, %r4617, %r4616; - add.s32 %r4619, %r4618, %r4614; - add.s32 %r4620, %r4619, 1859775393; - shf.l.wrap.b32 %r4621, %r4604, %r4604, 30; - shf.l.wrap.b32 %r4622, %r4620, %r4620, 5; - xor.b32 %r4623, %r4621, %r4613; - xor.b32 %r4624, %r4623, %r4612; - add.s32 %r4625, %r4597, %r4605; - add.s32 %r4626, %r4625, %r4624; - add.s32 %r4627, %r4626, %r4622; - add.s32 %r4628, %r4627, 1859775393; - shf.l.wrap.b32 %r4629, %r4612, %r4612, 30; - cvt.u64.u32 
%rd3362, %r4621; - cvt.u64.u32 %rd3363, %r4629; - cvt.u64.u32 %rd3364, %r4620; - cvt.u64.u32 %rd3365, %r4628; - bfi.b64 %rd3366, %rd3364, %rd3365, 32, 32; - bfi.b64 %rd3367, %rd3362, %rd3363, 32, 32; - mov.b64 {%r4630, %r4631}, %rd3366; - mov.b64 {%r4632, %r4633}, %rd3367; - xor.b32 %r4634, %r4409, %r4407; - xor.b32 %r4635, %r4470, %r4408; - xor.b32 %r4636, %r4471, %r4409; - cvt.u64.u32 %rd3368, %r4636; - cvt.u64.u32 %rd3369, %r4634; - xor.b32 %r4637, %r4408, %r4406; - cvt.u64.u32 %rd3370, %r4637; - cvt.u64.u32 %rd3371, %r4635; - bfi.b64 %rd3372, %rd3368, %rd3371, 32, 32; - bfi.b64 %rd3373, %rd3369, %rd3370, 32, 32; - mov.b64 {%r4638, %r4639}, %rd3373; - mov.b64 {%r4640, %r4641}, %rd3372; - xor.b32 %r4642, %r4527, %r4637; - xor.b32 %r4643, %r4535, %r4639; - xor.b32 %r4644, %r4536, %r4640; - xor.b32 %r4645, %r4537, %r4641; - xor.b32 %r4646, %r4595, %r4642; - xor.b32 %r4647, %r4643, %r4596; - shf.l.wrap.b32 %r4648, %r4647, %r4647, 1; - xor.b32 %r4649, %r4644, %r4597; - shf.l.wrap.b32 %r4650, %r4649, %r4649, 1; - shf.l.wrap.b32 %r4651, %r4646, %r4646, 1; - xor.b32 %r4652, %r4645, %r4651; - shf.l.wrap.b32 %r4653, %r4652, %r4652, 1; - cvt.u64.u32 %rd3374, %r4653; - cvt.u64.u32 %rd3375, %r4648; - cvt.u64.u32 %rd3376, %r4650; - bfi.b64 %rd3377, %rd3374, %rd3376, 32, 32; - cvt.u64.u32 %rd3378, %r4651; - bfi.b64 %rd3379, %rd3375, %rd3378, 32, 32; - mov.b64 {%r4654, %r4655}, %rd3379; - mov.b64 {%r4656, %r4657}, %rd3377; - cvt.u64.u32 %rd3380, %r4657; - cvt.u64.u32 %rd3381, %r4655; - cvt.u64.u32 %rd3382, %r4656; - bfi.b64 %rd3383, %rd3380, %rd3382, 32, 32; - bfi.b64 %rd3384, %rd3381, %rd3378, 32, 32; - mov.b64 {%r4658, %r4659}, %rd3384; - mov.b64 {%r4660, %r4661}, %rd3383; - cvt.u64.u32 %rd3385, %r4633; - cvt.u64.u32 %rd3386, %r4631; - cvt.u64.u32 %rd3387, %r4632; - bfi.b64 %rd3388, %rd3386, %rd3365, 32, 32; - bfi.b64 %rd3389, %rd3385, %rd3387, 32, 32; - mov.b64 {%r4662, %r4663}, %rd3388; - mov.b64 {%r4664, %r4665}, %rd3389; - shf.l.wrap.b32 %r4666, %r4662, %r4662, 5; - 
xor.b32 %r4667, %r4665, %r4664; - and.b32 %r4668, %r4667, %r4663; - and.b32 %r4669, %r4665, %r4664; - xor.b32 %r4670, %r4668, %r4669; - add.s32 %r4671, %r4658, %r4613; - add.s32 %r4672, %r4671, %r4666; - add.s32 %r4673, %r4672, %r4670; - add.s32 %r4674, %r4673, -1894007588; - shf.l.wrap.b32 %r4675, %r4663, %r4663, 30; - shf.l.wrap.b32 %r4676, %r4674, %r4674, 5; - xor.b32 %r4677, %r4675, %r4664; - and.b32 %r4678, %r4677, %r4662; - and.b32 %r4679, %r4675, %r4664; - xor.b32 %r4680, %r4678, %r4679; - add.s32 %r4681, %r4659, %r4665; - add.s32 %r4682, %r4681, %r4680; - add.s32 %r4683, %r4682, %r4676; - add.s32 %r4684, %r4683, -1894007588; - shf.l.wrap.b32 %r4685, %r4662, %r4662, 30; - shf.l.wrap.b32 %r4686, %r4684, %r4684, 5; - xor.b32 %r4687, %r4675, %r4685; - and.b32 %r4688, %r4674, %r4687; - and.b32 %r4689, %r4675, %r4685; - xor.b32 %r4690, %r4688, %r4689; - add.s32 %r4691, %r4660, %r4664; - add.s32 %r4692, %r4691, %r4690; - add.s32 %r4693, %r4692, %r4686; - add.s32 %r4694, %r4693, -1894007588; - shf.l.wrap.b32 %r4695, %r4674, %r4674, 30; - shf.l.wrap.b32 %r4696, %r4694, %r4694, 5; - xor.b32 %r4697, %r4695, %r4685; - and.b32 %r4698, %r4684, %r4697; - and.b32 %r4699, %r4695, %r4685; - xor.b32 %r4700, %r4698, %r4699; - add.s32 %r4701, %r4661, %r4675; - add.s32 %r4702, %r4701, %r4700; - add.s32 %r4703, %r4702, %r4696; - add.s32 %r4704, %r4703, -1894007588; - shf.l.wrap.b32 %r4705, %r4684, %r4684, 30; - xor.b32 %r4706, %r4473, %r4471; - xor.b32 %r4707, %r4534, %r4472; - xor.b32 %r4708, %r4535, %r4473; - cvt.u64.u32 %rd3390, %r4708; - cvt.u64.u32 %rd3391, %r4706; - xor.b32 %r4709, %r4472, %r4470; - cvt.u64.u32 %rd3392, %r4709; - cvt.u64.u32 %rd3393, %r4707; - bfi.b64 %rd3394, %rd3390, %rd3393, 32, 32; - bfi.b64 %rd3395, %rd3391, %rd3392, 32, 32; - mov.b64 {%r4710, %r4711}, %rd3395; - mov.b64 {%r4712, %r4713}, %rd3394; - xor.b32 %r4714, %r4591, %r4709; - xor.b32 %r4715, %r4595, %r4711; - xor.b32 %r4716, %r4596, %r4712; - xor.b32 %r4717, %r4597, %r4713; - xor.b32 %r4718, 
%r4659, %r4714; - xor.b32 %r4719, %r4715, %r4660; - shf.l.wrap.b32 %r4720, %r4719, %r4719, 1; - xor.b32 %r4721, %r4716, %r4661; - shf.l.wrap.b32 %r4722, %r4721, %r4721, 1; - shf.l.wrap.b32 %r4723, %r4718, %r4718, 1; - xor.b32 %r4724, %r4717, %r4723; - shf.l.wrap.b32 %r4725, %r4724, %r4724, 1; - cvt.u64.u32 %rd3396, %r4725; - cvt.u64.u32 %rd3397, %r4720; - cvt.u64.u32 %rd3398, %r4722; - bfi.b64 %rd3399, %rd3396, %rd3398, 32, 32; - cvt.u64.u32 %rd3400, %r4723; - bfi.b64 %rd3401, %rd3397, %rd3400, 32, 32; - mov.b64 {%r4726, %r4727}, %rd3401; - mov.b64 {%r4728, %r4729}, %rd3399; - cvt.u64.u32 %rd3402, %r4729; - cvt.u64.u32 %rd3403, %r4727; - cvt.u64.u32 %rd3404, %r4728; - bfi.b64 %rd3405, %rd3402, %rd3404, 32, 32; - bfi.b64 %rd3406, %rd3403, %rd3400, 32, 32; - mov.b64 {%r4730, %r4731}, %rd3406; - mov.b64 {%r4732, %r4733}, %rd3405; - shf.l.wrap.b32 %r4734, %r4704, %r4704, 5; - xor.b32 %r4735, %r4705, %r4695; - and.b32 %r4736, %r4735, %r4694; - and.b32 %r4737, %r4705, %r4695; - xor.b32 %r4738, %r4736, %r4737; - add.s32 %r4739, %r4730, %r4685; - add.s32 %r4740, %r4739, %r4738; - add.s32 %r4741, %r4740, %r4734; - add.s32 %r4742, %r4741, -1894007588; - shf.l.wrap.b32 %r4743, %r4694, %r4694, 30; - shf.l.wrap.b32 %r4744, %r4742, %r4742, 5; - xor.b32 %r4745, %r4743, %r4705; - and.b32 %r4746, %r4745, %r4704; - and.b32 %r4747, %r4743, %r4705; - xor.b32 %r4748, %r4746, %r4747; - add.s32 %r4749, %r4731, %r4695; - add.s32 %r4750, %r4749, %r4748; - add.s32 %r4751, %r4750, %r4744; - add.s32 %r4752, %r4751, -1894007588; - shf.l.wrap.b32 %r4753, %r4704, %r4704, 30; - shf.l.wrap.b32 %r4754, %r4752, %r4752, 5; - xor.b32 %r4755, %r4753, %r4743; - and.b32 %r4756, %r4742, %r4755; - and.b32 %r4757, %r4753, %r4743; - xor.b32 %r4758, %r4756, %r4757; - add.s32 %r4759, %r4732, %r4705; - add.s32 %r4760, %r4759, %r4758; - add.s32 %r4761, %r4760, %r4754; - add.s32 %r4762, %r4761, -1894007588; - shf.l.wrap.b32 %r4763, %r4742, %r4742, 30; - shf.l.wrap.b32 %r4764, %r4762, %r4762, 5; - xor.b32 %r4765, 
%r4763, %r4753; - and.b32 %r4766, %r4752, %r4765; - and.b32 %r4767, %r4763, %r4753; - xor.b32 %r4768, %r4766, %r4767; - add.s32 %r4769, %r4733, %r4743; - add.s32 %r4770, %r4769, %r4768; - add.s32 %r4771, %r4770, %r4764; - add.s32 %r4772, %r4771, -1894007588; - shf.l.wrap.b32 %r4773, %r4752, %r4752, 30; - cvt.u64.u32 %rd3407, %r4763; - cvt.u64.u32 %rd3408, %r4773; - cvt.u64.u32 %rd3409, %r4762; - cvt.u64.u32 %rd3410, %r4772; - bfi.b64 %rd3411, %rd3409, %rd3410, 32, 32; - bfi.b64 %rd3412, %rd3407, %rd3408, 32, 32; - mov.b64 {%r4774, %r4775}, %rd3411; - mov.b64 {%r4776, %r4777}, %rd3412; - xor.b32 %r4778, %r4537, %r4535; - xor.b32 %r4779, %r4594, %r4536; - xor.b32 %r4780, %r4595, %r4537; - cvt.u64.u32 %rd3413, %r4780; - cvt.u64.u32 %rd3414, %r4778; - xor.b32 %r4781, %r4536, %r4534; - cvt.u64.u32 %rd3415, %r4781; - cvt.u64.u32 %rd3416, %r4779; - bfi.b64 %rd3417, %rd3413, %rd3416, 32, 32; - bfi.b64 %rd3418, %rd3414, %rd3415, 32, 32; - mov.b64 {%r4782, %r4783}, %rd3418; - mov.b64 {%r4784, %r4785}, %rd3417; - xor.b32 %r4786, %r4651, %r4781; - xor.b32 %r4787, %r4659, %r4783; - xor.b32 %r4788, %r4660, %r4784; - xor.b32 %r4789, %r4661, %r4785; - xor.b32 %r4790, %r4731, %r4786; - xor.b32 %r4791, %r4787, %r4732; - shf.l.wrap.b32 %r4792, %r4791, %r4791, 1; - xor.b32 %r4793, %r4788, %r4733; - shf.l.wrap.b32 %r4794, %r4793, %r4793, 1; - shf.l.wrap.b32 %r4795, %r4790, %r4790, 1; - xor.b32 %r4796, %r4789, %r4795; - shf.l.wrap.b32 %r4797, %r4796, %r4796, 1; - cvt.u64.u32 %rd3419, %r4797; - cvt.u64.u32 %rd3420, %r4792; - cvt.u64.u32 %rd3421, %r4794; - bfi.b64 %rd3422, %rd3419, %rd3421, 32, 32; - cvt.u64.u32 %rd3423, %r4795; - bfi.b64 %rd3424, %rd3420, %rd3423, 32, 32; - mov.b64 {%r4798, %r4799}, %rd3424; - mov.b64 {%r4800, %r4801}, %rd3422; - cvt.u64.u32 %rd3425, %r4801; - cvt.u64.u32 %rd3426, %r4799; - cvt.u64.u32 %rd3427, %r4800; - bfi.b64 %rd3428, %rd3425, %rd3427, 32, 32; - bfi.b64 %rd3429, %rd3426, %rd3423, 32, 32; - mov.b64 {%r4802, %r4803}, %rd3429; - mov.b64 {%r4804, %r4805}, 
%rd3428; - cvt.u64.u32 %rd3430, %r4777; - cvt.u64.u32 %rd3431, %r4775; - cvt.u64.u32 %rd3432, %r4776; - bfi.b64 %rd3433, %rd3431, %rd3410, 32, 32; - bfi.b64 %rd3434, %rd3430, %rd3432, 32, 32; - mov.b64 {%r4806, %r4807}, %rd3433; - mov.b64 {%r4808, %r4809}, %rd3434; - shf.l.wrap.b32 %r4810, %r4806, %r4806, 5; - xor.b32 %r4811, %r4809, %r4808; - and.b32 %r4812, %r4811, %r4807; - and.b32 %r4813, %r4809, %r4808; - xor.b32 %r4814, %r4812, %r4813; - add.s32 %r4815, %r4802, %r4753; - add.s32 %r4816, %r4815, %r4810; - add.s32 %r4817, %r4816, %r4814; - add.s32 %r4818, %r4817, -1894007588; - shf.l.wrap.b32 %r4819, %r4807, %r4807, 30; - shf.l.wrap.b32 %r4820, %r4818, %r4818, 5; - xor.b32 %r4821, %r4819, %r4808; - and.b32 %r4822, %r4821, %r4806; - and.b32 %r4823, %r4819, %r4808; - xor.b32 %r4824, %r4822, %r4823; - add.s32 %r4825, %r4803, %r4809; - add.s32 %r4826, %r4825, %r4824; - add.s32 %r4827, %r4826, %r4820; - add.s32 %r4828, %r4827, -1894007588; - shf.l.wrap.b32 %r4829, %r4806, %r4806, 30; - shf.l.wrap.b32 %r4830, %r4828, %r4828, 5; - xor.b32 %r4831, %r4819, %r4829; - and.b32 %r4832, %r4818, %r4831; - and.b32 %r4833, %r4819, %r4829; - xor.b32 %r4834, %r4832, %r4833; - add.s32 %r4835, %r4804, %r4808; - add.s32 %r4836, %r4835, %r4834; - add.s32 %r4837, %r4836, %r4830; - add.s32 %r4838, %r4837, -1894007588; - shf.l.wrap.b32 %r4839, %r4818, %r4818, 30; - shf.l.wrap.b32 %r4840, %r4838, %r4838, 5; - xor.b32 %r4841, %r4839, %r4829; - and.b32 %r4842, %r4828, %r4841; - and.b32 %r4843, %r4839, %r4829; - xor.b32 %r4844, %r4842, %r4843; - add.s32 %r4845, %r4805, %r4819; - add.s32 %r4846, %r4845, %r4844; - add.s32 %r4847, %r4846, %r4840; - add.s32 %r4848, %r4847, -1894007588; - shf.l.wrap.b32 %r4849, %r4828, %r4828, 30; - xor.b32 %r4850, %r4597, %r4595; - xor.b32 %r4851, %r4658, %r4596; - xor.b32 %r4852, %r4659, %r4597; - cvt.u64.u32 %rd3435, %r4852; - cvt.u64.u32 %rd3436, %r4850; - xor.b32 %r4853, %r4596, %r4594; - cvt.u64.u32 %rd3437, %r4853; - cvt.u64.u32 %rd3438, %r4851; - bfi.b64 
%rd3439, %rd3435, %rd3438, 32, 32; - bfi.b64 %rd3440, %rd3436, %rd3437, 32, 32; - mov.b64 {%r4854, %r4855}, %rd3440; - mov.b64 {%r4856, %r4857}, %rd3439; - xor.b32 %r4858, %r4723, %r4853; - xor.b32 %r4859, %r4731, %r4855; - xor.b32 %r4860, %r4732, %r4856; - xor.b32 %r4861, %r4733, %r4857; - xor.b32 %r4862, %r4803, %r4858; - xor.b32 %r4863, %r4859, %r4804; - shf.l.wrap.b32 %r4864, %r4863, %r4863, 1; - xor.b32 %r4865, %r4860, %r4805; - shf.l.wrap.b32 %r4866, %r4865, %r4865, 1; - shf.l.wrap.b32 %r4867, %r4862, %r4862, 1; - xor.b32 %r4868, %r4861, %r4867; - shf.l.wrap.b32 %r4869, %r4868, %r4868, 1; - cvt.u64.u32 %rd3441, %r4869; - cvt.u64.u32 %rd3442, %r4864; - cvt.u64.u32 %rd3443, %r4866; - bfi.b64 %rd3444, %rd3441, %rd3443, 32, 32; - cvt.u64.u32 %rd3445, %r4867; - bfi.b64 %rd3446, %rd3442, %rd3445, 32, 32; - mov.b64 {%r4870, %r4871}, %rd3446; - mov.b64 {%r4872, %r4873}, %rd3444; - cvt.u64.u32 %rd3447, %r4873; - cvt.u64.u32 %rd3448, %r4871; - cvt.u64.u32 %rd3449, %r4872; - bfi.b64 %rd3450, %rd3447, %rd3449, 32, 32; - bfi.b64 %rd3451, %rd3448, %rd3445, 32, 32; - mov.b64 {%r4874, %r4875}, %rd3451; - mov.b64 {%r4876, %r4877}, %rd3450; - shf.l.wrap.b32 %r4878, %r4848, %r4848, 5; - xor.b32 %r4879, %r4849, %r4839; - and.b32 %r4880, %r4879, %r4838; - and.b32 %r4881, %r4849, %r4839; - xor.b32 %r4882, %r4880, %r4881; - add.s32 %r4883, %r4874, %r4829; - add.s32 %r4884, %r4883, %r4882; - add.s32 %r4885, %r4884, %r4878; - add.s32 %r4886, %r4885, -1894007588; - shf.l.wrap.b32 %r4887, %r4838, %r4838, 30; - shf.l.wrap.b32 %r4888, %r4886, %r4886, 5; - xor.b32 %r4889, %r4887, %r4849; - and.b32 %r4890, %r4889, %r4848; - and.b32 %r4891, %r4887, %r4849; - xor.b32 %r4892, %r4890, %r4891; - add.s32 %r4893, %r4875, %r4839; - add.s32 %r4894, %r4893, %r4892; - add.s32 %r4895, %r4894, %r4888; - add.s32 %r4896, %r4895, -1894007588; - shf.l.wrap.b32 %r4897, %r4848, %r4848, 30; - shf.l.wrap.b32 %r4898, %r4896, %r4896, 5; - xor.b32 %r4899, %r4897, %r4887; - and.b32 %r4900, %r4886, %r4899; - 
and.b32 %r4901, %r4897, %r4887; - xor.b32 %r4902, %r4900, %r4901; - add.s32 %r4903, %r4876, %r4849; - add.s32 %r4904, %r4903, %r4902; - add.s32 %r4905, %r4904, %r4898; - add.s32 %r4906, %r4905, -1894007588; - shf.l.wrap.b32 %r4907, %r4886, %r4886, 30; - shf.l.wrap.b32 %r4908, %r4906, %r4906, 5; - xor.b32 %r4909, %r4907, %r4897; - and.b32 %r4910, %r4896, %r4909; - and.b32 %r4911, %r4907, %r4897; - xor.b32 %r4912, %r4910, %r4911; - add.s32 %r4913, %r4877, %r4887; - add.s32 %r4914, %r4913, %r4912; - add.s32 %r4915, %r4914, %r4908; - add.s32 %r4916, %r4915, -1894007588; - shf.l.wrap.b32 %r4917, %r4896, %r4896, 30; - cvt.u64.u32 %rd3452, %r4907; - cvt.u64.u32 %rd3453, %r4917; - cvt.u64.u32 %rd3454, %r4906; - cvt.u64.u32 %rd3455, %r4916; - bfi.b64 %rd3456, %rd3454, %rd3455, 32, 32; - bfi.b64 %rd3457, %rd3452, %rd3453, 32, 32; - mov.b64 {%r4918, %r4919}, %rd3456; - mov.b64 {%r4920, %r4921}, %rd3457; - xor.b32 %r4922, %r4661, %r4659; - xor.b32 %r4923, %r4730, %r4660; - xor.b32 %r4924, %r4731, %r4661; - cvt.u64.u32 %rd3458, %r4924; - cvt.u64.u32 %rd3459, %r4922; - xor.b32 %r4925, %r4660, %r4658; - cvt.u64.u32 %rd3460, %r4925; - cvt.u64.u32 %rd3461, %r4923; - bfi.b64 %rd3462, %rd3458, %rd3461, 32, 32; - bfi.b64 %rd3463, %rd3459, %rd3460, 32, 32; - mov.b64 {%r4926, %r4927}, %rd3463; - mov.b64 {%r4928, %r4929}, %rd3462; - xor.b32 %r4930, %r4795, %r4925; - xor.b32 %r4931, %r4803, %r4927; - xor.b32 %r4932, %r4804, %r4928; - xor.b32 %r4933, %r4805, %r4929; - xor.b32 %r4934, %r4875, %r4930; - xor.b32 %r4935, %r4931, %r4876; - shf.l.wrap.b32 %r4936, %r4935, %r4935, 1; - xor.b32 %r4937, %r4932, %r4877; - shf.l.wrap.b32 %r4938, %r4937, %r4937, 1; - shf.l.wrap.b32 %r4939, %r4934, %r4934, 1; - xor.b32 %r4940, %r4933, %r4939; - shf.l.wrap.b32 %r4941, %r4940, %r4940, 1; - cvt.u64.u32 %rd3464, %r4941; - cvt.u64.u32 %rd3465, %r4936; - cvt.u64.u32 %rd3466, %r4939; - cvt.u64.u32 %rd3467, %r4938; - bfi.b64 %rd3468, %rd3464, %rd3467, 32, 32; - bfi.b64 %rd3469, %rd3465, %rd3466, 32, 32; - 
mov.b64 {%r4942, %r4943}, %rd3469; - mov.b64 {%r4944, %r4945}, %rd3468; - cvt.u64.u32 %rd3470, %r4921; - cvt.u64.u32 %rd3471, %r4919; - cvt.u64.u32 %rd3472, %r4920; - bfi.b64 %rd3473, %rd3471, %rd3455, 32, 32; - bfi.b64 %rd3474, %rd3470, %rd3472, 32, 32; - mov.b64 {%r4946, %r4947}, %rd3473; - mov.b64 {%r4948, %r4949}, %rd3474; - shf.l.wrap.b32 %r4950, %r4946, %r4946, 5; - xor.b32 %r4951, %r4949, %r4948; - and.b32 %r4952, %r4951, %r4947; - and.b32 %r4953, %r4949, %r4948; - xor.b32 %r4954, %r4952, %r4953; - add.s32 %r4955, %r4942, %r4897; - add.s32 %r4956, %r4955, %r4950; - add.s32 %r4957, %r4956, %r4954; - add.s32 %r4958, %r4957, -1894007588; - shf.l.wrap.b32 %r4959, %r4947, %r4947, 30; - shf.l.wrap.b32 %r4960, %r4958, %r4958, 5; - xor.b32 %r4961, %r4959, %r4948; - and.b32 %r4962, %r4961, %r4946; - and.b32 %r4963, %r4959, %r4948; - xor.b32 %r4964, %r4962, %r4963; - add.s32 %r4965, %r4943, %r4949; - add.s32 %r4966, %r4965, %r4964; - add.s32 %r4967, %r4966, %r4960; - add.s32 %r4968, %r4967, -1894007588; - shf.l.wrap.b32 %r4969, %r4946, %r4946, 30; - shf.l.wrap.b32 %r4970, %r4968, %r4968, 5; - xor.b32 %r4971, %r4959, %r4969; - and.b32 %r4972, %r4958, %r4971; - and.b32 %r4973, %r4959, %r4969; - xor.b32 %r4974, %r4972, %r4973; - add.s32 %r4975, %r4944, %r4948; - add.s32 %r4976, %r4975, %r4974; - add.s32 %r4977, %r4976, %r4970; - add.s32 %r4978, %r4977, -1894007588; - shf.l.wrap.b32 %r4979, %r4958, %r4958, 30; - shf.l.wrap.b32 %r4980, %r4978, %r4978, 5; - xor.b32 %r4981, %r4979, %r4969; - and.b32 %r4982, %r4968, %r4981; - and.b32 %r4983, %r4979, %r4969; - xor.b32 %r4984, %r4982, %r4983; - add.s32 %r4985, %r4945, %r4959; - add.s32 %r4986, %r4985, %r4984; - add.s32 %r4987, %r4986, %r4980; - add.s32 %r4988, %r4987, -1894007588; - shf.l.wrap.b32 %r4989, %r4968, %r4968, 30; - xor.b32 %r4990, %r4733, %r4731; - xor.b32 %r4991, %r4802, %r4732; - xor.b32 %r4992, %r4803, %r4733; - cvt.u64.u32 %rd3475, %r4992; - cvt.u64.u32 %rd3476, %r4990; - xor.b32 %r4993, %r4732, %r4730; - 
cvt.u64.u32 %rd3477, %r4993; - cvt.u64.u32 %rd3478, %r4991; - bfi.b64 %rd3479, %rd3475, %rd3478, 32, 32; - bfi.b64 %rd3480, %rd3476, %rd3477, 32, 32; - mov.b64 {%r4994, %r4995}, %rd3480; - mov.b64 {%r4996, %r4997}, %rd3479; - xor.b32 %r4998, %r4867, %r4993; - xor.b32 %r4999, %r4875, %r4995; - xor.b32 %r5000, %r4876, %r4996; - xor.b32 %r5001, %r4877, %r4997; - xor.b32 %r5002, %r4943, %r4998; - xor.b32 %r5003, %r4999, %r4944; - shf.l.wrap.b32 %r5004, %r5003, %r5003, 1; - xor.b32 %r5005, %r5000, %r4945; - shf.l.wrap.b32 %r5006, %r5005, %r5005, 1; - shf.l.wrap.b32 %r5007, %r5002, %r5002, 1; - xor.b32 %r5008, %r5001, %r5007; - shf.l.wrap.b32 %r5009, %r5008, %r5008, 1; - cvt.u64.u32 %rd3481, %r5009; - cvt.u64.u32 %rd3482, %r5004; - cvt.u64.u32 %rd3483, %r5006; - bfi.b64 %rd3484, %rd3481, %rd3483, 32, 32; - cvt.u64.u32 %rd3485, %r5007; - bfi.b64 %rd3486, %rd3482, %rd3485, 32, 32; - mov.b64 {%r5010, %r5011}, %rd3486; - mov.b64 {%r5012, %r5013}, %rd3484; - cvt.u64.u32 %rd3487, %r5013; - cvt.u64.u32 %rd3488, %r5011; - cvt.u64.u32 %rd3489, %r5012; - bfi.b64 %rd3490, %rd3487, %rd3489, 32, 32; - bfi.b64 %rd3491, %rd3488, %rd3485, 32, 32; - mov.b64 {%r5014, %r5015}, %rd3491; - mov.b64 {%r5016, %r5017}, %rd3490; - shf.l.wrap.b32 %r5018, %r4988, %r4988, 5; - xor.b32 %r5019, %r4989, %r4979; - xor.b32 %r5020, %r5019, %r4978; - add.s32 %r5021, %r5014, %r4969; - add.s32 %r5022, %r5021, %r5020; - add.s32 %r5023, %r5022, %r5018; - add.s32 %r5024, %r5023, -899497514; - shf.l.wrap.b32 %r5025, %r4978, %r4978, 30; - shf.l.wrap.b32 %r5026, %r5024, %r5024, 5; - xor.b32 %r5027, %r5025, %r4989; - xor.b32 %r5028, %r5027, %r4988; - add.s32 %r5029, %r5015, %r4979; - add.s32 %r5030, %r5029, %r5028; - add.s32 %r5031, %r5030, %r5026; - add.s32 %r5032, %r5031, -899497514; - shf.l.wrap.b32 %r5033, %r4988, %r4988, 30; - shf.l.wrap.b32 %r5034, %r5032, %r5032, 5; - xor.b32 %r5035, %r5033, %r5025; - xor.b32 %r5036, %r5035, %r5024; - add.s32 %r5037, %r5016, %r4989; - add.s32 %r5038, %r5037, %r5036; - 
add.s32 %r5039, %r5038, %r5034; - add.s32 %r5040, %r5039, -899497514; - shf.l.wrap.b32 %r5041, %r5024, %r5024, 30; - shf.l.wrap.b32 %r5042, %r5040, %r5040, 5; - xor.b32 %r5043, %r5041, %r5033; - xor.b32 %r5044, %r5043, %r5032; - add.s32 %r5045, %r5017, %r5025; - add.s32 %r5046, %r5045, %r5044; - add.s32 %r5047, %r5046, %r5042; - add.s32 %r5048, %r5047, -899497514; - shf.l.wrap.b32 %r5049, %r5032, %r5032, 30; - cvt.u64.u32 %rd3492, %r5041; - cvt.u64.u32 %rd3493, %r5049; - cvt.u64.u32 %rd3494, %r5040; - cvt.u64.u32 %rd3495, %r5048; - bfi.b64 %rd3496, %rd3494, %rd3495, 32, 32; - bfi.b64 %rd3497, %rd3492, %rd3493, 32, 32; - mov.b64 {%r5050, %r5051}, %rd3496; - mov.b64 {%r5052, %r5053}, %rd3497; - xor.b32 %r5054, %r4805, %r4803; - xor.b32 %r5055, %r4874, %r4804; - xor.b32 %r5056, %r4875, %r4805; - cvt.u64.u32 %rd3498, %r5056; - cvt.u64.u32 %rd3499, %r5054; - xor.b32 %r5057, %r4804, %r4802; - cvt.u64.u32 %rd3500, %r5057; - cvt.u64.u32 %rd3501, %r5055; - bfi.b64 %rd3502, %rd3498, %rd3501, 32, 32; - bfi.b64 %rd3503, %rd3499, %rd3500, 32, 32; - mov.b64 {%r5058, %r5059}, %rd3503; - mov.b64 {%r5060, %r5061}, %rd3502; - xor.b32 %r5062, %r4939, %r5057; - xor.b32 %r5063, %r4943, %r5059; - xor.b32 %r5064, %r4944, %r5060; - xor.b32 %r5065, %r4945, %r5061; - xor.b32 %r5066, %r5015, %r5062; - xor.b32 %r5067, %r5063, %r5016; - shf.l.wrap.b32 %r5068, %r5067, %r5067, 1; - xor.b32 %r5069, %r5064, %r5017; - shf.l.wrap.b32 %r5070, %r5069, %r5069, 1; - shf.l.wrap.b32 %r5071, %r5066, %r5066, 1; - xor.b32 %r5072, %r5065, %r5071; - shf.l.wrap.b32 %r5073, %r5072, %r5072, 1; - cvt.u64.u32 %rd3504, %r5073; - cvt.u64.u32 %rd3505, %r5068; - cvt.u64.u32 %rd3506, %r5070; - bfi.b64 %rd3507, %rd3504, %rd3506, 32, 32; - cvt.u64.u32 %rd3508, %r5071; - bfi.b64 %rd3509, %rd3505, %rd3508, 32, 32; - mov.b64 {%r5074, %r5075}, %rd3509; - mov.b64 {%r5076, %r5077}, %rd3507; - cvt.u64.u32 %rd3510, %r5077; - cvt.u64.u32 %rd3511, %r5075; - cvt.u64.u32 %rd3512, %r5076; - bfi.b64 %rd3513, %rd3510, %rd3512, 32, 32; - 
bfi.b64 %rd3514, %rd3511, %rd3508, 32, 32; - mov.b64 {%r5078, %r5079}, %rd3514; - mov.b64 {%r5080, %r5081}, %rd3513; - cvt.u64.u32 %rd3515, %r5053; - cvt.u64.u32 %rd3516, %r5051; - cvt.u64.u32 %rd3517, %r5052; - bfi.b64 %rd3518, %rd3516, %rd3495, 32, 32; - bfi.b64 %rd3519, %rd3515, %rd3517, 32, 32; - mov.b64 {%r5082, %r5083}, %rd3518; - mov.b64 {%r5084, %r5085}, %rd3519; - shf.l.wrap.b32 %r5086, %r5082, %r5082, 5; - xor.b32 %r5087, %r5084, %r5083; - xor.b32 %r5088, %r5087, %r5085; - add.s32 %r5089, %r5078, %r5033; - add.s32 %r5090, %r5089, %r5086; - add.s32 %r5091, %r5090, %r5088; - add.s32 %r5092, %r5091, -899497514; - shf.l.wrap.b32 %r5093, %r5083, %r5083, 30; - shf.l.wrap.b32 %r5094, %r5092, %r5092, 5; - xor.b32 %r5095, %r5084, %r5082; - xor.b32 %r5096, %r5095, %r5093; - add.s32 %r5097, %r5079, %r5085; - add.s32 %r5098, %r5097, %r5096; - add.s32 %r5099, %r5098, %r5094; - add.s32 %r5100, %r5099, -899497514; - shf.l.wrap.b32 %r5101, %r5082, %r5082, 30; - shf.l.wrap.b32 %r5102, %r5100, %r5100, 5; - xor.b32 %r5103, %r5093, %r5101; - xor.b32 %r5104, %r5103, %r5092; - add.s32 %r5105, %r5080, %r5084; - add.s32 %r5106, %r5105, %r5104; - add.s32 %r5107, %r5106, %r5102; - add.s32 %r5108, %r5107, -899497514; - shf.l.wrap.b32 %r5109, %r5092, %r5092, 30; - shf.l.wrap.b32 %r5110, %r5108, %r5108, 5; - xor.b32 %r5111, %r5109, %r5101; - xor.b32 %r5112, %r5111, %r5100; - add.s32 %r5113, %r5081, %r5093; - add.s32 %r5114, %r5113, %r5112; - add.s32 %r5115, %r5114, %r5110; - add.s32 %r5116, %r5115, -899497514; - shf.l.wrap.b32 %r5117, %r5100, %r5100, 30; - xor.b32 %r5118, %r4877, %r4875; - xor.b32 %r5119, %r4942, %r4876; - xor.b32 %r5120, %r4943, %r4877; - cvt.u64.u32 %rd3520, %r5120; - cvt.u64.u32 %rd3521, %r5118; - xor.b32 %r5121, %r4876, %r4874; - cvt.u64.u32 %rd3522, %r5121; - cvt.u64.u32 %rd3523, %r5119; - bfi.b64 %rd3524, %rd3520, %rd3523, 32, 32; - bfi.b64 %rd3525, %rd3521, %rd3522, 32, 32; - mov.b64 {%r5122, %r5123}, %rd3525; - mov.b64 {%r5124, %r5125}, %rd3524; - xor.b32 
%r5126, %r5007, %r5121; - xor.b32 %r5127, %r5015, %r5123; - xor.b32 %r5128, %r5016, %r5124; - xor.b32 %r5129, %r5017, %r5125; - xor.b32 %r5130, %r5079, %r5126; - xor.b32 %r5131, %r5127, %r5080; - shf.l.wrap.b32 %r5132, %r5131, %r5131, 1; - xor.b32 %r5133, %r5128, %r5081; - shf.l.wrap.b32 %r5134, %r5133, %r5133, 1; - shf.l.wrap.b32 %r5135, %r5130, %r5130, 1; - xor.b32 %r5136, %r5129, %r5135; - shf.l.wrap.b32 %r5137, %r5136, %r5136, 1; - cvt.u64.u32 %rd3526, %r5137; - cvt.u64.u32 %rd3527, %r5132; - cvt.u64.u32 %rd3528, %r5134; - bfi.b64 %rd3529, %rd3526, %rd3528, 32, 32; - cvt.u64.u32 %rd3530, %r5135; - bfi.b64 %rd3531, %rd3527, %rd3530, 32, 32; - mov.b64 {%r5138, %r5139}, %rd3531; - mov.b64 {%r5140, %r5141}, %rd3529; - cvt.u64.u32 %rd3532, %r5141; - cvt.u64.u32 %rd3533, %r5139; - cvt.u64.u32 %rd3534, %r5140; - bfi.b64 %rd3535, %rd3532, %rd3534, 32, 32; - bfi.b64 %rd3536, %rd3533, %rd3530, 32, 32; - mov.b64 {%r5142, %r5143}, %rd3536; - mov.b64 {%r5144, %r5145}, %rd3535; - shf.l.wrap.b32 %r5146, %r5116, %r5116, 5; - xor.b32 %r5147, %r5117, %r5109; - xor.b32 %r5148, %r5147, %r5108; - add.s32 %r5149, %r5142, %r5101; - add.s32 %r5150, %r5149, %r5148; - add.s32 %r5151, %r5150, %r5146; - add.s32 %r5152, %r5151, -899497514; - shf.l.wrap.b32 %r5153, %r5108, %r5108, 30; - shf.l.wrap.b32 %r5154, %r5152, %r5152, 5; - xor.b32 %r5155, %r5153, %r5117; - xor.b32 %r5156, %r5155, %r5116; - add.s32 %r5157, %r5143, %r5109; - add.s32 %r5158, %r5157, %r5156; - add.s32 %r5159, %r5158, %r5154; - add.s32 %r5160, %r5159, -899497514; - shf.l.wrap.b32 %r5161, %r5116, %r5116, 30; - shf.l.wrap.b32 %r5162, %r5160, %r5160, 5; - xor.b32 %r5163, %r5161, %r5153; - xor.b32 %r5164, %r5163, %r5152; - add.s32 %r5165, %r5144, %r5117; - add.s32 %r5166, %r5165, %r5164; - add.s32 %r5167, %r5166, %r5162; - add.s32 %r5168, %r5167, -899497514; - shf.l.wrap.b32 %r5169, %r5152, %r5152, 30; - shf.l.wrap.b32 %r5170, %r5168, %r5168, 5; - xor.b32 %r5171, %r5169, %r5161; - xor.b32 %r5172, %r5171, %r5160; - add.s32 
%r5173, %r5145, %r5153; - add.s32 %r5174, %r5173, %r5172; - add.s32 %r5175, %r5174, %r5170; - add.s32 %r5176, %r5175, -899497514; - shf.l.wrap.b32 %r5177, %r5160, %r5160, 30; - cvt.u64.u32 %rd3537, %r5169; - cvt.u64.u32 %rd3538, %r5177; - cvt.u64.u32 %rd3539, %r5168; - cvt.u64.u32 %rd3540, %r5176; - bfi.b64 %rd3541, %rd3539, %rd3540, 32, 32; - bfi.b64 %rd3542, %rd3537, %rd3538, 32, 32; - mov.b64 {%r5178, %r5179}, %rd3541; - mov.b64 {%r5180, %r5181}, %rd3542; - xor.b32 %r5182, %r4945, %r4943; - xor.b32 %r5183, %r5014, %r4944; - xor.b32 %r5184, %r5015, %r4945; - cvt.u64.u32 %rd3543, %r5184; - cvt.u64.u32 %rd3544, %r5182; - xor.b32 %r5185, %r4944, %r4942; - cvt.u64.u32 %rd3545, %r5185; - cvt.u64.u32 %rd3546, %r5183; - bfi.b64 %rd3547, %rd3543, %rd3546, 32, 32; - bfi.b64 %rd3548, %rd3544, %rd3545, 32, 32; - mov.b64 {%r5186, %r5187}, %rd3548; - mov.b64 {%r5188, %r5189}, %rd3547; - xor.b32 %r5190, %r5071, %r5185; - xor.b32 %r5191, %r5079, %r5187; - xor.b32 %r5192, %r5080, %r5188; - xor.b32 %r5193, %r5081, %r5189; - xor.b32 %r5194, %r5143, %r5190; - shf.l.wrap.b32 %r5195, %r5194, %r5194, 1; - xor.b32 %r5196, %r5191, %r5144; - shf.l.wrap.b32 %r5197, %r5196, %r5196, 1; - xor.b32 %r5198, %r5192, %r5145; - shf.l.wrap.b32 %r5199, %r5198, %r5198, 1; - xor.b32 %r5200, %r5193, %r5195; - shf.l.wrap.b32 %r5201, %r5200, %r5200, 1; - cvt.u64.u32 %rd3549, %r5201; - cvt.u64.u32 %rd3550, %r5197; - cvt.u64.u32 %rd3551, %r5199; - bfi.b64 %rd3552, %rd3549, %rd3551, 32, 32; - cvt.u64.u32 %rd3553, %r5195; - bfi.b64 %rd3554, %rd3550, %rd3553, 32, 32; - mov.b64 {%r5202, %r5203}, %rd3554; - mov.b64 {%r5204, %r5205}, %rd3552; - cvt.u64.u32 %rd3555, %r5205; - cvt.u64.u32 %rd3556, %r5203; - cvt.u64.u32 %rd3557, %r5204; - bfi.b64 %rd3558, %rd3555, %rd3557, 32, 32; - bfi.b64 %rd3559, %rd3556, %rd3553, 32, 32; - mov.b64 {%r5206, %r5207}, %rd3559; - mov.b64 {%r5208, %r5209}, %rd3558; - cvt.u64.u32 %rd3560, %r5181; - cvt.u64.u32 %rd3561, %r5179; - cvt.u64.u32 %rd3562, %r5180; - bfi.b64 %rd3563, 
%rd3561, %rd3540, 32, 32; - bfi.b64 %rd3564, %rd3560, %rd3562, 32, 32; - mov.b64 {%r5210, %r5211}, %rd3563; - mov.b64 {%r5212, %r5213}, %rd3564; - shf.l.wrap.b32 %r5214, %r5210, %r5210, 5; - xor.b32 %r5215, %r5212, %r5211; - xor.b32 %r5216, %r5215, %r5213; - add.s32 %r5217, %r5161, %r5206; - add.s32 %r5218, %r5217, %r5214; - add.s32 %r5219, %r5218, %r5216; - add.s32 %r5220, %r5219, -899497514; - shf.l.wrap.b32 %r5221, %r5211, %r5211, 30; - shf.l.wrap.b32 %r5222, %r5220, %r5220, 5; - xor.b32 %r5223, %r5212, %r5210; - xor.b32 %r5224, %r5223, %r5221; - add.s32 %r5225, %r5207, %r5213; - add.s32 %r5226, %r5225, %r5224; - add.s32 %r5227, %r5226, %r5222; - add.s32 %r5228, %r5227, -899497514; - shf.l.wrap.b32 %r5229, %r5210, %r5210, 30; - shf.l.wrap.b32 %r5230, %r5228, %r5228, 5; - xor.b32 %r5231, %r5221, %r5229; - xor.b32 %r5232, %r5231, %r5220; - add.s32 %r5233, %r5208, %r5212; - add.s32 %r5234, %r5233, %r5232; - add.s32 %r5235, %r5234, %r5230; - add.s32 %r5236, %r5235, -899497514; - shf.l.wrap.b32 %r5237, %r5220, %r5220, 30; - shf.l.wrap.b32 %r5238, %r5236, %r5236, 5; - xor.b32 %r5239, %r5237, %r5229; - xor.b32 %r5240, %r5239, %r5228; - add.s32 %r5241, %r5209, %r5221; - add.s32 %r5242, %r5241, %r5240; - add.s32 %r5243, %r5242, %r5238; - add.s32 %r5244, %r5243, -899497514; - shf.l.wrap.b32 %r5245, %r5228, %r5228, 30; - xor.b32 %r5246, %r5017, %r5015; - xor.b32 %r5247, %r5078, %r5016; - xor.b32 %r5248, %r5079, %r5017; - cvt.u64.u32 %rd3565, %r5248; - cvt.u64.u32 %rd3566, %r5246; - xor.b32 %r5249, %r5016, %r5014; - cvt.u64.u32 %rd3567, %r5249; - cvt.u64.u32 %rd3568, %r5247; - bfi.b64 %rd3569, %rd3565, %rd3568, 32, 32; - bfi.b64 %rd3570, %rd3566, %rd3567, 32, 32; - mov.b64 {%r5250, %r5251}, %rd3570; - mov.b64 {%r5252, %r5253}, %rd3569; - xor.b32 %r5254, %r5135, %r5249; - xor.b32 %r5255, %r5143, %r5251; - xor.b32 %r5256, %r5144, %r5252; - xor.b32 %r5257, %r5145, %r5253; - xor.b32 %r5258, %r5207, %r5254; - shf.l.wrap.b32 %r5259, %r5258, %r5258, 1; - xor.b32 %r5260, %r5255, 
%r5208; - shf.l.wrap.b32 %r5261, %r5260, %r5260, 1; - xor.b32 %r5262, %r5256, %r5209; - shf.l.wrap.b32 %r5263, %r5262, %r5262, 1; - xor.b32 %r5264, %r5257, %r5259; - shf.l.wrap.b32 %r5265, %r5264, %r5264, 1; - shf.l.wrap.b32 %r5266, %r5244, %r5244, 5; - xor.b32 %r5267, %r5245, %r5237; - xor.b32 %r5268, %r5267, %r5236; - add.s32 %r5269, %r5259, %r5229; - add.s32 %r5270, %r5269, %r5268; - add.s32 %r5271, %r5270, %r5266; - add.s32 %r5272, %r5271, -899497514; - shf.l.wrap.b32 %r5273, %r5236, %r5236, 30; - shf.l.wrap.b32 %r5274, %r5272, %r5272, 5; - xor.b32 %r5275, %r5273, %r5245; - xor.b32 %r5276, %r5275, %r5244; - add.s32 %r5277, %r5261, %r5237; - add.s32 %r5278, %r5277, %r5276; - add.s32 %r5279, %r5278, %r5274; - add.s32 %r5280, %r5279, -899497514; - shf.l.wrap.b32 %r5281, %r5244, %r5244, 30; - shf.l.wrap.b32 %r5282, %r5280, %r5280, 5; - xor.b32 %r5283, %r5281, %r5273; - xor.b32 %r5284, %r5283, %r5272; - add.s32 %r5285, %r5263, %r5245; - add.s32 %r5286, %r5285, %r5284; - add.s32 %r5287, %r5286, %r5282; - add.s32 %r5288, %r5287, -899497514; - shf.l.wrap.b32 %r5289, %r5272, %r5272, 30; - shf.l.wrap.b32 %r5290, %r5288, %r5288, 5; - xor.b32 %r5291, %r5289, %r5281; - xor.b32 %r5292, %r5291, %r5280; - shf.l.wrap.b32 %r5293, %r5280, %r5280, 30; - add.s32 %r5294, %r9085, %r5265; - add.s32 %r5295, %r5294, %r5273; - add.s32 %r5296, %r5295, %r5292; - add.s32 %r5297, %r5296, %r5290; - add.s32 %r9085, %r5297, -899497514; - add.s32 %r9086, %r5288, %r9086; - add.s32 %r9087, %r5293, %r9087; - add.s32 %r9088, %r5289, %r9088; - add.s32 %r9089, %r5281, %r9089; - setp.ne.s64 %p228, %rd4247, %rd821; - add.s64 %rd4248, %rd4248, 64; - @%p228 bra $L__BB1_307; - bra.uni $L__BB1_325; - -$L__BB1_66: - setp.gt.u16 %p41, %rs1, 10; - add.u64 %rd1271, %SP, 352; - add.u64 %rd177, %SPL, 352; - mov.u16 %rs1623, 0; - st.local.v4.u16 [%rd177], {%rs1623, %rs1623, %rs1623, %rs1623}; - add.s64 %rd1272, %rd1271, 8; - cvta.to.local.u64 %rd178, %rd1272; - st.local.v4.u16 [%rd178], {%rs1623, %rs1623, %rs1623, 
%rs1623}; - add.s64 %rd1273, %rd1271, 16; - cvta.to.local.u64 %rd179, %rd1273; - st.local.v4.u16 [%rd179], {%rs1623, %rs1623, %rs1623, %rs1623}; - add.s64 %rd1274, %rd1271, 24; - cvta.to.local.u64 %rd180, %rd1274; - st.local.v4.u16 [%rd180], {%rs1623, %rs1623, %rs1623, %rs1623}; - add.s64 %rd1275, %rd1271, 32; - cvta.to.local.u64 %rd181, %rd1275; - st.local.v4.u16 [%rd181], {%rs1623, %rs1623, %rs1623, %rs1623}; - add.s64 %rd1276, %rd1271, 40; - cvta.to.local.u64 %rd182, %rd1276; - st.local.v4.u16 [%rd182], {%rs1623, %rs1623, %rs1623, %rs1623}; - add.s64 %rd1277, %rd1271, 48; - cvta.to.local.u64 %rd183, %rd1277; - st.local.v4.u16 [%rd183], {%rs1623, %rs1623, %rs1623, %rs1623}; - add.s64 %rd1278, %rd1271, 56; - cvta.to.local.u64 %rd184, %rd1278; - st.local.v4.u16 [%rd184], {%rs1623, %rs1623, %rs1623, %rs1623}; - add.s64 %rd1279, %rd1271, 64; - cvta.to.local.u64 %rd185, %rd1279; - st.local.v4.u16 [%rd185], {%rs1623, %rs1623, %rs1623, %rs1623}; - add.s64 %rd1280, %rd1271, 72; - cvta.to.local.u64 %rd186, %rd1280; - st.local.v4.u16 [%rd186], {%rs1623, %rs1623, %rs1623, %rs1623}; - add.s64 %rd1281, %rd1271, 80; - cvta.to.local.u64 %rd187, %rd1281; - st.local.v4.u16 [%rd187], {%rs1623, %rs1623, %rs1623, %rs1623}; - add.s64 %rd1282, %rd1271, 88; - cvta.to.local.u64 %rd188, %rd1282; - st.local.v4.u16 [%rd188], {%rs1623, %rs1623, %rs1623, %rs1623}; - add.s64 %rd1283, %rd1271, 96; - cvta.to.local.u64 %rd189, %rd1283; - st.local.v4.u16 [%rd189], {%rs1623, %rs1623, %rs1623, %rs1623}; - add.s64 %rd190, %rd1271, 104; - cvta.to.local.u64 %rd191, %rd190; - st.local.u8 [%rd191], %rs1623; - @%p41 bra $L__BB1_109; - - cvta.to.local.u64 %rd192, %rd978; - shr.u64 %rd193, %rd11, 1; - setp.eq.s64 %p42, %rd193, 0; - @%p42 bra $L__BB1_71; - - mov.u64 %rd4081, 1; - mov.u64 %rd4079, %rd192; - mov.u64 %rd4080, %rd177; - bra.uni $L__BB1_69; - -$L__BB1_70: - ld.local.u16 %rs2, [%rd4079+4]; - add.s64 %rd4081, %rd4081, 1; - add.s64 %rd4080, %rd4080, 2; - add.s64 %rd4079, %rd4079, 2; - -$L__BB1_69: 
- st.local.u16 [%rd4080], %rs2; - setp.ge.u64 %p43, %rd4081, %rd193; - @%p43 bra $L__BB1_71; - bra.uni $L__BB1_70; - -$L__BB1_71: - and.b64 %rd201, %rd11, 1; - setp.eq.s64 %p44, %rd201, 0; - @%p44 bra $L__BB1_74; - - and.b64 %rd1288, %rd11, 65534; - cvta.to.local.u64 %rd1290, %rd1271; - add.s64 %rd202, %rd1290, %rd1288; - add.s64 %rd1291, %rd192, %rd1288; - add.s64 %rd203, %rd1291, 2; - mov.u64 %rd4082, 0; - -$L__BB1_73: - add.s64 %rd1292, %rd203, %rd4082; - ld.local.u8 %rs1624, [%rd1292]; - add.s64 %rd1293, %rd202, %rd4082; - st.local.u8 [%rd1293], %rs1624; - add.s64 %rd4082, %rd4082, 1; - setp.lt.u64 %p45, %rd4082, %rd201; - @%p45 bra $L__BB1_73; - -$L__BB1_74: - mov.u64 %rd1294, 0; - st.local.u8 [%rd191], %rs1; - ld.local.v4.u16 {%rs1625, %rs1626, %rs1627, %rs1628}, [%rd177]; - ld.local.v4.u16 {%rs1633, %rs1634, %rs1635, %rs1636}, [%rd178]; - ld.local.v4.u16 {%rs1641, %rs1642, %rs1643, %rs1644}, [%rd179]; - ld.local.v4.u16 {%rs1649, %rs1650, %rs1651, %rs1652}, [%rd180]; - ld.local.v4.u16 {%rs1657, %rs1658, %rs1659, %rs1660}, [%rd181]; - shr.u16 %rs1663, %rs1660, 8; - ld.local.v4.u16 {%rs1664, %rs1665, %rs1666, %rs1667}, [%rd182]; - ld.local.v4.u16 {%rs1672, %rs1673, %rs1674, %rs1675}, [%rd183]; - ld.local.v4.u16 {%rs1680, %rs1681, %rs1682, %rs1683}, [%rd184]; - ld.local.v4.u16 {%rs1688, %rs1689, %rs1690, %rs1691}, [%rd185]; - ld.local.v4.u16 {%rs1696, %rs1697, %rs1698, %rs1699}, [%rd186]; - ld.local.v4.u16 {%rs1704, %rs1705, %rs1706, %rs1707}, [%rd187]; - ld.local.v4.u16 {%rs1712, %rs1713, %rs1714, %rs1715}, [%rd188]; - ld.local.v4.u16 {%rs1720, %rs1721, %rs1722, %rs1723}, [%rd189]; - shr.u16 %rs1726, %rs1723, 8; - ld.local.v4.u16 {%rs1727, %rs1728, %rs1729, %rs1730}, [%rd191]; - and.b16 %rs1731, %rs1727, 255; - shr.u16 %rs1734, %rs1730, 8; - st.local.u64 [%rd1], %rd1294; - st.local.u64 [%rd1+8], %rd1294; - st.local.u64 [%rd1+16], %rd1294; - st.local.u64 [%rd1+24], %rd1294; - st.local.u64 [%rd1+32], %rd1294; - st.local.u64 [%rd1+40], %rd1294; - st.local.u64 
[%rd1+48], %rd1294; - st.local.u64 [%rd1+56], %rd1294; - st.local.u64 [%rd1+64], %rd1294; - st.local.u64 [%rd1+72], %rd1294; - st.local.u64 [%rd1+80], %rd1294; - st.local.u64 [%rd1+88], %rd1294; - st.local.u64 [%rd1+96], %rd1294; - st.local.u64 [%rd1+104], %rd1294; - st.local.u64 [%rd1+112], %rd1294; - st.local.u64 [%rd1+120], %rd1294; - st.local.u64 [%rd1+128], %rd1294; - st.local.u64 [%rd1+136], %rd1294; - st.local.u64 [%rd1+144], %rd1294; - st.local.u64 [%rd1+152], %rd1294; - st.local.u64 [%rd1+160], %rd1294; - st.local.u64 [%rd1+168], %rd1294; - st.local.u64 [%rd1+176], %rd1294; - st.local.u64 [%rd1+184], %rd1294; - st.local.u64 [%rd1+192], %rd1294; - st.local.v4.u16 [%rd1+200], {%rs1625, %rs1626, %rs1627, %rs1628}; - st.local.v4.u16 [%rd1+208], {%rs1633, %rs1634, %rs1635, %rs1636}; - st.local.v4.u16 [%rd1+216], {%rs1641, %rs1642, %rs1643, %rs1644}; - st.local.v4.u16 [%rd1+224], {%rs1649, %rs1650, %rs1651, %rs1652}; - st.local.v2.u16 [%rd1+232], {%rs1657, %rs1658}; - st.local.u16 [%rd1+236], %rs1659; - st.local.u8 [%rd1+238], %rs1660; - st.local.u8 [%rd1+239], %rs1663; - st.local.v4.u16 [%rd1+240], {%rs1664, %rs1665, %rs1666, %rs1667}; - st.local.v4.u16 [%rd1+248], {%rs1672, %rs1673, %rs1674, %rs1675}; - st.local.v4.u16 [%rd1+256], {%rs1680, %rs1681, %rs1682, %rs1683}; - st.local.v4.u16 [%rd1+264], {%rs1688, %rs1689, %rs1690, %rs1691}; - st.local.v4.u16 [%rd1+272], {%rs1696, %rs1697, %rs1698, %rs1699}; - st.local.v4.u16 [%rd1+280], {%rs1704, %rs1705, %rs1706, %rs1707}; - st.local.v4.u16 [%rd1+288], {%rs1712, %rs1713, %rs1714, %rs1715}; - st.local.v2.u16 [%rd1+296], {%rs1720, %rs1721}; - st.local.u16 [%rd1+300], %rs1722; - st.local.u8 [%rd1+302], %rs1723; - st.local.u8 [%rd1+303], %rs1726; - st.local.v2.u16 [%rd1+304], {%rs1727, %rs1728}; - st.local.u16 [%rd1+308], %rs1729; - st.local.u8 [%rd1+310], %rs1730; - st.local.u8 [%rd1+311], %rs1734; - setp.gt.u16 %p46, %rs1731, 104; - @%p46 bra $L__BB1_108; - - setp.eq.s16 %p47, %rs1731, 104; - @%p47 bra $L__BB1_106; - 
- cvt.u64.u16 %rd1296, %rs1727; - and.b64 %rd207, %rd1296, 255; - add.s64 %rd1297, %rd1, %rd207; - add.s64 %rd208, %rd1297, 200; - neg.s16 %rs1741, %rs1727; - and.b16 %rs91, %rs1741, 7; - setp.eq.s16 %p48, %rs91, 0; - mov.u64 %rd4089, %rd208; - @%p48 bra $L__BB1_79; - - cvt.u64.u16 %rd1298, %rs91; - neg.s64 %rd4083, %rd1298; - mov.u64 %rd4084, %rd208; - -$L__BB1_78: - .pragma "nounroll"; - add.s64 %rd4089, %rd4084, 1; - st.local.u8 [%rd4084], %rs1623; - add.s64 %rd4083, %rd4083, 1; - setp.ne.s64 %p49, %rd4083, 0; - mov.u64 %rd4084, %rd4089; - @%p49 bra $L__BB1_78; - -$L__BB1_79: - mov.u64 %rd1299, 103; - sub.s64 %rd1300, %rd1299, %rd207; - setp.lt.u64 %p50, %rd1300, 7; - @%p50 bra $L__BB1_86; - - add.s64 %rd1301, %rd1, 296; - sub.s64 %rd217, %rd1301, %rd4089; - shr.u64 %rd1302, %rd217, 3; - add.s64 %rd1303, %rd1302, 1; - and.b64 %rd218, %rd1303, 3; - setp.eq.s64 %p51, %rd218, 0; - mov.u64 %rd4092, %rd4089; - @%p51 bra $L__BB1_83; - - neg.s64 %rd4086, %rd218; - mov.u64 %rd4088, %rd4089; - -$L__BB1_82: - .pragma "nounroll"; - st.local.u8 [%rd4088], %rs1623; - st.local.u8 [%rd4088+1], %rs1623; - st.local.u8 [%rd4088+2], %rs1623; - st.local.u8 [%rd4088+3], %rs1623; - st.local.u8 [%rd4088+4], %rs1623; - st.local.u8 [%rd4088+5], %rs1623; - st.local.u8 [%rd4088+6], %rs1623; - add.s64 %rd4089, %rd4089, 8; - add.s64 %rd4092, %rd4088, 8; - st.local.u8 [%rd4088+7], %rs1623; - add.s64 %rd4086, %rd4086, 1; - setp.ne.s64 %p52, %rd4086, 0; - mov.u64 %rd4088, %rd4092; - @%p52 bra $L__BB1_82; - -$L__BB1_83: - setp.lt.u64 %p53, %rd217, 24; - @%p53 bra $L__BB1_86; - - sub.s64 %rd1304, %rd1, %rd4089; - add.s64 %rd4091, %rd1304, 304; - -$L__BB1_85: - st.local.u8 [%rd4092], %rs1623; - st.local.u8 [%rd4092+1], %rs1623; - st.local.u8 [%rd4092+2], %rs1623; - st.local.u8 [%rd4092+3], %rs1623; - st.local.u8 [%rd4092+4], %rs1623; - st.local.u8 [%rd4092+5], %rs1623; - st.local.u8 [%rd4092+6], %rs1623; - st.local.u8 [%rd4092+7], %rs1623; - st.local.u8 [%rd4092+8], %rs1623; - st.local.u8 
[%rd4092+9], %rs1623; - st.local.u8 [%rd4092+10], %rs1623; - st.local.u8 [%rd4092+11], %rs1623; - st.local.u8 [%rd4092+12], %rs1623; - st.local.u8 [%rd4092+13], %rs1623; - st.local.u8 [%rd4092+14], %rs1623; - st.local.u8 [%rd4092+15], %rs1623; - st.local.u8 [%rd4092+16], %rs1623; - st.local.u8 [%rd4092+17], %rs1623; - st.local.u8 [%rd4092+18], %rs1623; - st.local.u8 [%rd4092+19], %rs1623; - st.local.u8 [%rd4092+20], %rs1623; - st.local.u8 [%rd4092+21], %rs1623; - st.local.u8 [%rd4092+22], %rs1623; - st.local.u8 [%rd4092+23], %rs1623; - st.local.u8 [%rd4092+24], %rs1623; - st.local.u8 [%rd4092+25], %rs1623; - st.local.u8 [%rd4092+26], %rs1623; - st.local.u8 [%rd4092+27], %rs1623; - st.local.u8 [%rd4092+28], %rs1623; - st.local.u8 [%rd4092+29], %rs1623; - st.local.u8 [%rd4092+30], %rs1623; - st.local.u8 [%rd4092+31], %rs1623; - add.s64 %rd4091, %rd4091, -32; - setp.ne.s64 %p54, %rd4091, 0; - add.s64 %rd4092, %rd4092, 32; - @%p54 bra $L__BB1_85; - -$L__BB1_86: - st.local.u8 [%rd1+304], %rs1623; - setp.gt.u16 %p55, %rs1731, 103; - @%p55 bra $L__BB1_107; - - mov.u16 %rs1747, 6; - st.local.u8 [%rd208], %rs1747; - ld.local.u8 %rs1748, [%rd1+303]; - or.b16 %rs1749, %rs1748, 128; - st.local.u8 [%rd1+303], %rs1749; - ld.local.u64 %rd1305, [%rd1+200]; - shl.b64 %rd1306, %rd1305, 8; - mov.b64 {%r359, %r360}, %rd1306; - shr.u64 %rd1307, %rd1305, 56; - mov.b64 {%r361, %r362}, %rd1307; - mov.b32 {%rs100, %rs1750}, %r361; - mov.b32 {%rs96, %rs98}, %r360; - shr.u16 %rs99, %rs98, 8; - shr.u16 %rs97, %rs96, 8; - mov.b32 {%rs92, %rs94}, %r359; - shr.u16 %rs95, %rs94, 8; - shr.u16 %rs93, %rs92, 8; - mov.pred %p56, 0; - @%p56 bra $L__BB1_100; - - shl.b16 %rs1751, %rs94, 8; - or.b16 %rs1752, %rs93, %rs1751; - shl.b16 %rs1753, %rs96, 8; - or.b16 %rs1754, %rs95, %rs1753; - mov.b32 %r363, {%rs1752, %rs1754}; - shl.b16 %rs1755, %rs98, 8; - or.b16 %rs1756, %rs97, %rs1755; - shl.b16 %rs1757, %rs100, 8; - or.b16 %rs1758, %rs99, %rs1757; - mov.b32 %r364, {%rs1756, %rs1758}; - mov.b64 %rd1308, 
{%r363, %r364}; - ld.local.u64 %rd1309, [%rd1]; - xor.b64 %rd4125, %rd1309, %rd1308; - st.local.u64 [%rd1], %rd4125; - ld.local.u64 %rd1310, [%rd1+208]; - shl.b64 %rd1311, %rd1310, 8; - mov.b64 {%r365, %r366}, %rd1311; - shr.u64 %rd1312, %rd1310, 56; - mov.b64 {%r367, %r368}, %rd1312; - mov.b32 {%rs109, %rs1759}, %r367; - mov.b32 {%rs105, %rs107}, %r366; - shr.u16 %rs108, %rs107, 8; - shr.u16 %rs106, %rs105, 8; - mov.b32 {%rs101, %rs103}, %r365; - shr.u16 %rs104, %rs103, 8; - shr.u16 %rs102, %rs101, 8; - @%p56 bra $L__BB1_100; - - shl.b16 %rs1760, %rs103, 8; - or.b16 %rs1761, %rs102, %rs1760; - shl.b16 %rs1762, %rs105, 8; - or.b16 %rs1763, %rs104, %rs1762; - mov.b32 %r369, {%rs1761, %rs1763}; - shl.b16 %rs1764, %rs107, 8; - or.b16 %rs1765, %rs106, %rs1764; - shl.b16 %rs1766, %rs109, 8; - or.b16 %rs1767, %rs108, %rs1766; - mov.b32 %r370, {%rs1765, %rs1767}; - mov.b64 %rd1313, {%r369, %r370}; - ld.local.u64 %rd1314, [%rd1+8]; - xor.b64 %rd4124, %rd1314, %rd1313; - st.local.u64 [%rd1+8], %rd4124; - ld.local.u64 %rd1315, [%rd1+216]; - shl.b64 %rd1316, %rd1315, 8; - mov.b64 {%r371, %r372}, %rd1316; - shr.u64 %rd1317, %rd1315, 56; - mov.b64 {%r373, %r374}, %rd1317; - mov.b32 {%rs118, %rs1768}, %r373; - mov.b32 {%rs114, %rs116}, %r372; - shr.u16 %rs117, %rs116, 8; - shr.u16 %rs115, %rs114, 8; - mov.b32 {%rs110, %rs112}, %r371; - shr.u16 %rs113, %rs112, 8; - shr.u16 %rs111, %rs110, 8; - @%p56 bra $L__BB1_100; - - shl.b16 %rs1769, %rs112, 8; - or.b16 %rs1770, %rs111, %rs1769; - shl.b16 %rs1771, %rs114, 8; - or.b16 %rs1772, %rs113, %rs1771; - mov.b32 %r375, {%rs1770, %rs1772}; - shl.b16 %rs1773, %rs116, 8; - or.b16 %rs1774, %rs115, %rs1773; - shl.b16 %rs1775, %rs118, 8; - or.b16 %rs1776, %rs117, %rs1775; - mov.b32 %r376, {%rs1774, %rs1776}; - mov.b64 %rd1318, {%r375, %r376}; - ld.local.u64 %rd1319, [%rd1+16]; - xor.b64 %rd4123, %rd1319, %rd1318; - st.local.u64 [%rd1+16], %rd4123; - ld.local.u64 %rd1320, [%rd1+224]; - shl.b64 %rd1321, %rd1320, 8; - mov.b64 {%r377, %r378}, 
%rd1321; - shr.u64 %rd1322, %rd1320, 56; - mov.b64 {%r379, %r380}, %rd1322; - mov.b32 {%rs127, %rs1777}, %r379; - mov.b32 {%rs123, %rs125}, %r378; - shr.u16 %rs126, %rs125, 8; - shr.u16 %rs124, %rs123, 8; - mov.b32 {%rs119, %rs121}, %r377; - shr.u16 %rs122, %rs121, 8; - shr.u16 %rs120, %rs119, 8; - @%p56 bra $L__BB1_100; - - shl.b16 %rs1778, %rs121, 8; - or.b16 %rs1779, %rs120, %rs1778; - shl.b16 %rs1780, %rs123, 8; - or.b16 %rs1781, %rs122, %rs1780; - mov.b32 %r381, {%rs1779, %rs1781}; - shl.b16 %rs1782, %rs125, 8; - or.b16 %rs1783, %rs124, %rs1782; - shl.b16 %rs1784, %rs127, 8; - or.b16 %rs1785, %rs126, %rs1784; - mov.b32 %r382, {%rs1783, %rs1785}; - mov.b64 %rd1323, {%r381, %r382}; - ld.local.u64 %rd1324, [%rd1+24]; - xor.b64 %rd4122, %rd1324, %rd1323; - st.local.u64 [%rd1+24], %rd4122; - ld.local.u64 %rd1325, [%rd1+232]; - shl.b64 %rd1326, %rd1325, 8; - mov.b64 {%r383, %r384}, %rd1326; - shr.u64 %rd1327, %rd1325, 56; - mov.b64 {%r385, %r386}, %rd1327; - mov.b32 {%rs136, %rs1786}, %r385; - mov.b32 {%rs132, %rs134}, %r384; - shr.u16 %rs135, %rs134, 8; - shr.u16 %rs133, %rs132, 8; - mov.b32 {%rs128, %rs130}, %r383; - shr.u16 %rs131, %rs130, 8; - shr.u16 %rs129, %rs128, 8; - @%p56 bra $L__BB1_100; - - shl.b16 %rs1787, %rs130, 8; - or.b16 %rs1788, %rs129, %rs1787; - shl.b16 %rs1789, %rs132, 8; - or.b16 %rs1790, %rs131, %rs1789; - mov.b32 %r387, {%rs1788, %rs1790}; - shl.b16 %rs1791, %rs134, 8; - or.b16 %rs1792, %rs133, %rs1791; - shl.b16 %rs1793, %rs136, 8; - or.b16 %rs1794, %rs135, %rs1793; - mov.b32 %r388, {%rs1792, %rs1794}; - mov.b64 %rd1328, {%r387, %r388}; - ld.local.u64 %rd1329, [%rd1+32]; - xor.b64 %rd4121, %rd1329, %rd1328; - st.local.u64 [%rd1+32], %rd4121; - ld.local.u64 %rd1330, [%rd1+240]; - shl.b64 %rd1331, %rd1330, 8; - mov.b64 {%r389, %r390}, %rd1331; - shr.u64 %rd1332, %rd1330, 56; - mov.b64 {%r391, %r392}, %rd1332; - mov.b32 {%rs145, %rs1795}, %r391; - mov.b32 {%rs141, %rs143}, %r390; - shr.u16 %rs144, %rs143, 8; - shr.u16 %rs142, %rs141, 8; - 
mov.b32 {%rs137, %rs139}, %r389; - shr.u16 %rs140, %rs139, 8; - shr.u16 %rs138, %rs137, 8; - @%p56 bra $L__BB1_100; - - shl.b16 %rs1796, %rs139, 8; - or.b16 %rs1797, %rs138, %rs1796; - shl.b16 %rs1798, %rs141, 8; - or.b16 %rs1799, %rs140, %rs1798; - mov.b32 %r393, {%rs1797, %rs1799}; - shl.b16 %rs1800, %rs143, 8; - or.b16 %rs1801, %rs142, %rs1800; - shl.b16 %rs1802, %rs145, 8; - or.b16 %rs1803, %rs144, %rs1802; - mov.b32 %r394, {%rs1801, %rs1803}; - mov.b64 %rd1333, {%r393, %r394}; - ld.local.u64 %rd1334, [%rd1+40]; - xor.b64 %rd4120, %rd1334, %rd1333; - st.local.u64 [%rd1+40], %rd4120; - ld.local.u64 %rd1335, [%rd1+248]; - shl.b64 %rd1336, %rd1335, 8; - mov.b64 {%r395, %r396}, %rd1336; - shr.u64 %rd1337, %rd1335, 56; - mov.b64 {%r397, %r398}, %rd1337; - mov.b32 {%rs154, %rs1804}, %r397; - mov.b32 {%rs150, %rs152}, %r396; - shr.u16 %rs153, %rs152, 8; - shr.u16 %rs151, %rs150, 8; - mov.b32 {%rs146, %rs148}, %r395; - shr.u16 %rs149, %rs148, 8; - shr.u16 %rs147, %rs146, 8; - @%p56 bra $L__BB1_100; - - shl.b16 %rs1805, %rs148, 8; - or.b16 %rs1806, %rs147, %rs1805; - shl.b16 %rs1807, %rs150, 8; - or.b16 %rs1808, %rs149, %rs1807; - mov.b32 %r399, {%rs1806, %rs1808}; - shl.b16 %rs1809, %rs152, 8; - or.b16 %rs1810, %rs151, %rs1809; - shl.b16 %rs1811, %rs154, 8; - or.b16 %rs1812, %rs153, %rs1811; - mov.b32 %r400, {%rs1810, %rs1812}; - mov.b64 %rd1338, {%r399, %r400}; - ld.local.u64 %rd1339, [%rd1+48]; - xor.b64 %rd4113, %rd1339, %rd1338; - st.local.u64 [%rd1+48], %rd4113; - ld.local.u64 %rd1340, [%rd1+256]; - shl.b64 %rd1341, %rd1340, 8; - mov.b64 {%r401, %r402}, %rd1341; - shr.u64 %rd1342, %rd1340, 56; - mov.b64 {%r403, %r404}, %rd1342; - mov.b32 {%rs163, %rs1813}, %r403; - mov.b32 {%rs159, %rs161}, %r402; - shr.u16 %rs162, %rs161, 8; - shr.u16 %rs160, %rs159, 8; - mov.b32 {%rs155, %rs157}, %r401; - shr.u16 %rs158, %rs157, 8; - shr.u16 %rs156, %rs155, 8; - @%p56 bra $L__BB1_100; - - shl.b16 %rs1814, %rs157, 8; - or.b16 %rs1815, %rs156, %rs1814; - shl.b16 %rs1816, %rs159, 
8; - or.b16 %rs1817, %rs158, %rs1816; - mov.b32 %r405, {%rs1815, %rs1817}; - shl.b16 %rs1818, %rs161, 8; - or.b16 %rs1819, %rs160, %rs1818; - shl.b16 %rs1820, %rs163, 8; - or.b16 %rs1821, %rs162, %rs1820; - mov.b32 %r406, {%rs1819, %rs1821}; - mov.b64 %rd1343, {%r405, %r406}; - ld.local.u64 %rd1344, [%rd1+56]; - xor.b64 %rd4109, %rd1344, %rd1343; - st.local.u64 [%rd1+56], %rd4109; - ld.local.u64 %rd1345, [%rd1+264]; - shl.b64 %rd1346, %rd1345, 8; - mov.b64 {%r407, %r408}, %rd1346; - shr.u64 %rd1347, %rd1345, 56; - mov.b64 {%r409, %r410}, %rd1347; - mov.b32 {%rs172, %rs1822}, %r409; - mov.b32 {%rs168, %rs170}, %r408; - shr.u16 %rs171, %rs170, 8; - shr.u16 %rs169, %rs168, 8; - mov.b32 {%rs164, %rs166}, %r407; - shr.u16 %rs167, %rs166, 8; - shr.u16 %rs165, %rs164, 8; - @%p56 bra $L__BB1_100; - - shl.b16 %rs1823, %rs166, 8; - or.b16 %rs1824, %rs165, %rs1823; - shl.b16 %rs1825, %rs168, 8; - or.b16 %rs1826, %rs167, %rs1825; - mov.b32 %r411, {%rs1824, %rs1826}; - shl.b16 %rs1827, %rs170, 8; - or.b16 %rs1828, %rs169, %rs1827; - shl.b16 %rs1829, %rs172, 8; - or.b16 %rs1830, %rs171, %rs1829; - mov.b32 %r412, {%rs1828, %rs1830}; - mov.b64 %rd1348, {%r411, %r412}; - ld.local.u64 %rd1349, [%rd1+64]; - xor.b64 %rd4105, %rd1349, %rd1348; - st.local.u64 [%rd1+64], %rd4105; - ld.local.u64 %rd1350, [%rd1+272]; - shl.b64 %rd1351, %rd1350, 8; - mov.b64 {%r413, %r414}, %rd1351; - shr.u64 %rd1352, %rd1350, 56; - mov.b64 {%r415, %r416}, %rd1352; - mov.b32 {%rs181, %rs1831}, %r415; - mov.b32 {%rs177, %rs179}, %r414; - shr.u16 %rs180, %rs179, 8; - shr.u16 %rs178, %rs177, 8; - mov.b32 {%rs173, %rs175}, %r413; - shr.u16 %rs176, %rs175, 8; - shr.u16 %rs174, %rs173, 8; - @%p56 bra $L__BB1_100; - - shl.b16 %rs1832, %rs175, 8; - or.b16 %rs1833, %rs174, %rs1832; - shl.b16 %rs1834, %rs177, 8; - or.b16 %rs1835, %rs176, %rs1834; - mov.b32 %r417, {%rs1833, %rs1835}; - shl.b16 %rs1836, %rs179, 8; - or.b16 %rs1837, %rs178, %rs1836; - shl.b16 %rs1838, %rs181, 8; - or.b16 %rs1839, %rs180, %rs1838; - 
mov.b32 %r418, {%rs1837, %rs1839}; - mov.b64 %rd1353, {%r417, %r418}; - ld.local.u64 %rd1354, [%rd1+72]; - xor.b64 %rd4101, %rd1354, %rd1353; - st.local.u64 [%rd1+72], %rd4101; - ld.local.u64 %rd1355, [%rd1+280]; - shl.b64 %rd1356, %rd1355, 8; - mov.b64 {%r419, %r420}, %rd1356; - shr.u64 %rd1357, %rd1355, 56; - mov.b64 {%r421, %r422}, %rd1357; - mov.b32 {%rs190, %rs1840}, %r421; - mov.b32 {%rs186, %rs188}, %r420; - shr.u16 %rs189, %rs188, 8; - shr.u16 %rs187, %rs186, 8; - mov.b32 {%rs182, %rs184}, %r419; - shr.u16 %rs185, %rs184, 8; - shr.u16 %rs183, %rs182, 8; - @%p56 bra $L__BB1_100; - - shl.b16 %rs1841, %rs184, 8; - or.b16 %rs1842, %rs183, %rs1841; - shl.b16 %rs1843, %rs186, 8; - or.b16 %rs1844, %rs185, %rs1843; - mov.b32 %r423, {%rs1842, %rs1844}; - shl.b16 %rs1845, %rs188, 8; - or.b16 %rs1846, %rs187, %rs1845; - shl.b16 %rs1847, %rs190, 8; - or.b16 %rs1848, %rs189, %rs1847; - mov.b32 %r424, {%rs1846, %rs1848}; - mov.b64 %rd1358, {%r423, %r424}; - ld.local.u64 %rd1359, [%rd1+80]; - xor.b64 %rd4116, %rd1359, %rd1358; - st.local.u64 [%rd1+80], %rd4116; - ld.local.u64 %rd1360, [%rd1+288]; - shl.b64 %rd1361, %rd1360, 8; - mov.b64 {%r425, %r426}, %rd1361; - shr.u64 %rd1362, %rd1360, 56; - mov.b64 {%r427, %r428}, %rd1362; - mov.b32 {%rs199, %rs1849}, %r427; - mov.b32 {%rs195, %rs197}, %r426; - shr.u16 %rs198, %rs197, 8; - shr.u16 %rs196, %rs195, 8; - mov.b32 {%rs191, %rs193}, %r425; - shr.u16 %rs194, %rs193, 8; - shr.u16 %rs192, %rs191, 8; - @%p56 bra $L__BB1_100; - - shl.b16 %rs1850, %rs193, 8; - or.b16 %rs1851, %rs192, %rs1850; - shl.b16 %rs1852, %rs195, 8; - or.b16 %rs1853, %rs194, %rs1852; - mov.b32 %r429, {%rs1851, %rs1853}; - shl.b16 %rs1854, %rs197, 8; - or.b16 %rs1855, %rs196, %rs1854; - shl.b16 %rs1856, %rs199, 8; - or.b16 %rs1857, %rs198, %rs1856; - mov.b32 %r430, {%rs1855, %rs1857}; - mov.b64 %rd1363, {%r429, %r430}; - ld.local.u64 %rd1364, [%rd1+88]; - xor.b64 %rd4112, %rd1364, %rd1363; - st.local.u64 [%rd1+88], %rd4112; - ld.local.u64 %rd1365, 
[%rd1+296]; - shl.b64 %rd1366, %rd1365, 8; - mov.b64 {%r431, %r432}, %rd1366; - shr.u64 %rd1367, %rd1365, 56; - mov.b64 {%r433, %r434}, %rd1367; - mov.b32 {%rs208, %rs1858}, %r433; - mov.b32 {%rs204, %rs206}, %r432; - shr.u16 %rs207, %rs206, 8; - shr.u16 %rs205, %rs204, 8; - mov.b32 {%rs200, %rs202}, %r431; - shr.u16 %rs203, %rs202, 8; - shr.u16 %rs201, %rs200, 8; - mov.pred %p68, -1; - @%p68 bra $L__BB1_101; - bra.uni $L__BB1_100; - -$L__BB1_101: - shl.b16 %rs1859, %rs202, 8; - or.b16 %rs1860, %rs201, %rs1859; - shl.b16 %rs1861, %rs204, 8; - or.b16 %rs1862, %rs203, %rs1861; - mov.b32 %r435, {%rs1860, %rs1862}; - shl.b16 %rs1863, %rs206, 8; - or.b16 %rs1864, %rs205, %rs1863; - shl.b16 %rs1865, %rs208, 8; - or.b16 %rs1866, %rs207, %rs1865; - mov.b32 %r436, {%rs1864, %rs1866}; - mov.b64 %rd1368, {%r435, %r436}; - ld.local.u64 %rd1369, [%rd1+96]; - xor.b64 %rd4108, %rd1369, %rd1368; - st.local.u64 [%rd1+96], %rd4108; - @%p56 bra $L__BB1_105; - - add.s64 %rd1373, %rd968, 40; - cvta.to.local.u64 %rd247, %rd1373; - add.s64 %rd1374, %rd968, 80; - cvta.to.local.u64 %rd248, %rd1374; - add.s64 %rd1375, %rd968, 120; - cvta.to.local.u64 %rd249, %rd1375; - add.s64 %rd1376, %rd968, 160; - cvta.to.local.u64 %rd250, %rd1376; - add.s64 %rd1377, %rd968, 8; - cvta.to.local.u64 %rd251, %rd1377; - add.s64 %rd1378, %rd968, 48; - cvta.to.local.u64 %rd252, %rd1378; - add.s64 %rd1379, %rd968, 88; - cvta.to.local.u64 %rd253, %rd1379; - add.s64 %rd1380, %rd968, 128; - cvta.to.local.u64 %rd254, %rd1380; - add.s64 %rd1381, %rd968, 168; - cvta.to.local.u64 %rd255, %rd1381; - add.s64 %rd1382, %rd968, 16; - cvta.to.local.u64 %rd256, %rd1382; - add.s64 %rd1383, %rd968, 56; - cvta.to.local.u64 %rd257, %rd1383; - add.s64 %rd1384, %rd968, 96; - cvta.to.local.u64 %rd258, %rd1384; - add.s64 %rd1385, %rd968, 136; - cvta.to.local.u64 %rd259, %rd1385; - add.s64 %rd1386, %rd968, 176; - cvta.to.local.u64 %rd260, %rd1386; - add.s64 %rd1387, %rd968, 24; - cvta.to.local.u64 %rd261, %rd1387; - add.s64 %rd1388, 
%rd968, 64; - cvta.to.local.u64 %rd262, %rd1388; - add.s64 %rd1389, %rd968, 104; - cvta.to.local.u64 %rd263, %rd1389; - add.s64 %rd1390, %rd968, 144; - cvta.to.local.u64 %rd264, %rd1390; - add.s64 %rd1391, %rd968, 184; - cvta.to.local.u64 %rd265, %rd1391; - add.s64 %rd1392, %rd968, 32; - cvta.to.local.u64 %rd266, %rd1392; - add.s64 %rd1393, %rd968, 72; - cvta.to.local.u64 %rd267, %rd1393; - add.s64 %rd1394, %rd968, 112; - cvta.to.local.u64 %rd268, %rd1394; - add.s64 %rd1395, %rd968, 152; - cvta.to.local.u64 %rd269, %rd1395; - add.s64 %rd1396, %rd968, 192; - mov.u64 %rd4093, 192; - cvta.to.local.u64 %rd270, %rd1396; - ld.local.u64 %rd4115, [%rd249]; - ld.local.u64 %rd4114, [%rd250]; - ld.local.u64 %rd4111, [%rd254]; - ld.local.u64 %rd4110, [%rd255]; - ld.local.u64 %rd4107, [%rd259]; - ld.local.u64 %rd4106, [%rd260]; - ld.local.u64 %rd4104, [%rd263]; - ld.local.u64 %rd4103, [%rd264]; - ld.local.u64 %rd4102, [%rd265]; - ld.local.u64 %rd4100, [%rd268]; - ld.local.u64 %rd4099, [%rd269]; - ld.local.u64 %rd4098, [%rd270]; - mov.u64 %rd4119, private$9214; - -$L__BB1_103: - add.s64 %rd310, %rd4119, 8; - xor.b64 %rd1397, %rd4115, %rd4114; - xor.b64 %rd1398, %rd1397, %rd4116; - xor.b64 %rd1399, %rd1398, %rd4120; - xor.b64 %rd1400, %rd1399, %rd4125; - xor.b64 %rd1401, %rd4110, %rd4124; - xor.b64 %rd1402, %rd1401, %rd4111; - xor.b64 %rd1403, %rd1402, %rd4112; - xor.b64 %rd1404, %rd1403, %rd4113; - xor.b64 %rd1405, %rd4106, %rd4123; - xor.b64 %rd1406, %rd1405, %rd4107; - xor.b64 %rd1407, %rd1406, %rd4108; - xor.b64 %rd1408, %rd1407, %rd4109; - xor.b64 %rd1409, %rd4102, %rd4122; - xor.b64 %rd1410, %rd1409, %rd4103; - xor.b64 %rd1411, %rd1410, %rd4104; - xor.b64 %rd1412, %rd1411, %rd4105; - xor.b64 %rd1413, %rd4098, %rd4121; - xor.b64 %rd1414, %rd1413, %rd4099; - xor.b64 %rd1415, %rd1414, %rd4100; - xor.b64 %rd1416, %rd1415, %rd4101; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1404, 1; - shr.b64 %rhs, %rd1404, 63; - add.u64 %rd1417, %lhs, %rhs; - } - xor.b64 
%rd1418, %rd1417, %rd1416; - xor.b64 %rd1419, %rd4125, %rd1418; - xor.b64 %rd1420, %rd1418, %rd4120; - xor.b64 %rd1421, %rd1418, %rd4116; - xor.b64 %rd1422, %rd1418, %rd4115; - xor.b64 %rd1423, %rd1418, %rd4114; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1408, 1; - shr.b64 %rhs, %rd1408, 63; - add.u64 %rd1424, %lhs, %rhs; - } - xor.b64 %rd1425, %rd1400, %rd1424; - xor.b64 %rd1426, %rd1425, %rd4124; - xor.b64 %rd1427, %rd1425, %rd4113; - xor.b64 %rd1428, %rd1425, %rd4112; - xor.b64 %rd1429, %rd1425, %rd4111; - xor.b64 %rd1430, %rd1425, %rd4110; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1412, 1; - shr.b64 %rhs, %rd1412, 63; - add.u64 %rd1431, %lhs, %rhs; - } - xor.b64 %rd1432, %rd1404, %rd1431; - xor.b64 %rd1433, %rd1432, %rd4123; - xor.b64 %rd1434, %rd1432, %rd4109; - xor.b64 %rd1435, %rd1432, %rd4108; - xor.b64 %rd1436, %rd1432, %rd4107; - xor.b64 %rd1437, %rd1432, %rd4106; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1416, 1; - shr.b64 %rhs, %rd1416, 63; - add.u64 %rd1438, %lhs, %rhs; - } - xor.b64 %rd1439, %rd1408, %rd1438; - xor.b64 %rd1440, %rd1439, %rd4122; - xor.b64 %rd1441, %rd1439, %rd4105; - xor.b64 %rd1442, %rd1439, %rd4104; - xor.b64 %rd1443, %rd1439, %rd4103; - xor.b64 %rd1444, %rd1439, %rd4102; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1400, 1; - shr.b64 %rhs, %rd1400, 63; - add.u64 %rd1445, %lhs, %rhs; - } - xor.b64 %rd1446, %rd1445, %rd1412; - xor.b64 %rd1447, %rd1446, %rd4121; - xor.b64 %rd1448, %rd1446, %rd4101; - xor.b64 %rd1449, %rd1446, %rd4100; - xor.b64 %rd1450, %rd1446, %rd4099; - xor.b64 %rd1451, %rd1446, %rd4098; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1426, 1; - shr.b64 %rhs, %rd1426, 63; - add.u64 %rd1452, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1421, 3; - shr.b64 %rhs, %rd1421, 61; - add.u64 %rd1453, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1434, 6; - shr.b64 %rhs, %rd1434, 58; - add.u64 
%rd1454, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1428, 10; - shr.b64 %rhs, %rd1428, 54; - add.u64 %rd1455, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1436, 15; - shr.b64 %rhs, %rd1436, 49; - add.u64 %rd1456, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1443, 21; - shr.b64 %rhs, %rd1443, 43; - add.u64 %rd1457, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1440, 28; - shr.b64 %rhs, %rd1440, 36; - add.u64 %rd1458, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1420, 36; - shr.b64 %rhs, %rd1420, 28; - add.u64 %rd1459, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1429, 45; - shr.b64 %rhs, %rd1429, 19; - add.u64 %rd1460, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1441, 55; - shr.b64 %rhs, %rd1441, 9; - add.u64 %rd1461, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1430, 2; - shr.b64 %rhs, %rd1430, 62; - add.u64 %rd1462, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1451, 14; - shr.b64 %rhs, %rd1451, 50; - add.u64 %rd1463, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1447, 27; - shr.b64 %rhs, %rd1447, 37; - add.u64 %rd1464, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1422, 41; - shr.b64 %rhs, %rd1422, 23; - add.u64 %rd1465, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1444, 56; - shr.b64 %rhs, %rd1444, 8; - add.u64 %rd1466, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1450, 8; - shr.b64 %rhs, %rd1450, 56; - add.u64 %rd1467, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1442, 25; - shr.b64 %rhs, %rd1442, 39; - add.u64 %rd1468, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1435, 43; - shr.b64 %rhs, %rd1435, 21; - add.u64 %rd1469, 
%lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1433, 62; - shr.b64 %rhs, %rd1433, 2; - add.u64 %rd1470, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1423, 18; - shr.b64 %rhs, %rd1423, 46; - add.u64 %rd1471, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1449, 39; - shr.b64 %rhs, %rd1449, 25; - add.u64 %rd1472, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1437, 61; - shr.b64 %rhs, %rd1437, 3; - add.u64 %rd1473, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1448, 20; - shr.b64 %rhs, %rd1448, 44; - add.u64 %rd1474, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1427, 44; - shr.b64 %rhs, %rd1427, 20; - add.u64 %rd1475, %lhs, %rhs; - } - not.b64 %rd1476, %rd1475; - and.b64 %rd1477, %rd1469, %rd1476; - not.b64 %rd1478, %rd1469; - and.b64 %rd1479, %rd1457, %rd1478; - xor.b64 %rd4124, %rd1475, %rd1479; - not.b64 %rd1480, %rd1457; - and.b64 %rd1481, %rd1463, %rd1480; - xor.b64 %rd4123, %rd1481, %rd1469; - not.b64 %rd1482, %rd1463; - and.b64 %rd1483, %rd1419, %rd1482; - xor.b64 %rd4122, %rd1483, %rd1457; - not.b64 %rd1484, %rd1419; - and.b64 %rd1485, %rd1475, %rd1484; - xor.b64 %rd4121, %rd1485, %rd1463; - not.b64 %rd1486, %rd1474; - and.b64 %rd1487, %rd1453, %rd1486; - xor.b64 %rd4120, %rd1487, %rd1458; - not.b64 %rd1488, %rd1453; - and.b64 %rd1489, %rd1460, %rd1488; - xor.b64 %rd4113, %rd1489, %rd1474; - not.b64 %rd1490, %rd1460; - and.b64 %rd1491, %rd1473, %rd1490; - xor.b64 %rd4109, %rd1491, %rd1453; - not.b64 %rd1492, %rd1473; - and.b64 %rd1493, %rd1458, %rd1492; - xor.b64 %rd4105, %rd1460, %rd1493; - not.b64 %rd1494, %rd1458; - and.b64 %rd1495, %rd1474, %rd1494; - xor.b64 %rd4101, %rd1495, %rd1473; - not.b64 %rd1496, %rd1454; - and.b64 %rd1497, %rd1468, %rd1496; - xor.b64 %rd4116, %rd1452, %rd1497; - not.b64 %rd1498, %rd1468; - and.b64 %rd1499, %rd1467, %rd1498; - xor.b64 %rd4112, %rd1499, %rd1454; 
- not.b64 %rd1500, %rd1467; - and.b64 %rd1501, %rd1471, %rd1500; - xor.b64 %rd4108, %rd1501, %rd1468; - not.b64 %rd1502, %rd1471; - and.b64 %rd1503, %rd1452, %rd1502; - xor.b64 %rd4104, %rd1503, %rd1467; - not.b64 %rd1504, %rd1452; - and.b64 %rd1505, %rd1454, %rd1504; - xor.b64 %rd4100, %rd1505, %rd1471; - not.b64 %rd1506, %rd1459; - and.b64 %rd1507, %rd1455, %rd1506; - xor.b64 %rd4115, %rd1507, %rd1464; - not.b64 %rd1508, %rd1455; - and.b64 %rd1509, %rd1456, %rd1508; - xor.b64 %rd4111, %rd1509, %rd1459; - not.b64 %rd1510, %rd1456; - and.b64 %rd1511, %rd1466, %rd1510; - xor.b64 %rd4107, %rd1455, %rd1511; - not.b64 %rd1512, %rd1466; - and.b64 %rd1513, %rd1464, %rd1512; - xor.b64 %rd4103, %rd1513, %rd1456; - not.b64 %rd1514, %rd1464; - and.b64 %rd1515, %rd1459, %rd1514; - xor.b64 %rd4099, %rd1515, %rd1466; - not.b64 %rd1516, %rd1461; - and.b64 %rd1517, %rd1472, %rd1516; - xor.b64 %rd4114, %rd1517, %rd1470; - not.b64 %rd1518, %rd1472; - and.b64 %rd1519, %rd1465, %rd1518; - xor.b64 %rd4110, %rd1519, %rd1461; - not.b64 %rd1520, %rd1465; - and.b64 %rd1521, %rd1462, %rd1520; - xor.b64 %rd4106, %rd1521, %rd1472; - not.b64 %rd1522, %rd1462; - and.b64 %rd1523, %rd1470, %rd1522; - xor.b64 %rd4102, %rd1523, %rd1465; - not.b64 %rd1524, %rd1470; - and.b64 %rd1525, %rd1461, %rd1524; - xor.b64 %rd4098, %rd1462, %rd1525; - ld.global.nc.u64 %rd1526, [%rd4119]; - xor.b64 %rd1527, %rd1526, %rd1419; - xor.b64 %rd4125, %rd1527, %rd1477; - add.s64 %rd4093, %rd4093, -8; - setp.ne.s64 %p70, %rd4093, 0; - mov.u64 %rd4119, %rd310; - @%p70 bra $L__BB1_103; - - st.local.u64 [%rd255], %rd4110; - st.local.u64 [%rd270], %rd4098; - st.local.u64 [%rd265], %rd4102; - st.local.u64 [%rd256], %rd4123; - st.local.u64 [%rd261], %rd4122; - st.local.u64 [%rd266], %rd4121; - st.local.u64 [%rd247], %rd4120; - st.local.u64 [%rd252], %rd4113; - st.local.u64 [%rd257], %rd4109; - st.local.u64 [%rd262], %rd4105; - st.local.u64 [%rd267], %rd4101; - st.local.u64 [%rd248], %rd4116; - st.local.u64 [%rd253], %rd4112; 
- st.local.u64 [%rd258], %rd4108; - st.local.u64 [%rd263], %rd4104; - st.local.u64 [%rd268], %rd4100; - st.local.u64 [%rd249], %rd4115; - st.local.u64 [%rd254], %rd4111; - st.local.u64 [%rd259], %rd4107; - st.local.u64 [%rd264], %rd4103; - st.local.u64 [%rd269], %rd4099; - st.local.u64 [%rd250], %rd4114; - st.local.u64 [%rd260], %rd4106; - st.local.u64 [%rd251], %rd4124; - st.local.u64 [%rd1], %rd4125; - -$L__BB1_105: - shr.u64 %rd1528, %rd4123, 8; - shr.u64 %rd1529, %rd4123, 16; - shr.u64 %rd1530, %rd4123, 24; - shr.u64 %rd1531, %rd4123, 32; - shr.u64 %rd1532, %rd4123, 40; - shr.u64 %rd1533, %rd4123, 48; - shr.u64 %rd1534, %rd4123, 56; - shr.u64 %rd1535, %rd4122, 8; - shr.u64 %rd1536, %rd4122, 16; - shr.u64 %rd1537, %rd4122, 24; - shr.u64 %rd1538, %rd4122, 32; - shr.u64 %rd1539, %rd4122, 40; - shr.u64 %rd1540, %rd4122, 48; - shr.u64 %rd1541, %rd4122, 56; - shr.u64 %rd1542, %rd4121, 8; - shr.u64 %rd1543, %rd4121, 16; - shr.u64 %rd1544, %rd4121, 24; - shr.u64 %rd1545, %rd4121, 32; - shr.u64 %rd1546, %rd4121, 40; - shr.u64 %rd1547, %rd4121, 48; - shr.u64 %rd1548, %rd4121, 56; - shr.u64 %rd1549, %rd4120, 8; - shr.u64 %rd1550, %rd4120, 16; - shr.u64 %rd1551, %rd4120, 24; - shr.u64 %rd1552, %rd4120, 32; - shr.u64 %rd1553, %rd4120, 40; - shr.u64 %rd1554, %rd4120, 48; - shr.u64 %rd1555, %rd4120, 56; - shr.u64 %rd1556, %rd4125, 8; - shr.u64 %rd1557, %rd4125, 16; - shr.u64 %rd1558, %rd4125, 24; - shr.u64 %rd1559, %rd4125, 32; - shr.u64 %rd1560, %rd4125, 40; - shr.u64 %rd1561, %rd4125, 48; - shr.u64 %rd1562, %rd4125, 56; - shr.u64 %rd1563, %rd4124, 8; - shr.u64 %rd1564, %rd4124, 16; - shr.u64 %rd1565, %rd4124, 24; - shr.u64 %rd1566, %rd4124, 32; - shr.u64 %rd1567, %rd4124, 40; - shr.u64 %rd1568, %rd4124, 48; - shr.u64 %rd1569, %rd4124, 56; - mov.u16 %rs1867, 48; - st.local.u16 [%rd12], %rs1867; - cvt.u16.u64 %rs1868, %rd4125; - cvt.u16.u64 %rs1869, %rd1556; - st.local.v2.u8 [%rd12+2], {%rs1868, %rs1869}; - cvt.u16.u64 %rs1870, %rd1558; - cvt.u16.u64 %rs1871, %rd1557; - 
st.local.v2.u8 [%rd12+4], {%rs1871, %rs1870}; - cvt.u16.u64 %rs1872, %rd1560; - cvt.u16.u64 %rs1873, %rd1559; - st.local.v2.u8 [%rd12+6], {%rs1873, %rs1872}; - cvt.u16.u64 %rs1874, %rd1562; - cvt.u16.u64 %rs1875, %rd1561; - st.local.v2.u8 [%rd12+8], {%rs1875, %rs1874}; - cvt.u16.u64 %rs1876, %rd4124; - cvt.u16.u64 %rs1877, %rd1563; - st.local.v2.u8 [%rd12+10], {%rs1876, %rs1877}; - cvt.u16.u64 %rs1878, %rd1565; - cvt.u16.u64 %rs1879, %rd1564; - st.local.v2.u8 [%rd12+12], {%rs1879, %rs1878}; - cvt.u16.u64 %rs1880, %rd1567; - cvt.u16.u64 %rs1881, %rd1566; - st.local.v2.u8 [%rd12+14], {%rs1881, %rs1880}; - cvt.u16.u64 %rs1882, %rd1569; - cvt.u16.u64 %rs1883, %rd1568; - st.local.v2.u8 [%rd12+16], {%rs1883, %rs1882}; - cvt.u16.u64 %rs1884, %rd4123; - cvt.u16.u64 %rs1885, %rd1528; - st.local.v2.u8 [%rd12+18], {%rs1884, %rs1885}; - cvt.u16.u64 %rs1886, %rd1530; - cvt.u16.u64 %rs1887, %rd1529; - st.local.v2.u8 [%rd12+20], {%rs1887, %rs1886}; - cvt.u16.u64 %rs1888, %rd1532; - cvt.u16.u64 %rs1889, %rd1531; - st.local.v2.u8 [%rd12+22], {%rs1889, %rs1888}; - cvt.u16.u64 %rs1890, %rd1534; - cvt.u16.u64 %rs1891, %rd1533; - st.local.v2.u8 [%rd12+24], {%rs1891, %rs1890}; - cvt.u16.u64 %rs1892, %rd4122; - cvt.u16.u64 %rs1893, %rd1535; - st.local.v2.u8 [%rd12+26], {%rs1892, %rs1893}; - cvt.u16.u64 %rs1894, %rd1537; - cvt.u16.u64 %rs1895, %rd1536; - st.local.v2.u8 [%rd12+28], {%rs1895, %rs1894}; - cvt.u16.u64 %rs1896, %rd1539; - cvt.u16.u64 %rs1897, %rd1538; - st.local.v2.u8 [%rd12+30], {%rs1897, %rs1896}; - cvt.u16.u64 %rs1898, %rd1541; - cvt.u16.u64 %rs1899, %rd1540; - st.local.v2.u8 [%rd12+32], {%rs1899, %rs1898}; - cvt.u16.u64 %rs1900, %rd4121; - cvt.u16.u64 %rs1901, %rd1542; - st.local.v2.u8 [%rd12+34], {%rs1900, %rs1901}; - cvt.u16.u64 %rs1902, %rd1544; - cvt.u16.u64 %rs1903, %rd1543; - st.local.v2.u8 [%rd12+36], {%rs1903, %rs1902}; - cvt.u16.u64 %rs1904, %rd1546; - cvt.u16.u64 %rs1905, %rd1545; - st.local.v2.u8 [%rd12+38], {%rs1905, %rs1904}; - cvt.u16.u64 %rs1906, %rd1548; - 
cvt.u16.u64 %rs1907, %rd1547; - st.local.v2.u8 [%rd12+40], {%rs1907, %rs1906}; - cvt.u16.u64 %rs1908, %rd4120; - cvt.u16.u64 %rs1909, %rd1549; - st.local.v2.u8 [%rd12+42], {%rs1908, %rs1909}; - cvt.u16.u64 %rs1910, %rd1551; - cvt.u16.u64 %rs1911, %rd1550; - st.local.v2.u8 [%rd12+44], {%rs1911, %rs1910}; - cvt.u16.u64 %rs1912, %rd1553; - cvt.u16.u64 %rs1913, %rd1552; - st.local.v2.u8 [%rd12+46], {%rs1913, %rs1912}; - cvt.u16.u64 %rs1914, %rd1555; - cvt.u16.u64 %rs1915, %rd1554; - st.local.v2.u8 [%rd12+48], {%rs1915, %rs1914}; - st.local.v2.u8 [%rd12+50], {%rs1623, %rs1623}; - st.local.v2.u8 [%rd12+52], {%rs1623, %rs1623}; - st.local.v2.u8 [%rd12+54], {%rs1623, %rs1623}; - st.local.v2.u8 [%rd12+56], {%rs1623, %rs1623}; - st.local.v2.u8 [%rd12+58], {%rs1623, %rs1623}; - st.local.v2.u8 [%rd12+60], {%rs1623, %rs1623}; - st.local.v2.u8 [%rd12+62], {%rs1623, %rs1623}; - st.local.v2.u8 [%rd12+64], {%rs1623, %rs1623}; - bra.uni $L__BB1_549; - -$L__BB1_110: - setp.gt.u16 %p71, %rs1, 10; - add.u64 %rd1570, %SP, 352; - add.u64 %rd343, %SPL, 352; - mov.u16 %rs1918, 0; - st.local.v4.u16 [%rd343], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1571, %rd1570, 8; - cvta.to.local.u64 %rd344, %rd1571; - st.local.v4.u16 [%rd344], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1572, %rd1570, 16; - cvta.to.local.u64 %rd345, %rd1572; - st.local.v4.u16 [%rd345], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1573, %rd1570, 24; - cvta.to.local.u64 %rd346, %rd1573; - st.local.v4.u16 [%rd346], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1574, %rd1570, 32; - cvta.to.local.u64 %rd347, %rd1574; - st.local.v4.u16 [%rd347], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1575, %rd1570, 40; - cvta.to.local.u64 %rd348, %rd1575; - st.local.v4.u16 [%rd348], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1576, %rd1570, 48; - cvta.to.local.u64 %rd349, %rd1576; - st.local.v4.u16 [%rd349], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1577, %rd1570, 56; - cvta.to.local.u64 
%rd350, %rd1577; - st.local.v4.u16 [%rd350], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1578, %rd1570, 64; - cvta.to.local.u64 %rd351, %rd1578; - st.local.v4.u16 [%rd351], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1579, %rd1570, 72; - cvta.to.local.u64 %rd352, %rd1579; - st.local.v4.u16 [%rd352], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1580, %rd1570, 80; - cvta.to.local.u64 %rd353, %rd1580; - st.local.v4.u16 [%rd353], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1581, %rd1570, 88; - cvta.to.local.u64 %rd354, %rd1581; - st.local.v4.u16 [%rd354], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1582, %rd1570, 96; - cvta.to.local.u64 %rd355, %rd1582; - st.local.v4.u16 [%rd355], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1583, %rd1570, 104; - cvta.to.local.u64 %rd356, %rd1583; - st.local.v4.u16 [%rd356], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1584, %rd1570, 112; - cvta.to.local.u64 %rd357, %rd1584; - st.local.v4.u16 [%rd357], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1585, %rd1570, 120; - cvta.to.local.u64 %rd358, %rd1585; - st.local.v4.u16 [%rd358], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd1586, %rd1570, 128; - cvta.to.local.u64 %rd359, %rd1586; - st.local.v4.u16 [%rd359], {%rs1918, %rs1918, %rs1918, %rs1918}; - add.s64 %rd360, %rd1570, 136; - cvta.to.local.u64 %rd361, %rd360; - st.local.u8 [%rd361], %rs1918; - @%p71 bra $L__BB1_157; - - cvta.to.local.u64 %rd362, %rd978; - shr.u64 %rd363, %rd11, 1; - setp.eq.s64 %p72, %rd363, 0; - @%p72 bra $L__BB1_115; - - mov.u64 %rd4128, 1; - mov.u64 %rd4126, %rd362; - mov.u64 %rd4127, %rd343; - bra.uni $L__BB1_113; - -$L__BB1_114: - ld.local.u16 %rs2, [%rd4126+4]; - add.s64 %rd4128, %rd4128, 1; - add.s64 %rd4127, %rd4127, 2; - add.s64 %rd4126, %rd4126, 2; - -$L__BB1_113: - st.local.u16 [%rd4127], %rs2; - setp.ge.u64 %p73, %rd4128, %rd363; - @%p73 bra $L__BB1_115; - bra.uni $L__BB1_114; - -$L__BB1_115: - and.b64 %rd371, %rd11, 1; - setp.eq.s64 %p74, %rd371, 
0; - @%p74 bra $L__BB1_118; - - and.b64 %rd1591, %rd11, 65534; - cvta.to.local.u64 %rd1593, %rd1570; - add.s64 %rd372, %rd1593, %rd1591; - add.s64 %rd1594, %rd362, %rd1591; - add.s64 %rd373, %rd1594, 2; - mov.u64 %rd4129, 0; - -$L__BB1_117: - add.s64 %rd1595, %rd373, %rd4129; - ld.local.u8 %rs1919, [%rd1595]; - add.s64 %rd1596, %rd372, %rd4129; - st.local.u8 [%rd1596], %rs1919; - add.s64 %rd4129, %rd4129, 1; - setp.lt.u64 %p75, %rd4129, %rd371; - @%p75 bra $L__BB1_117; - -$L__BB1_118: - mov.u64 %rd1597, 0; - st.local.u8 [%rd361], %rs1; - ld.local.v4.u16 {%rs1920, %rs1921, %rs1922, %rs1923}, [%rd343]; - ld.local.v4.u16 {%rs1928, %rs1929, %rs1930, %rs1931}, [%rd344]; - ld.local.v4.u16 {%rs1936, %rs1937, %rs1938, %rs1939}, [%rd345]; - ld.local.v4.u16 {%rs1944, %rs1945, %rs1946, %rs1947}, [%rd346]; - ld.local.v4.u16 {%rs1952, %rs1953, %rs1954, %rs1955}, [%rd347]; - shr.u16 %rs1958, %rs1955, 8; - ld.local.v4.u16 {%rs1959, %rs1960, %rs1961, %rs1962}, [%rd348]; - ld.local.v4.u16 {%rs1967, %rs1968, %rs1969, %rs1970}, [%rd349]; - ld.local.v4.u16 {%rs1975, %rs1976, %rs1977, %rs1978}, [%rd350]; - ld.local.v4.u16 {%rs1983, %rs1984, %rs1985, %rs1986}, [%rd351]; - ld.local.v4.u16 {%rs1991, %rs1992, %rs1993, %rs1994}, [%rd352]; - ld.local.v4.u16 {%rs1999, %rs2000, %rs2001, %rs2002}, [%rd353]; - ld.local.v4.u16 {%rs2007, %rs2008, %rs2009, %rs2010}, [%rd354]; - ld.local.v4.u16 {%rs2015, %rs2016, %rs2017, %rs2018}, [%rd355]; - shr.u16 %rs2021, %rs2018, 8; - ld.local.v4.u16 {%rs2022, %rs2023, %rs2024, %rs2025}, [%rd356]; - ld.local.v4.u16 {%rs2030, %rs2031, %rs2032, %rs2033}, [%rd357]; - ld.local.v4.u16 {%rs2038, %rs2039, %rs2040, %rs2041}, [%rd358]; - ld.local.v4.u16 {%rs2046, %rs2047, %rs2048, %rs2049}, [%rd359]; - ld.local.v4.u16 {%rs2054, %rs2055, %rs2056, %rs2057}, [%rd361]; - and.b16 %rs2061, %rs2054, 255; - st.local.u64 [%rd1], %rd1597; - st.local.u64 [%rd1+8], %rd1597; - st.local.u64 [%rd1+16], %rd1597; - st.local.u64 [%rd1+24], %rd1597; - st.local.u64 [%rd1+32], %rd1597; - 
st.local.u64 [%rd1+40], %rd1597; - st.local.u64 [%rd1+48], %rd1597; - st.local.u64 [%rd1+56], %rd1597; - st.local.u64 [%rd1+64], %rd1597; - st.local.u64 [%rd1+72], %rd1597; - st.local.u64 [%rd1+80], %rd1597; - st.local.u64 [%rd1+88], %rd1597; - st.local.u64 [%rd1+96], %rd1597; - st.local.u64 [%rd1+104], %rd1597; - st.local.u64 [%rd1+112], %rd1597; - st.local.u64 [%rd1+120], %rd1597; - st.local.u64 [%rd1+128], %rd1597; - st.local.u64 [%rd1+136], %rd1597; - st.local.u64 [%rd1+144], %rd1597; - st.local.u64 [%rd1+152], %rd1597; - st.local.u64 [%rd1+160], %rd1597; - st.local.u64 [%rd1+168], %rd1597; - st.local.u64 [%rd1+176], %rd1597; - st.local.u64 [%rd1+184], %rd1597; - st.local.u64 [%rd1+192], %rd1597; - st.local.v4.u16 [%rd1+200], {%rs1920, %rs1921, %rs1922, %rs1923}; - st.local.v4.u16 [%rd1+208], {%rs1928, %rs1929, %rs1930, %rs1931}; - st.local.v4.u16 [%rd1+216], {%rs1936, %rs1937, %rs1938, %rs1939}; - st.local.v4.u16 [%rd1+224], {%rs1944, %rs1945, %rs1946, %rs1947}; - st.local.v2.u16 [%rd1+232], {%rs1952, %rs1953}; - st.local.u16 [%rd1+236], %rs1954; - st.local.u8 [%rd1+238], %rs1955; - st.local.u8 [%rd1+239], %rs1958; - st.local.v4.u16 [%rd1+240], {%rs1959, %rs1960, %rs1961, %rs1962}; - st.local.v4.u16 [%rd1+248], {%rs1967, %rs1968, %rs1969, %rs1970}; - st.local.v4.u16 [%rd1+256], {%rs1975, %rs1976, %rs1977, %rs1978}; - st.local.v4.u16 [%rd1+264], {%rs1983, %rs1984, %rs1985, %rs1986}; - st.local.v4.u16 [%rd1+272], {%rs1991, %rs1992, %rs1993, %rs1994}; - st.local.v4.u16 [%rd1+280], {%rs1999, %rs2000, %rs2001, %rs2002}; - st.local.v4.u16 [%rd1+288], {%rs2007, %rs2008, %rs2009, %rs2010}; - st.local.v2.u16 [%rd1+296], {%rs2015, %rs2016}; - st.local.u16 [%rd1+300], %rs2017; - st.local.u8 [%rd1+302], %rs2018; - st.local.u8 [%rd1+303], %rs2021; - st.local.v4.u16 [%rd1+304], {%rs2022, %rs2023, %rs2024, %rs2025}; - st.local.v4.u16 [%rd1+312], {%rs2030, %rs2031, %rs2032, %rs2033}; - st.local.v4.u16 [%rd1+320], {%rs2038, %rs2039, %rs2040, %rs2041}; - st.local.v4.u16 
[%rd1+328], {%rs2046, %rs2047, %rs2048, %rs2049}; - st.local.v4.u16 [%rd1+336], {%rs2054, %rs2055, %rs2056, %rs2057}; - setp.gt.u16 %p76, %rs2061, 136; - @%p76 bra $L__BB1_156; - - setp.eq.s16 %p77, %rs2061, 136; - @%p77 bra $L__BB1_154; - - cvt.u64.u16 %rd1599, %rs2054; - and.b64 %rd377, %rd1599, 255; - add.s64 %rd1600, %rd1, %rd377; - add.s64 %rd378, %rd1600, 200; - neg.s16 %rs2067, %rs2054; - and.b16 %rs212, %rs2067, 7; - setp.eq.s16 %p78, %rs212, 0; - mov.u64 %rd4136, %rd378; - @%p78 bra $L__BB1_123; - - cvt.u64.u16 %rd1601, %rs212; - neg.s64 %rd4130, %rd1601; - mov.u64 %rd4131, %rd378; - -$L__BB1_122: - .pragma "nounroll"; - add.s64 %rd4136, %rd4131, 1; - st.local.u8 [%rd4131], %rs1918; - add.s64 %rd4130, %rd4130, 1; - setp.ne.s64 %p79, %rd4130, 0; - mov.u64 %rd4131, %rd4136; - @%p79 bra $L__BB1_122; - -$L__BB1_123: - mov.u64 %rd1602, 135; - sub.s64 %rd1603, %rd1602, %rd377; - setp.lt.u64 %p80, %rd1603, 7; - @%p80 bra $L__BB1_130; - - add.s64 %rd1604, %rd1, 328; - sub.s64 %rd387, %rd1604, %rd4136; - shr.u64 %rd1605, %rd387, 3; - add.s64 %rd1606, %rd1605, 1; - and.b64 %rd388, %rd1606, 3; - setp.eq.s64 %p81, %rd388, 0; - mov.u64 %rd4139, %rd4136; - @%p81 bra $L__BB1_127; - - neg.s64 %rd4133, %rd388; - mov.u64 %rd4135, %rd4136; - -$L__BB1_126: - .pragma "nounroll"; - st.local.u8 [%rd4135], %rs1918; - st.local.u8 [%rd4135+1], %rs1918; - st.local.u8 [%rd4135+2], %rs1918; - st.local.u8 [%rd4135+3], %rs1918; - st.local.u8 [%rd4135+4], %rs1918; - st.local.u8 [%rd4135+5], %rs1918; - st.local.u8 [%rd4135+6], %rs1918; - add.s64 %rd4136, %rd4136, 8; - add.s64 %rd4139, %rd4135, 8; - st.local.u8 [%rd4135+7], %rs1918; - add.s64 %rd4133, %rd4133, 1; - setp.ne.s64 %p82, %rd4133, 0; - mov.u64 %rd4135, %rd4139; - @%p82 bra $L__BB1_126; - -$L__BB1_127: - setp.lt.u64 %p83, %rd387, 24; - @%p83 bra $L__BB1_130; - - sub.s64 %rd1607, %rd1, %rd4136; - add.s64 %rd4138, %rd1607, 336; - -$L__BB1_129: - st.local.u8 [%rd4139], %rs1918; - st.local.u8 [%rd4139+1], %rs1918; - st.local.u8 
[%rd4139+2], %rs1918; - st.local.u8 [%rd4139+3], %rs1918; - st.local.u8 [%rd4139+4], %rs1918; - st.local.u8 [%rd4139+5], %rs1918; - st.local.u8 [%rd4139+6], %rs1918; - st.local.u8 [%rd4139+7], %rs1918; - st.local.u8 [%rd4139+8], %rs1918; - st.local.u8 [%rd4139+9], %rs1918; - st.local.u8 [%rd4139+10], %rs1918; - st.local.u8 [%rd4139+11], %rs1918; - st.local.u8 [%rd4139+12], %rs1918; - st.local.u8 [%rd4139+13], %rs1918; - st.local.u8 [%rd4139+14], %rs1918; - st.local.u8 [%rd4139+15], %rs1918; - st.local.u8 [%rd4139+16], %rs1918; - st.local.u8 [%rd4139+17], %rs1918; - st.local.u8 [%rd4139+18], %rs1918; - st.local.u8 [%rd4139+19], %rs1918; - st.local.u8 [%rd4139+20], %rs1918; - st.local.u8 [%rd4139+21], %rs1918; - st.local.u8 [%rd4139+22], %rs1918; - st.local.u8 [%rd4139+23], %rs1918; - st.local.u8 [%rd4139+24], %rs1918; - st.local.u8 [%rd4139+25], %rs1918; - st.local.u8 [%rd4139+26], %rs1918; - st.local.u8 [%rd4139+27], %rs1918; - st.local.u8 [%rd4139+28], %rs1918; - st.local.u8 [%rd4139+29], %rs1918; - st.local.u8 [%rd4139+30], %rs1918; - st.local.u8 [%rd4139+31], %rs1918; - add.s64 %rd4138, %rd4138, -32; - setp.ne.s64 %p84, %rd4138, 0; - add.s64 %rd4139, %rd4139, 32; - @%p84 bra $L__BB1_129; - -$L__BB1_130: - st.local.u8 [%rd1+336], %rs1918; - setp.gt.u16 %p85, %rs2061, 135; - @%p85 bra $L__BB1_155; - - mov.u16 %rs2073, 6; - st.local.u8 [%rd378], %rs2073; - ld.local.u8 %rs2074, [%rd1+335]; - or.b16 %rs2075, %rs2074, 128; - st.local.u8 [%rd1+335], %rs2075; - ld.local.u64 %rd1608, [%rd1+200]; - shl.b64 %rd1609, %rd1608, 8; - mov.b64 {%r437, %r438}, %rd1609; - shr.u64 %rd1610, %rd1608, 56; - mov.b64 {%r439, %r440}, %rd1610; - mov.b32 {%rs221, %rs2076}, %r439; - mov.b32 {%rs217, %rs219}, %r438; - shr.u16 %rs220, %rs219, 8; - shr.u16 %rs218, %rs217, 8; - mov.b32 {%rs213, %rs215}, %r437; - shr.u16 %rs216, %rs215, 8; - shr.u16 %rs214, %rs213, 8; - mov.pred %p86, 0; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2077, %rs215, 8; - or.b16 %rs2078, %rs214, %rs2077; - shl.b16 
%rs2079, %rs217, 8; - or.b16 %rs2080, %rs216, %rs2079; - mov.b32 %r441, {%rs2078, %rs2080}; - shl.b16 %rs2081, %rs219, 8; - or.b16 %rs2082, %rs218, %rs2081; - shl.b16 %rs2083, %rs221, 8; - or.b16 %rs2084, %rs220, %rs2083; - mov.b32 %r442, {%rs2082, %rs2084}; - mov.b64 %rd1611, {%r441, %r442}; - ld.local.u64 %rd1612, [%rd1]; - xor.b64 %rd4170, %rd1612, %rd1611; - st.local.u64 [%rd1], %rd4170; - ld.local.u64 %rd1613, [%rd1+208]; - shl.b64 %rd1614, %rd1613, 8; - mov.b64 {%r443, %r444}, %rd1614; - shr.u64 %rd1615, %rd1613, 56; - mov.b64 {%r445, %r446}, %rd1615; - mov.b32 {%rs230, %rs2085}, %r445; - mov.b32 {%rs226, %rs228}, %r444; - shr.u16 %rs229, %rs228, 8; - shr.u16 %rs227, %rs226, 8; - mov.b32 {%rs222, %rs224}, %r443; - shr.u16 %rs225, %rs224, 8; - shr.u16 %rs223, %rs222, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2086, %rs224, 8; - or.b16 %rs2087, %rs223, %rs2086; - shl.b16 %rs2088, %rs226, 8; - or.b16 %rs2089, %rs225, %rs2088; - mov.b32 %r447, {%rs2087, %rs2089}; - shl.b16 %rs2090, %rs228, 8; - or.b16 %rs2091, %rs227, %rs2090; - shl.b16 %rs2092, %rs230, 8; - or.b16 %rs2093, %rs229, %rs2092; - mov.b32 %r448, {%rs2091, %rs2093}; - mov.b64 %rd1616, {%r447, %r448}; - ld.local.u64 %rd1617, [%rd1+8]; - xor.b64 %rd4169, %rd1617, %rd1616; - st.local.u64 [%rd1+8], %rd4169; - ld.local.u64 %rd1618, [%rd1+216]; - shl.b64 %rd1619, %rd1618, 8; - mov.b64 {%r449, %r450}, %rd1619; - shr.u64 %rd1620, %rd1618, 56; - mov.b64 {%r451, %r452}, %rd1620; - mov.b32 {%rs239, %rs2094}, %r451; - mov.b32 {%rs235, %rs237}, %r450; - shr.u16 %rs238, %rs237, 8; - shr.u16 %rs236, %rs235, 8; - mov.b32 {%rs231, %rs233}, %r449; - shr.u16 %rs234, %rs233, 8; - shr.u16 %rs232, %rs231, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2095, %rs233, 8; - or.b16 %rs2096, %rs232, %rs2095; - shl.b16 %rs2097, %rs235, 8; - or.b16 %rs2098, %rs234, %rs2097; - mov.b32 %r453, {%rs2096, %rs2098}; - shl.b16 %rs2099, %rs237, 8; - or.b16 %rs2100, %rs236, %rs2099; - shl.b16 %rs2101, %rs239, 8; - or.b16 %rs2102, %rs238, 
%rs2101; - mov.b32 %r454, {%rs2100, %rs2102}; - mov.b64 %rd1621, {%r453, %r454}; - ld.local.u64 %rd1622, [%rd1+16]; - xor.b64 %rd4168, %rd1622, %rd1621; - st.local.u64 [%rd1+16], %rd4168; - ld.local.u64 %rd1623, [%rd1+224]; - shl.b64 %rd1624, %rd1623, 8; - mov.b64 {%r455, %r456}, %rd1624; - shr.u64 %rd1625, %rd1623, 56; - mov.b64 {%r457, %r458}, %rd1625; - mov.b32 {%rs248, %rs2103}, %r457; - mov.b32 {%rs244, %rs246}, %r456; - shr.u16 %rs247, %rs246, 8; - shr.u16 %rs245, %rs244, 8; - mov.b32 {%rs240, %rs242}, %r455; - shr.u16 %rs243, %rs242, 8; - shr.u16 %rs241, %rs240, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2104, %rs242, 8; - or.b16 %rs2105, %rs241, %rs2104; - shl.b16 %rs2106, %rs244, 8; - or.b16 %rs2107, %rs243, %rs2106; - mov.b32 %r459, {%rs2105, %rs2107}; - shl.b16 %rs2108, %rs246, 8; - or.b16 %rs2109, %rs245, %rs2108; - shl.b16 %rs2110, %rs248, 8; - or.b16 %rs2111, %rs247, %rs2110; - mov.b32 %r460, {%rs2109, %rs2111}; - mov.b64 %rd1626, {%r459, %r460}; - ld.local.u64 %rd1627, [%rd1+24]; - xor.b64 %rd4167, %rd1627, %rd1626; - st.local.u64 [%rd1+24], %rd4167; - ld.local.u64 %rd1628, [%rd1+232]; - shl.b64 %rd1629, %rd1628, 8; - mov.b64 {%r461, %r462}, %rd1629; - shr.u64 %rd1630, %rd1628, 56; - mov.b64 {%r463, %r464}, %rd1630; - mov.b32 {%rs257, %rs2112}, %r463; - mov.b32 {%rs253, %rs255}, %r462; - shr.u16 %rs256, %rs255, 8; - shr.u16 %rs254, %rs253, 8; - mov.b32 {%rs249, %rs251}, %r461; - shr.u16 %rs252, %rs251, 8; - shr.u16 %rs250, %rs249, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2113, %rs251, 8; - or.b16 %rs2114, %rs250, %rs2113; - shl.b16 %rs2115, %rs253, 8; - or.b16 %rs2116, %rs252, %rs2115; - mov.b32 %r465, {%rs2114, %rs2116}; - shl.b16 %rs2117, %rs255, 8; - or.b16 %rs2118, %rs254, %rs2117; - shl.b16 %rs2119, %rs257, 8; - or.b16 %rs2120, %rs256, %rs2119; - mov.b32 %r466, {%rs2118, %rs2120}; - mov.b64 %rd1631, {%r465, %r466}; - ld.local.u64 %rd1632, [%rd1+32]; - xor.b64 %rd4141, %rd1632, %rd1631; - st.local.u64 [%rd1+32], %rd4141; - ld.local.u64 %rd1633, 
[%rd1+240]; - shl.b64 %rd1634, %rd1633, 8; - mov.b64 {%r467, %r468}, %rd1634; - shr.u64 %rd1635, %rd1633, 56; - mov.b64 {%r469, %r470}, %rd1635; - mov.b32 {%rs266, %rs2121}, %r469; - mov.b32 {%rs262, %rs264}, %r468; - shr.u16 %rs265, %rs264, 8; - shr.u16 %rs263, %rs262, 8; - mov.b32 {%rs258, %rs260}, %r467; - shr.u16 %rs261, %rs260, 8; - shr.u16 %rs259, %rs258, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2122, %rs260, 8; - or.b16 %rs2123, %rs259, %rs2122; - shl.b16 %rs2124, %rs262, 8; - or.b16 %rs2125, %rs261, %rs2124; - mov.b32 %r471, {%rs2123, %rs2125}; - shl.b16 %rs2126, %rs264, 8; - or.b16 %rs2127, %rs263, %rs2126; - shl.b16 %rs2128, %rs266, 8; - or.b16 %rs2129, %rs265, %rs2128; - mov.b32 %r472, {%rs2127, %rs2129}; - mov.b64 %rd1636, {%r471, %r472}; - ld.local.u64 %rd1637, [%rd1+40]; - xor.b64 %rd4164, %rd1637, %rd1636; - st.local.u64 [%rd1+40], %rd4164; - ld.local.u64 %rd1638, [%rd1+248]; - shl.b64 %rd1639, %rd1638, 8; - mov.b64 {%r473, %r474}, %rd1639; - shr.u64 %rd1640, %rd1638, 56; - mov.b64 {%r475, %r476}, %rd1640; - mov.b32 {%rs275, %rs2130}, %r475; - mov.b32 {%rs271, %rs273}, %r474; - shr.u16 %rs274, %rs273, 8; - shr.u16 %rs272, %rs271, 8; - mov.b32 {%rs267, %rs269}, %r473; - shr.u16 %rs270, %rs269, 8; - shr.u16 %rs268, %rs267, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2131, %rs269, 8; - or.b16 %rs2132, %rs268, %rs2131; - shl.b16 %rs2133, %rs271, 8; - or.b16 %rs2134, %rs270, %rs2133; - mov.b32 %r477, {%rs2132, %rs2134}; - shl.b16 %rs2135, %rs273, 8; - or.b16 %rs2136, %rs272, %rs2135; - shl.b16 %rs2137, %rs275, 8; - or.b16 %rs2138, %rs274, %rs2137; - mov.b32 %r478, {%rs2136, %rs2138}; - mov.b64 %rd1641, {%r477, %r478}; - ld.local.u64 %rd1642, [%rd1+48]; - xor.b64 %rd4160, %rd1642, %rd1641; - st.local.u64 [%rd1+48], %rd4160; - ld.local.u64 %rd1643, [%rd1+256]; - shl.b64 %rd1644, %rd1643, 8; - mov.b64 {%r479, %r480}, %rd1644; - shr.u64 %rd1645, %rd1643, 56; - mov.b64 {%r481, %r482}, %rd1645; - mov.b32 {%rs284, %rs2139}, %r481; - mov.b32 {%rs280, %rs282}, 
%r480; - shr.u16 %rs283, %rs282, 8; - shr.u16 %rs281, %rs280, 8; - mov.b32 {%rs276, %rs278}, %r479; - shr.u16 %rs279, %rs278, 8; - shr.u16 %rs277, %rs276, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2140, %rs278, 8; - or.b16 %rs2141, %rs277, %rs2140; - shl.b16 %rs2142, %rs280, 8; - or.b16 %rs2143, %rs279, %rs2142; - mov.b32 %r483, {%rs2141, %rs2143}; - shl.b16 %rs2144, %rs282, 8; - or.b16 %rs2145, %rs281, %rs2144; - shl.b16 %rs2146, %rs284, 8; - or.b16 %rs2147, %rs283, %rs2146; - mov.b32 %r484, {%rs2145, %rs2147}; - mov.b64 %rd1646, {%r483, %r484}; - ld.local.u64 %rd1647, [%rd1+56]; - xor.b64 %rd4156, %rd1647, %rd1646; - st.local.u64 [%rd1+56], %rd4156; - ld.local.u64 %rd1648, [%rd1+264]; - shl.b64 %rd1649, %rd1648, 8; - mov.b64 {%r485, %r486}, %rd1649; - shr.u64 %rd1650, %rd1648, 56; - mov.b64 {%r487, %r488}, %rd1650; - mov.b32 {%rs293, %rs2148}, %r487; - mov.b32 {%rs289, %rs291}, %r486; - shr.u16 %rs292, %rs291, 8; - shr.u16 %rs290, %rs289, 8; - mov.b32 {%rs285, %rs287}, %r485; - shr.u16 %rs288, %rs287, 8; - shr.u16 %rs286, %rs285, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2149, %rs287, 8; - or.b16 %rs2150, %rs286, %rs2149; - shl.b16 %rs2151, %rs289, 8; - or.b16 %rs2152, %rs288, %rs2151; - mov.b32 %r489, {%rs2150, %rs2152}; - shl.b16 %rs2153, %rs291, 8; - or.b16 %rs2154, %rs290, %rs2153; - shl.b16 %rs2155, %rs293, 8; - or.b16 %rs2156, %rs292, %rs2155; - mov.b32 %r490, {%rs2154, %rs2156}; - mov.b64 %rd1651, {%r489, %r490}; - ld.local.u64 %rd1652, [%rd1+64]; - xor.b64 %rd4152, %rd1652, %rd1651; - st.local.u64 [%rd1+64], %rd4152; - ld.local.u64 %rd1653, [%rd1+272]; - shl.b64 %rd1654, %rd1653, 8; - mov.b64 {%r491, %r492}, %rd1654; - shr.u64 %rd1655, %rd1653, 56; - mov.b64 {%r493, %r494}, %rd1655; - mov.b32 {%rs302, %rs2157}, %r493; - mov.b32 {%rs298, %rs300}, %r492; - shr.u16 %rs301, %rs300, 8; - shr.u16 %rs299, %rs298, 8; - mov.b32 {%rs294, %rs296}, %r491; - shr.u16 %rs297, %rs296, 8; - shr.u16 %rs295, %rs294, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2158, %rs296, 
8; - or.b16 %rs2159, %rs295, %rs2158; - shl.b16 %rs2160, %rs298, 8; - or.b16 %rs2161, %rs297, %rs2160; - mov.b32 %r495, {%rs2159, %rs2161}; - shl.b16 %rs2162, %rs300, 8; - or.b16 %rs2163, %rs299, %rs2162; - shl.b16 %rs2164, %rs302, 8; - or.b16 %rs2165, %rs301, %rs2164; - mov.b32 %r496, {%rs2163, %rs2165}; - mov.b64 %rd1656, {%r495, %r496}; - ld.local.u64 %rd1657, [%rd1+72]; - xor.b64 %rd4148, %rd1657, %rd1656; - st.local.u64 [%rd1+72], %rd4148; - ld.local.u64 %rd1658, [%rd1+280]; - shl.b64 %rd1659, %rd1658, 8; - mov.b64 {%r497, %r498}, %rd1659; - shr.u64 %rd1660, %rd1658, 56; - mov.b64 {%r499, %r500}, %rd1660; - mov.b32 {%rs311, %rs2166}, %r499; - mov.b32 {%rs307, %rs309}, %r498; - shr.u16 %rs310, %rs309, 8; - shr.u16 %rs308, %rs307, 8; - mov.b32 {%rs303, %rs305}, %r497; - shr.u16 %rs306, %rs305, 8; - shr.u16 %rs304, %rs303, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2167, %rs305, 8; - or.b16 %rs2168, %rs304, %rs2167; - shl.b16 %rs2169, %rs307, 8; - or.b16 %rs2170, %rs306, %rs2169; - mov.b32 %r501, {%rs2168, %rs2170}; - shl.b16 %rs2171, %rs309, 8; - or.b16 %rs2172, %rs308, %rs2171; - shl.b16 %rs2173, %rs311, 8; - or.b16 %rs2174, %rs310, %rs2173; - mov.b32 %r502, {%rs2172, %rs2174}; - mov.b64 %rd1661, {%r501, %r502}; - ld.local.u64 %rd1662, [%rd1+80]; - xor.b64 %rd4163, %rd1662, %rd1661; - st.local.u64 [%rd1+80], %rd4163; - ld.local.u64 %rd1663, [%rd1+288]; - shl.b64 %rd1664, %rd1663, 8; - mov.b64 {%r503, %r504}, %rd1664; - shr.u64 %rd1665, %rd1663, 56; - mov.b64 {%r505, %r506}, %rd1665; - mov.b32 {%rs320, %rs2175}, %r505; - mov.b32 {%rs316, %rs318}, %r504; - shr.u16 %rs319, %rs318, 8; - shr.u16 %rs317, %rs316, 8; - mov.b32 {%rs312, %rs314}, %r503; - shr.u16 %rs315, %rs314, 8; - shr.u16 %rs313, %rs312, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2176, %rs314, 8; - or.b16 %rs2177, %rs313, %rs2176; - shl.b16 %rs2178, %rs316, 8; - or.b16 %rs2179, %rs315, %rs2178; - mov.b32 %r507, {%rs2177, %rs2179}; - shl.b16 %rs2180, %rs318, 8; - or.b16 %rs2181, %rs317, %rs2180; - 
shl.b16 %rs2182, %rs320, 8; - or.b16 %rs2183, %rs319, %rs2182; - mov.b32 %r508, {%rs2181, %rs2183}; - mov.b64 %rd1666, {%r507, %r508}; - ld.local.u64 %rd1667, [%rd1+88]; - xor.b64 %rd4159, %rd1667, %rd1666; - st.local.u64 [%rd1+88], %rd4159; - ld.local.u64 %rd1668, [%rd1+296]; - shl.b64 %rd1669, %rd1668, 8; - mov.b64 {%r509, %r510}, %rd1669; - shr.u64 %rd1670, %rd1668, 56; - mov.b64 {%r511, %r512}, %rd1670; - mov.b32 {%rs329, %rs2184}, %r511; - mov.b32 {%rs325, %rs327}, %r510; - shr.u16 %rs328, %rs327, 8; - shr.u16 %rs326, %rs325, 8; - mov.b32 {%rs321, %rs323}, %r509; - shr.u16 %rs324, %rs323, 8; - shr.u16 %rs322, %rs321, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2185, %rs323, 8; - or.b16 %rs2186, %rs322, %rs2185; - shl.b16 %rs2187, %rs325, 8; - or.b16 %rs2188, %rs324, %rs2187; - mov.b32 %r513, {%rs2186, %rs2188}; - shl.b16 %rs2189, %rs327, 8; - or.b16 %rs2190, %rs326, %rs2189; - shl.b16 %rs2191, %rs329, 8; - or.b16 %rs2192, %rs328, %rs2191; - mov.b32 %r514, {%rs2190, %rs2192}; - mov.b64 %rd1671, {%r513, %r514}; - ld.local.u64 %rd1672, [%rd1+96]; - xor.b64 %rd4155, %rd1672, %rd1671; - st.local.u64 [%rd1+96], %rd4155; - ld.local.u64 %rd1673, [%rd1+304]; - shl.b64 %rd1674, %rd1673, 8; - mov.b64 {%r515, %r516}, %rd1674; - shr.u64 %rd1675, %rd1673, 56; - mov.b64 {%r517, %r518}, %rd1675; - mov.b32 {%rs338, %rs2193}, %r517; - mov.b32 {%rs334, %rs336}, %r516; - shr.u16 %rs337, %rs336, 8; - shr.u16 %rs335, %rs334, 8; - mov.b32 {%rs330, %rs332}, %r515; - shr.u16 %rs333, %rs332, 8; - shr.u16 %rs331, %rs330, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2194, %rs332, 8; - or.b16 %rs2195, %rs331, %rs2194; - shl.b16 %rs2196, %rs334, 8; - or.b16 %rs2197, %rs333, %rs2196; - mov.b32 %r519, {%rs2195, %rs2197}; - shl.b16 %rs2198, %rs336, 8; - or.b16 %rs2199, %rs335, %rs2198; - shl.b16 %rs2200, %rs338, 8; - or.b16 %rs2201, %rs337, %rs2200; - mov.b32 %r520, {%rs2199, %rs2201}; - mov.b64 %rd1676, {%r519, %r520}; - ld.local.u64 %rd1677, [%rd1+104]; - xor.b64 %rd4151, %rd1677, %rd1676; - 
st.local.u64 [%rd1+104], %rd4151; - ld.local.u64 %rd1678, [%rd1+312]; - shl.b64 %rd1679, %rd1678, 8; - mov.b64 {%r521, %r522}, %rd1679; - shr.u64 %rd1680, %rd1678, 56; - mov.b64 {%r523, %r524}, %rd1680; - mov.b32 {%rs347, %rs2202}, %r523; - mov.b32 {%rs343, %rs345}, %r522; - shr.u16 %rs346, %rs345, 8; - shr.u16 %rs344, %rs343, 8; - mov.b32 {%rs339, %rs341}, %r521; - shr.u16 %rs342, %rs341, 8; - shr.u16 %rs340, %rs339, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2203, %rs341, 8; - or.b16 %rs2204, %rs340, %rs2203; - shl.b16 %rs2205, %rs343, 8; - or.b16 %rs2206, %rs342, %rs2205; - mov.b32 %r525, {%rs2204, %rs2206}; - shl.b16 %rs2207, %rs345, 8; - or.b16 %rs2208, %rs344, %rs2207; - shl.b16 %rs2209, %rs347, 8; - or.b16 %rs2210, %rs346, %rs2209; - mov.b32 %r526, {%rs2208, %rs2210}; - mov.b64 %rd1681, {%r525, %r526}; - ld.local.u64 %rd1682, [%rd1+112]; - xor.b64 %rd4147, %rd1682, %rd1681; - st.local.u64 [%rd1+112], %rd4147; - ld.local.u64 %rd1683, [%rd1+320]; - shl.b64 %rd1684, %rd1683, 8; - mov.b64 {%r527, %r528}, %rd1684; - shr.u64 %rd1685, %rd1683, 56; - mov.b64 {%r529, %r530}, %rd1685; - mov.b32 {%rs356, %rs2211}, %r529; - mov.b32 {%rs352, %rs354}, %r528; - shr.u16 %rs355, %rs354, 8; - shr.u16 %rs353, %rs352, 8; - mov.b32 {%rs348, %rs350}, %r527; - shr.u16 %rs351, %rs350, 8; - shr.u16 %rs349, %rs348, 8; - @%p86 bra $L__BB1_148; - - shl.b16 %rs2212, %rs350, 8; - or.b16 %rs2213, %rs349, %rs2212; - shl.b16 %rs2214, %rs352, 8; - or.b16 %rs2215, %rs351, %rs2214; - mov.b32 %r531, {%rs2213, %rs2215}; - shl.b16 %rs2216, %rs354, 8; - or.b16 %rs2217, %rs353, %rs2216; - shl.b16 %rs2218, %rs356, 8; - or.b16 %rs2219, %rs355, %rs2218; - mov.b32 %r532, {%rs2217, %rs2219}; - mov.b64 %rd1686, {%r531, %r532}; - ld.local.u64 %rd1687, [%rd1+120]; - xor.b64 %rd4162, %rd1687, %rd1686; - st.local.u64 [%rd1+120], %rd4162; - ld.local.u64 %rd1688, [%rd1+328]; - shl.b64 %rd1689, %rd1688, 8; - mov.b64 {%r533, %r534}, %rd1689; - shr.u64 %rd1690, %rd1688, 56; - mov.b64 {%r535, %r536}, %rd1690; - 
mov.b32 {%rs365, %rs2220}, %r535; - mov.b32 {%rs361, %rs363}, %r534; - shr.u16 %rs364, %rs363, 8; - shr.u16 %rs362, %rs361, 8; - mov.b32 {%rs357, %rs359}, %r533; - shr.u16 %rs360, %rs359, 8; - shr.u16 %rs358, %rs357, 8; - mov.pred %p102, -1; - @%p102 bra $L__BB1_149; - bra.uni $L__BB1_148; - -$L__BB1_149: - shl.b16 %rs2221, %rs359, 8; - or.b16 %rs2222, %rs358, %rs2221; - shl.b16 %rs2223, %rs361, 8; - or.b16 %rs2224, %rs360, %rs2223; - mov.b32 %r537, {%rs2222, %rs2224}; - shl.b16 %rs2225, %rs363, 8; - or.b16 %rs2226, %rs362, %rs2225; - shl.b16 %rs2227, %rs365, 8; - or.b16 %rs2228, %rs364, %rs2227; - mov.b32 %r538, {%rs2226, %rs2228}; - mov.b64 %rd1691, {%r537, %r538}; - ld.local.u64 %rd1692, [%rd1+128]; - xor.b64 %rd4158, %rd1692, %rd1691; - st.local.u64 [%rd1+128], %rd4158; - @%p86 bra $L__BB1_153; - - add.s64 %rd1696, %rd968, 40; - cvta.to.local.u64 %rd421, %rd1696; - add.s64 %rd1697, %rd968, 80; - cvta.to.local.u64 %rd422, %rd1697; - add.s64 %rd1698, %rd968, 120; - cvta.to.local.u64 %rd423, %rd1698; - add.s64 %rd1699, %rd968, 160; - cvta.to.local.u64 %rd424, %rd1699; - add.s64 %rd1700, %rd968, 8; - cvta.to.local.u64 %rd425, %rd1700; - add.s64 %rd1701, %rd968, 48; - cvta.to.local.u64 %rd426, %rd1701; - add.s64 %rd1702, %rd968, 88; - cvta.to.local.u64 %rd427, %rd1702; - add.s64 %rd1703, %rd968, 128; - cvta.to.local.u64 %rd428, %rd1703; - add.s64 %rd1704, %rd968, 168; - cvta.to.local.u64 %rd429, %rd1704; - add.s64 %rd1705, %rd968, 16; - cvta.to.local.u64 %rd430, %rd1705; - add.s64 %rd1706, %rd968, 56; - cvta.to.local.u64 %rd431, %rd1706; - add.s64 %rd1707, %rd968, 96; - cvta.to.local.u64 %rd432, %rd1707; - add.s64 %rd1708, %rd968, 136; - cvta.to.local.u64 %rd433, %rd1708; - add.s64 %rd1709, %rd968, 176; - cvta.to.local.u64 %rd434, %rd1709; - add.s64 %rd1710, %rd968, 24; - cvta.to.local.u64 %rd435, %rd1710; - add.s64 %rd1711, %rd968, 64; - cvta.to.local.u64 %rd436, %rd1711; - add.s64 %rd1712, %rd968, 104; - cvta.to.local.u64 %rd437, %rd1712; - add.s64 %rd1713, 
%rd968, 144; - cvta.to.local.u64 %rd438, %rd1713; - add.s64 %rd1714, %rd968, 184; - cvta.to.local.u64 %rd439, %rd1714; - add.s64 %rd1715, %rd968, 32; - cvta.to.local.u64 %rd440, %rd1715; - add.s64 %rd1716, %rd968, 72; - cvta.to.local.u64 %rd441, %rd1716; - add.s64 %rd1717, %rd968, 112; - cvta.to.local.u64 %rd442, %rd1717; - add.s64 %rd1718, %rd968, 152; - cvta.to.local.u64 %rd443, %rd1718; - add.s64 %rd1719, %rd968, 192; - mov.u64 %rd4140, 192; - cvta.to.local.u64 %rd444, %rd1719; - ld.local.u64 %rd4161, [%rd424]; - ld.local.u64 %rd4157, [%rd429]; - ld.local.u64 %rd4154, [%rd433]; - ld.local.u64 %rd4153, [%rd434]; - ld.local.u64 %rd4150, [%rd438]; - ld.local.u64 %rd4149, [%rd439]; - ld.local.u64 %rd4146, [%rd443]; - ld.local.u64 %rd4145, [%rd444]; - mov.u64 %rd4166, private$9214; - -$L__BB1_151: - add.s64 %rd480, %rd4166, 8; - xor.b64 %rd1720, %rd4162, %rd4161; - xor.b64 %rd1721, %rd1720, %rd4163; - xor.b64 %rd1722, %rd1721, %rd4164; - xor.b64 %rd1723, %rd1722, %rd4170; - xor.b64 %rd1724, %rd4157, %rd4169; - xor.b64 %rd1725, %rd1724, %rd4158; - xor.b64 %rd1726, %rd1725, %rd4159; - xor.b64 %rd1727, %rd1726, %rd4160; - xor.b64 %rd1728, %rd4153, %rd4168; - xor.b64 %rd1729, %rd1728, %rd4154; - xor.b64 %rd1730, %rd1729, %rd4155; - xor.b64 %rd1731, %rd1730, %rd4156; - xor.b64 %rd1732, %rd4149, %rd4167; - xor.b64 %rd1733, %rd1732, %rd4150; - xor.b64 %rd1734, %rd1733, %rd4151; - xor.b64 %rd1735, %rd1734, %rd4152; - xor.b64 %rd1736, %rd4145, %rd4141; - xor.b64 %rd1737, %rd1736, %rd4146; - xor.b64 %rd1738, %rd1737, %rd4147; - xor.b64 %rd1739, %rd1738, %rd4148; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1727, 1; - shr.b64 %rhs, %rd1727, 63; - add.u64 %rd1740, %lhs, %rhs; - } - xor.b64 %rd1741, %rd1740, %rd1739; - xor.b64 %rd1742, %rd4170, %rd1741; - xor.b64 %rd1743, %rd1741, %rd4164; - xor.b64 %rd1744, %rd1741, %rd4163; - xor.b64 %rd1745, %rd1741, %rd4162; - xor.b64 %rd1746, %rd1741, %rd4161; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1731, 1; 
- shr.b64 %rhs, %rd1731, 63; - add.u64 %rd1747, %lhs, %rhs; - } - xor.b64 %rd1748, %rd1723, %rd1747; - xor.b64 %rd1749, %rd1748, %rd4169; - xor.b64 %rd1750, %rd1748, %rd4160; - xor.b64 %rd1751, %rd1748, %rd4159; - xor.b64 %rd1752, %rd1748, %rd4158; - xor.b64 %rd1753, %rd1748, %rd4157; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1735, 1; - shr.b64 %rhs, %rd1735, 63; - add.u64 %rd1754, %lhs, %rhs; - } - xor.b64 %rd1755, %rd1727, %rd1754; - xor.b64 %rd1756, %rd1755, %rd4168; - xor.b64 %rd1757, %rd1755, %rd4156; - xor.b64 %rd1758, %rd1755, %rd4155; - xor.b64 %rd1759, %rd1755, %rd4154; - xor.b64 %rd1760, %rd1755, %rd4153; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1739, 1; - shr.b64 %rhs, %rd1739, 63; - add.u64 %rd1761, %lhs, %rhs; - } - xor.b64 %rd1762, %rd1731, %rd1761; - xor.b64 %rd1763, %rd1762, %rd4167; - xor.b64 %rd1764, %rd1762, %rd4152; - xor.b64 %rd1765, %rd1762, %rd4151; - xor.b64 %rd1766, %rd1762, %rd4150; - xor.b64 %rd1767, %rd1762, %rd4149; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1723, 1; - shr.b64 %rhs, %rd1723, 63; - add.u64 %rd1768, %lhs, %rhs; - } - xor.b64 %rd1769, %rd1768, %rd1735; - xor.b64 %rd1770, %rd1769, %rd4141; - xor.b64 %rd1771, %rd1769, %rd4148; - xor.b64 %rd1772, %rd1769, %rd4147; - xor.b64 %rd1773, %rd1769, %rd4146; - xor.b64 %rd1774, %rd1769, %rd4145; - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1749, 1; - shr.b64 %rhs, %rd1749, 63; - add.u64 %rd1775, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1744, 3; - shr.b64 %rhs, %rd1744, 61; - add.u64 %rd1776, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1757, 6; - shr.b64 %rhs, %rd1757, 58; - add.u64 %rd1777, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1751, 10; - shr.b64 %rhs, %rd1751, 54; - add.u64 %rd1778, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1759, 15; - shr.b64 %rhs, %rd1759, 49; - add.u64 %rd1779, %lhs, 
%rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1766, 21; - shr.b64 %rhs, %rd1766, 43; - add.u64 %rd1780, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1763, 28; - shr.b64 %rhs, %rd1763, 36; - add.u64 %rd1781, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1743, 36; - shr.b64 %rhs, %rd1743, 28; - add.u64 %rd1782, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1752, 45; - shr.b64 %rhs, %rd1752, 19; - add.u64 %rd1783, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1764, 55; - shr.b64 %rhs, %rd1764, 9; - add.u64 %rd1784, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1753, 2; - shr.b64 %rhs, %rd1753, 62; - add.u64 %rd1785, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1774, 14; - shr.b64 %rhs, %rd1774, 50; - add.u64 %rd1786, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1770, 27; - shr.b64 %rhs, %rd1770, 37; - add.u64 %rd1787, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1745, 41; - shr.b64 %rhs, %rd1745, 23; - add.u64 %rd1788, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1767, 56; - shr.b64 %rhs, %rd1767, 8; - add.u64 %rd1789, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1773, 8; - shr.b64 %rhs, %rd1773, 56; - add.u64 %rd1790, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1765, 25; - shr.b64 %rhs, %rd1765, 39; - add.u64 %rd1791, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1758, 43; - shr.b64 %rhs, %rd1758, 21; - add.u64 %rd1792, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1756, 62; - shr.b64 %rhs, %rd1756, 2; - add.u64 %rd1793, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1746, 18; - shr.b64 %rhs, %rd1746, 46; - add.u64 %rd1794, %lhs, %rhs; - } 
- { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1772, 39; - shr.b64 %rhs, %rd1772, 25; - add.u64 %rd1795, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1760, 61; - shr.b64 %rhs, %rd1760, 3; - add.u64 %rd1796, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1771, 20; - shr.b64 %rhs, %rd1771, 44; - add.u64 %rd1797, %lhs, %rhs; - } - { - .reg .b64 %lhs; - .reg .b64 %rhs; - shl.b64 %lhs, %rd1750, 44; - shr.b64 %rhs, %rd1750, 20; - add.u64 %rd1798, %lhs, %rhs; - } - not.b64 %rd1799, %rd1798; - and.b64 %rd1800, %rd1792, %rd1799; - not.b64 %rd1801, %rd1792; - and.b64 %rd1802, %rd1780, %rd1801; - xor.b64 %rd4169, %rd1798, %rd1802; - not.b64 %rd1803, %rd1780; - and.b64 %rd1804, %rd1786, %rd1803; - xor.b64 %rd4168, %rd1804, %rd1792; - not.b64 %rd1805, %rd1786; - and.b64 %rd1806, %rd1742, %rd1805; - xor.b64 %rd4167, %rd1806, %rd1780; - not.b64 %rd1807, %rd1742; - and.b64 %rd1808, %rd1798, %rd1807; - xor.b64 %rd4141, %rd1808, %rd1786; - not.b64 %rd1809, %rd1797; - and.b64 %rd1810, %rd1776, %rd1809; - xor.b64 %rd4164, %rd1810, %rd1781; - not.b64 %rd1811, %rd1776; - and.b64 %rd1812, %rd1783, %rd1811; - xor.b64 %rd4160, %rd1812, %rd1797; - not.b64 %rd1813, %rd1783; - and.b64 %rd1814, %rd1796, %rd1813; - xor.b64 %rd4156, %rd1814, %rd1776; - not.b64 %rd1815, %rd1796; - and.b64 %rd1816, %rd1781, %rd1815; - xor.b64 %rd4152, %rd1783, %rd1816; - not.b64 %rd1817, %rd1781; - and.b64 %rd1818, %rd1797, %rd1817; - xor.b64 %rd4148, %rd1818, %rd1796; - not.b64 %rd1819, %rd1777; - and.b64 %rd1820, %rd1791, %rd1819; - xor.b64 %rd4163, %rd1775, %rd1820; - not.b64 %rd1821, %rd1791; - and.b64 %rd1822, %rd1790, %rd1821; - xor.b64 %rd4159, %rd1822, %rd1777; - not.b64 %rd1823, %rd1790; - and.b64 %rd1824, %rd1794, %rd1823; - xor.b64 %rd4155, %rd1824, %rd1791; - not.b64 %rd1825, %rd1794; - and.b64 %rd1826, %rd1775, %rd1825; - xor.b64 %rd4151, %rd1826, %rd1790; - not.b64 %rd1827, %rd1775; - and.b64 %rd1828, %rd1777, %rd1827; - xor.b64 
%rd4147, %rd1828, %rd1794; - not.b64 %rd1829, %rd1782; - and.b64 %rd1830, %rd1778, %rd1829; - xor.b64 %rd4162, %rd1830, %rd1787; - not.b64 %rd1831, %rd1778; - and.b64 %rd1832, %rd1779, %rd1831; - xor.b64 %rd4158, %rd1832, %rd1782; - not.b64 %rd1833, %rd1779; - and.b64 %rd1834, %rd1789, %rd1833; - xor.b64 %rd4154, %rd1778, %rd1834; - not.b64 %rd1835, %rd1789; - and.b64 %rd1836, %rd1787, %rd1835; - xor.b64 %rd4150, %rd1836, %rd1779; - not.b64 %rd1837, %rd1787; - and.b64 %rd1838, %rd1782, %rd1837; - xor.b64 %rd4146, %rd1838, %rd1789; - not.b64 %rd1839, %rd1784; - and.b64 %rd1840, %rd1795, %rd1839; - xor.b64 %rd4161, %rd1840, %rd1793; - not.b64 %rd1841, %rd1795; - and.b64 %rd1842, %rd1788, %rd1841; - xor.b64 %rd4157, %rd1842, %rd1784; - not.b64 %rd1843, %rd1788; - and.b64 %rd1844, %rd1785, %rd1843; - xor.b64 %rd4153, %rd1844, %rd1795; - not.b64 %rd1845, %rd1785; - and.b64 %rd1846, %rd1793, %rd1845; - xor.b64 %rd4149, %rd1846, %rd1788; - not.b64 %rd1847, %rd1793; - and.b64 %rd1848, %rd1784, %rd1847; - xor.b64 %rd4145, %rd1785, %rd1848; - ld.global.nc.u64 %rd1849, [%rd4166]; - xor.b64 %rd1850, %rd1849, %rd1742; - xor.b64 %rd4170, %rd1850, %rd1800; - add.s64 %rd4140, %rd4140, -8; - setp.ne.s64 %p104, %rd4140, 0; - mov.u64 %rd4166, %rd480; - @%p104 bra $L__BB1_151; - - st.local.u64 [%rd429], %rd4157; - st.local.u64 [%rd444], %rd4145; - st.local.u64 [%rd439], %rd4149; - st.local.u64 [%rd430], %rd4168; - st.local.u64 [%rd435], %rd4167; - st.local.u64 [%rd440], %rd4141; - st.local.u64 [%rd421], %rd4164; - st.local.u64 [%rd426], %rd4160; - st.local.u64 [%rd431], %rd4156; - st.local.u64 [%rd436], %rd4152; - st.local.u64 [%rd441], %rd4148; - st.local.u64 [%rd422], %rd4163; - st.local.u64 [%rd427], %rd4159; - st.local.u64 [%rd432], %rd4155; - st.local.u64 [%rd437], %rd4151; - st.local.u64 [%rd442], %rd4147; - st.local.u64 [%rd423], %rd4162; - st.local.u64 [%rd428], %rd4158; - st.local.u64 [%rd433], %rd4154; - st.local.u64 [%rd438], %rd4150; - st.local.u64 [%rd443], %rd4146; - 
st.local.u64 [%rd424], %rd4161; - st.local.u64 [%rd434], %rd4153; - st.local.u64 [%rd425], %rd4169; - st.local.u64 [%rd1], %rd4170; - -$L__BB1_153: - shr.u64 %rd1851, %rd4168, 8; - shr.u64 %rd1852, %rd4168, 16; - shr.u64 %rd1853, %rd4168, 24; - shr.u64 %rd1854, %rd4168, 32; - shr.u64 %rd1855, %rd4168, 40; - shr.u64 %rd1856, %rd4168, 48; - shr.u64 %rd1857, %rd4168, 56; - shr.u64 %rd1858, %rd4167, 8; - shr.u64 %rd1859, %rd4167, 16; - shr.u64 %rd1860, %rd4167, 24; - shr.u64 %rd1861, %rd4167, 32; - shr.u64 %rd1862, %rd4167, 40; - shr.u64 %rd1863, %rd4167, 48; - shr.u64 %rd1864, %rd4167, 56; - shr.u64 %rd1865, %rd4170, 8; - shr.u64 %rd1866, %rd4170, 16; - shr.u64 %rd1867, %rd4170, 24; - shr.u64 %rd1868, %rd4170, 32; - shr.u64 %rd1869, %rd4170, 40; - shr.u64 %rd1870, %rd4170, 48; - shr.u64 %rd1871, %rd4170, 56; - shr.u64 %rd1872, %rd4169, 8; - shr.u64 %rd1873, %rd4169, 16; - shr.u64 %rd1874, %rd4169, 24; - shr.u64 %rd1875, %rd4169, 32; - shr.u64 %rd1876, %rd4169, 40; - shr.u64 %rd1877, %rd4169, 48; - shr.u64 %rd1878, %rd4169, 56; - mov.u16 %rs2229, 32; - st.local.u16 [%rd12], %rs2229; - cvt.u16.u64 %rs2230, %rd4170; - cvt.u16.u64 %rs2231, %rd1865; - st.local.v2.u8 [%rd12+2], {%rs2230, %rs2231}; - cvt.u16.u64 %rs2232, %rd1867; - cvt.u16.u64 %rs2233, %rd1866; - st.local.v2.u8 [%rd12+4], {%rs2233, %rs2232}; - cvt.u16.u64 %rs2234, %rd1869; - cvt.u16.u64 %rs2235, %rd1868; - st.local.v2.u8 [%rd12+6], {%rs2235, %rs2234}; - cvt.u16.u64 %rs2236, %rd1871; - cvt.u16.u64 %rs2237, %rd1870; - st.local.v2.u8 [%rd12+8], {%rs2237, %rs2236}; - cvt.u16.u64 %rs2238, %rd4169; - cvt.u16.u64 %rs2239, %rd1872; - st.local.v2.u8 [%rd12+10], {%rs2238, %rs2239}; - cvt.u16.u64 %rs2240, %rd1874; - cvt.u16.u64 %rs2241, %rd1873; - st.local.v2.u8 [%rd12+12], {%rs2241, %rs2240}; - cvt.u16.u64 %rs2242, %rd1876; - cvt.u16.u64 %rs2243, %rd1875; - st.local.v2.u8 [%rd12+14], {%rs2243, %rs2242}; - cvt.u16.u64 %rs2244, %rd1878; - cvt.u16.u64 %rs2245, %rd1877; - st.local.v2.u8 [%rd12+16], {%rs2245, %rs2244}; - 
cvt.u16.u64 %rs2246, %rd4168; - cvt.u16.u64 %rs2247, %rd1851; - st.local.v2.u8 [%rd12+18], {%rs2246, %rs2247}; - cvt.u16.u64 %rs2248, %rd1853; - cvt.u16.u64 %rs2249, %rd1852; - st.local.v2.u8 [%rd12+20], {%rs2249, %rs2248}; - cvt.u16.u64 %rs2250, %rd1855; - cvt.u16.u64 %rs2251, %rd1854; - st.local.v2.u8 [%rd12+22], {%rs2251, %rs2250}; - cvt.u16.u64 %rs2252, %rd1857; - cvt.u16.u64 %rs2253, %rd1856; - st.local.v2.u8 [%rd12+24], {%rs2253, %rs2252}; - cvt.u16.u64 %rs2254, %rd4167; - cvt.u16.u64 %rs2255, %rd1858; - st.local.v2.u8 [%rd12+26], {%rs2254, %rs2255}; - cvt.u16.u64 %rs2256, %rd1860; - cvt.u16.u64 %rs2257, %rd1859; - st.local.v2.u8 [%rd12+28], {%rs2257, %rs2256}; - cvt.u16.u64 %rs2258, %rd1862; - cvt.u16.u64 %rs2259, %rd1861; - st.local.v2.u8 [%rd12+30], {%rs2259, %rs2258}; - cvt.u16.u64 %rs2260, %rd1864; - cvt.u16.u64 %rs2261, %rd1863; - st.local.v2.u8 [%rd12+32], {%rs2261, %rs2260}; - st.local.v2.u8 [%rd12+34], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+36], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+38], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+40], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+42], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+44], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+46], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+48], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+50], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+52], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+54], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+56], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+58], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+60], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+62], {%rs1918, %rs1918}; - st.local.v2.u8 [%rd12+64], {%rs1918, %rs1918}; - bra.uni $L__BB1_549; - -$L__BB1_417: - st.local.u64 [%rd1+80], %rd914; - ld.local.u32 %rd3826, [%rd1+24]; - shl.b64 %rd3827, %rd3826, 8; - mov.b64 {%r7101, %r7102}, %rd3827; - mov.b32 {%rs1036, %rs3886}, %r7102; - mov.b32 {%rs1032, %rs1034}, %r7101; - shr.u16 %rs1035, %rs1034, 8; - shr.u16 %rs1033, %rs1032, 8; 
- mov.pred %p304, 0; - @%p304 bra $L__BB1_432; - - ld.local.u32 %rd3828, [%rd1+28]; - shl.b64 %rd3829, %rd3828, 8; - mov.b64 {%r7103, %r7104}, %rd3829; - mov.b32 {%rs1041, %rs3887}, %r7104; - mov.b32 {%rs1037, %rs1039}, %r7103; - shr.u16 %rs1040, %rs1039, 8; - shr.u16 %rs1038, %rs1037, 8; - @%p304 bra $L__BB1_432; - - ld.local.u32 %rd3830, [%rd1+32]; - shl.b64 %rd3831, %rd3830, 8; - mov.b64 {%r7105, %r7106}, %rd3831; - mov.b32 {%rs1046, %rs3888}, %r7106; - mov.b32 {%rs1042, %rs1044}, %r7105; - shr.u16 %rs1045, %rs1044, 8; - shr.u16 %rs1043, %rs1042, 8; - @%p304 bra $L__BB1_432; - - ld.local.u32 %rd3832, [%rd1+36]; - shl.b64 %rd3833, %rd3832, 8; - mov.b64 {%r7107, %r7108}, %rd3833; - mov.b32 {%rs1051, %rs3889}, %r7108; - mov.b32 {%rs1047, %rs1049}, %r7107; - shr.u16 %rs1050, %rs1049, 8; - shr.u16 %rs1048, %rs1047, 8; - @%p304 bra $L__BB1_432; - - ld.local.u32 %rd3834, [%rd1+40]; - shl.b64 %rd3835, %rd3834, 8; - mov.b64 {%r7109, %r7110}, %rd3835; - mov.b32 {%rs1056, %rs3890}, %r7110; - mov.b32 {%rs1052, %rs1054}, %r7109; - shr.u16 %rs1055, %rs1054, 8; - shr.u16 %rs1053, %rs1052, 8; - @%p304 bra $L__BB1_432; - - ld.local.u32 %rd3836, [%rd1+44]; - shl.b64 %rd3837, %rd3836, 8; - mov.b64 {%r7111, %r7112}, %rd3837; - mov.b32 {%rs1061, %rs3891}, %r7112; - mov.b32 {%rs1057, %rs1059}, %r7111; - shr.u16 %rs1060, %rs1059, 8; - shr.u16 %rs1058, %rs1057, 8; - @%p304 bra $L__BB1_432; - - ld.local.u32 %rd3838, [%rd1+48]; - shl.b64 %rd3839, %rd3838, 8; - mov.b64 {%r7113, %r7114}, %rd3839; - mov.b32 {%rs1066, %rs3892}, %r7114; - mov.b32 {%rs1062, %rs1064}, %r7113; - shr.u16 %rs1065, %rs1064, 8; - shr.u16 %rs1063, %rs1062, 8; - @%p304 bra $L__BB1_432; - - ld.local.u32 %rd3840, [%rd1+52]; - shl.b64 %rd3841, %rd3840, 8; - mov.b64 {%r7115, %r7116}, %rd3841; - mov.b32 {%rs1071, %rs3893}, %r7116; - mov.b32 {%rs1067, %rs1069}, %r7115; - shr.u16 %rs1070, %rs1069, 8; - shr.u16 %rs1068, %rs1067, 8; - @%p304 bra $L__BB1_432; - - ld.local.u32 %rd3842, [%rd1+56]; - shl.b64 %rd3843, %rd3842, 8; - 
mov.b64 {%r7117, %r7118}, %rd3843; - mov.b32 {%rs1076, %rs3894}, %r7118; - mov.b32 {%rs1072, %rs1074}, %r7117; - shr.u16 %rs1075, %rs1074, 8; - shr.u16 %rs1073, %rs1072, 8; - @%p304 bra $L__BB1_432; - - ld.local.u32 %rd3844, [%rd1+60]; - shl.b64 %rd3845, %rd3844, 8; - mov.b64 {%r7119, %r7120}, %rd3845; - mov.b32 {%rs1081, %rs3895}, %r7120; - mov.b32 {%rs1077, %rs1079}, %r7119; - shr.u16 %rs1080, %rs1079, 8; - shr.u16 %rs1078, %rs1077, 8; - @%p304 bra $L__BB1_432; - - ld.local.u32 %rd3846, [%rd1+64]; - shl.b64 %rd3847, %rd3846, 8; - mov.b64 {%r7121, %r7122}, %rd3847; - mov.b32 {%rs1086, %rs3896}, %r7122; - mov.b32 {%rs1082, %rs1084}, %r7121; - shr.u16 %rs1085, %rs1084, 8; - shr.u16 %rs1083, %rs1082, 8; - @%p304 bra $L__BB1_432; - - ld.local.u32 %rd3848, [%rd1+68]; - shl.b64 %rd3849, %rd3848, 8; - mov.b64 {%r7123, %r7124}, %rd3849; - mov.b32 {%rs1091, %rs3897}, %r7124; - mov.b32 {%rs1087, %rs1089}, %r7123; - shr.u16 %rs1090, %rs1089, 8; - shr.u16 %rs1088, %rs1087, 8; - @%p304 bra $L__BB1_432; - - ld.local.u32 %rd3850, [%rd1+72]; - shl.b64 %rd3851, %rd3850, 8; - mov.b64 {%r7125, %r7126}, %rd3851; - mov.b32 {%rs1096, %rs3898}, %r7126; - mov.b32 {%rs1092, %rs1094}, %r7125; - shr.u16 %rs1095, %rs1094, 8; - shr.u16 %rs1093, %rs1092, 8; - @%p304 bra $L__BB1_432; - - ld.local.u32 %rd3852, [%rd1+76]; - shl.b64 %rd3853, %rd3852, 8; - mov.b64 {%r7127, %r7128}, %rd3853; - mov.b32 {%rs1101, %rs3899}, %r7128; - mov.b32 {%rs1097, %rs1099}, %r7127; - shr.u16 %rs1100, %rs1099, 8; - shr.u16 %rs1098, %rs1097, 8; - @%p304 bra $L__BB1_432; - - shl.b64 %rd3854, %rd913, 11; - mov.b64 {%r7129, %r7130}, %rd3854; - mov.b32 {%rs1106, %rs3900}, %r7130; - mov.b32 {%rs1102, %rs1104}, %r7129; - shr.u16 %rs1103, %rs1102, 8; - mov.pred %p318, -1; - @%p318 bra $L__BB1_433; - bra.uni $L__BB1_432; - -$L__BB1_433: - shl.b16 %rs3901, %rs1104, 8; - or.b16 %rs3902, %rs1103, %rs3901; - shl.b16 %rs3903, %rs1106, 8; - mov.b32 %r64, {%rs3902, %rs3903}; - shl.b16 %rs3904, %rs1099, 8; - or.b16 %rs3905, %rs1098, 
%rs3904; - shl.b16 %rs3906, %rs1101, 8; - or.b16 %rs3907, %rs1100, %rs3906; - mov.b32 %r65, {%rs3905, %rs3907}; - shl.b16 %rs3908, %rs1094, 8; - or.b16 %rs3909, %rs1093, %rs3908; - shl.b16 %rs3910, %rs1096, 8; - or.b16 %rs3911, %rs1095, %rs3910; - mov.b32 %r66, {%rs3909, %rs3911}; - shl.b16 %rs3912, %rs1089, 8; - or.b16 %rs3913, %rs1088, %rs3912; - shl.b16 %rs3914, %rs1091, 8; - or.b16 %rs3915, %rs1090, %rs3914; - mov.b32 %r67, {%rs3913, %rs3915}; - shl.b16 %rs3916, %rs1084, 8; - or.b16 %rs3917, %rs1083, %rs3916; - shl.b16 %rs3918, %rs1086, 8; - or.b16 %rs3919, %rs1085, %rs3918; - mov.b32 %r68, {%rs3917, %rs3919}; - shl.b16 %rs3920, %rs1079, 8; - or.b16 %rs3921, %rs1078, %rs3920; - shl.b16 %rs3922, %rs1081, 8; - or.b16 %rs3923, %rs1080, %rs3922; - mov.b32 %r69, {%rs3921, %rs3923}; - shl.b16 %rs3924, %rs1074, 8; - or.b16 %rs3925, %rs1073, %rs3924; - shl.b16 %rs3926, %rs1076, 8; - or.b16 %rs3927, %rs1075, %rs3926; - mov.b32 %r70, {%rs3925, %rs3927}; - shl.b16 %rs3928, %rs1069, 8; - or.b16 %rs3929, %rs1068, %rs3928; - shl.b16 %rs3930, %rs1071, 8; - or.b16 %rs3931, %rs1070, %rs3930; - mov.b32 %r71, {%rs3929, %rs3931}; - shl.b16 %rs3932, %rs1064, 8; - or.b16 %rs3933, %rs1063, %rs3932; - shl.b16 %rs3934, %rs1066, 8; - or.b16 %rs3935, %rs1065, %rs3934; - mov.b32 %r72, {%rs3933, %rs3935}; - shl.b16 %rs3936, %rs1059, 8; - or.b16 %rs3937, %rs1058, %rs3936; - shl.b16 %rs3938, %rs1061, 8; - or.b16 %rs3939, %rs1060, %rs3938; - mov.b32 %r73, {%rs3937, %rs3939}; - shl.b16 %rs3940, %rs1054, 8; - or.b16 %rs3941, %rs1053, %rs3940; - shl.b16 %rs3942, %rs1056, 8; - or.b16 %rs3943, %rs1055, %rs3942; - mov.b32 %r74, {%rs3941, %rs3943}; - shl.b16 %rs3944, %rs1049, 8; - or.b16 %rs3945, %rs1048, %rs3944; - shl.b16 %rs3946, %rs1051, 8; - or.b16 %rs3947, %rs1050, %rs3946; - mov.b32 %r75, {%rs3945, %rs3947}; - shl.b16 %rs3948, %rs1044, 8; - or.b16 %rs3949, %rs1043, %rs3948; - shl.b16 %rs3950, %rs1046, 8; - or.b16 %rs3951, %rs1045, %rs3950; - mov.b32 %r76, {%rs3949, %rs3951}; - shl.b16 
%rs3952, %rs1039, 8; - or.b16 %rs3953, %rs1038, %rs3952; - shl.b16 %rs3954, %rs1041, 8; - or.b16 %rs3955, %rs1040, %rs3954; - mov.b32 %r77, {%rs3953, %rs3955}; - shl.b16 %rs3956, %rs1034, 8; - or.b16 %rs3957, %rs1033, %rs3956; - shl.b16 %rs3958, %rs1036, 8; - or.b16 %rs3959, %rs1035, %rs3958; - mov.b32 %r78, {%rs3957, %rs3959}; - mov.u32 %r9125, -1043882854; - mov.u32 %r9122, %r9121; - @%p304 bra $L__BB1_435; - - add.s32 %r7136, %r78, -1; - shf.l.wrap.b32 %r7137, %r7136, %r7136, 3; - not.b32 %r7138, %r7137; - and.b32 %r7139, %r7137, -271733879; - and.b32 %r7140, %r7138, -1732584194; - or.b32 %r7141, %r7140, %r7139; - add.s32 %r7142, %r7141, %r77; - add.s32 %r7143, %r7142, 271733878; - shf.l.wrap.b32 %r7144, %r7143, %r7143, 7; - not.b32 %r7145, %r7144; - and.b32 %r7146, %r7144, %r7137; - and.b32 %r7147, %r7145, -271733879; - or.b32 %r7148, %r7147, %r7146; - add.s32 %r7149, %r7148, %r76; - add.s32 %r7150, %r7149, -1732584194; - shf.l.wrap.b32 %r7151, %r7150, %r7150, 11; - and.b32 %r7152, %r7151, %r7144; - not.b32 %r7153, %r7151; - and.b32 %r7154, %r7137, %r7153; - or.b32 %r7155, %r7154, %r7152; - add.s32 %r7156, %r7155, %r75; - add.s32 %r7157, %r7156, -271733879; - shf.l.wrap.b32 %r7158, %r7157, %r7157, 19; - and.b32 %r7159, %r7151, %r7158; - not.b32 %r7160, %r7158; - and.b32 %r7161, %r7144, %r7160; - or.b32 %r7162, %r7161, %r7159; - add.s32 %r7163, %r7162, %r7137; - add.s32 %r7164, %r7163, %r74; - shf.l.wrap.b32 %r7165, %r7164, %r7164, 3; - and.b32 %r7166, %r7165, %r7158; - not.b32 %r7167, %r7165; - and.b32 %r7168, %r7151, %r7167; - or.b32 %r7169, %r7168, %r7166; - add.s32 %r7170, %r7169, %r7144; - add.s32 %r7171, %r7170, %r73; - shf.l.wrap.b32 %r7172, %r7171, %r7171, 7; - and.b32 %r7173, %r7172, %r7165; - not.b32 %r7174, %r7172; - and.b32 %r7175, %r7158, %r7174; - or.b32 %r7176, %r7175, %r7173; - add.s32 %r7177, %r7176, %r7151; - add.s32 %r7178, %r7177, %r72; - shf.l.wrap.b32 %r7179, %r7178, %r7178, 11; - and.b32 %r7180, %r7179, %r7172; - not.b32 %r7181, %r7179; - 
and.b32 %r7182, %r7165, %r7181; - or.b32 %r7183, %r7182, %r7180; - add.s32 %r7184, %r7183, %r7158; - add.s32 %r7185, %r7184, %r71; - shf.l.wrap.b32 %r7186, %r7185, %r7185, 19; - and.b32 %r7187, %r7179, %r7186; - not.b32 %r7188, %r7186; - and.b32 %r7189, %r7172, %r7188; - or.b32 %r7190, %r7189, %r7187; - add.s32 %r7191, %r7190, %r7165; - add.s32 %r7192, %r7191, %r70; - shf.l.wrap.b32 %r7193, %r7192, %r7192, 3; - and.b32 %r7194, %r7193, %r7186; - not.b32 %r7195, %r7193; - and.b32 %r7196, %r7179, %r7195; - or.b32 %r7197, %r7196, %r7194; - add.s32 %r7198, %r7197, %r7172; - add.s32 %r7199, %r7198, %r69; - shf.l.wrap.b32 %r7200, %r7199, %r7199, 7; - and.b32 %r7201, %r7200, %r7193; - not.b32 %r7202, %r7200; - and.b32 %r7203, %r7186, %r7202; - or.b32 %r7204, %r7203, %r7201; - add.s32 %r7205, %r7204, %r7179; - add.s32 %r7206, %r7205, %r68; - shf.l.wrap.b32 %r7207, %r7206, %r7206, 11; - and.b32 %r7208, %r7207, %r7200; - not.b32 %r7209, %r7207; - and.b32 %r7210, %r7193, %r7209; - or.b32 %r7211, %r7210, %r7208; - add.s32 %r7212, %r7211, %r7186; - add.s32 %r7213, %r7212, %r67; - shf.l.wrap.b32 %r7214, %r7213, %r7213, 19; - and.b32 %r7215, %r7207, %r7214; - not.b32 %r7216, %r7214; - and.b32 %r7217, %r7200, %r7216; - or.b32 %r7218, %r7217, %r7215; - add.s32 %r7219, %r7218, %r7193; - add.s32 %r7220, %r7219, %r66; - shf.l.wrap.b32 %r7221, %r7220, %r7220, 3; - and.b32 %r7222, %r7221, %r7214; - not.b32 %r7223, %r7221; - and.b32 %r7224, %r7207, %r7223; - or.b32 %r7225, %r7224, %r7222; - add.s32 %r7226, %r7225, %r7200; - add.s32 %r7227, %r7226, %r65; - shf.l.wrap.b32 %r9122, %r7227, %r7227, 7; - and.b32 %r7228, %r9122, %r7221; - not.b32 %r7229, %r9122; - and.b32 %r7230, %r7214, %r7229; - or.b32 %r7231, %r7230, %r7228; - add.s32 %r7232, %r7231, %r7207; - add.s32 %r7233, %r7232, %r64; - shf.l.wrap.b32 %r9123, %r7233, %r7233, 11; - and.b32 %r9121, %r9123, %r9122; - not.b32 %r7234, %r9123; - and.b32 %r7235, %r7221, %r7234; - or.b32 %r7236, %r7235, %r9121; - add.s32 %r7237, %r7236, %r7214; 
- shf.l.wrap.b32 %r9124, %r7237, %r7237, 19; - add.s32 %r9125, %r7221, 1518500249; - -$L__BB1_435: - or.b32 %r7238, %r9123, %r9122; - and.b32 %r7239, %r7238, %r9124; - or.b32 %r7240, %r7239, %r9121; - add.s32 %r7241, %r9125, %r7240; - add.s32 %r7242, %r7241, %r78; - shf.l.wrap.b32 %r7243, %r7242, %r7242, 3; - or.b32 %r7244, %r9124, %r9123; - and.b32 %r7245, %r7243, %r7244; - and.b32 %r7246, %r9124, %r9123; - or.b32 %r7247, %r7245, %r7246; - add.s32 %r7248, %r9122, %r74; - add.s32 %r7249, %r7248, %r7247; - add.s32 %r7250, %r7249, 1518500249; - shf.l.wrap.b32 %r7251, %r7250, %r7250, 5; - or.b32 %r7252, %r7243, %r9124; - and.b32 %r7253, %r7251, %r7252; - and.b32 %r7254, %r7243, %r9124; - or.b32 %r7255, %r7253, %r7254; - add.s32 %r7256, %r9123, %r70; - add.s32 %r7257, %r7256, %r7255; - add.s32 %r7258, %r7257, 1518500249; - shf.l.wrap.b32 %r7259, %r7258, %r7258, 9; - or.b32 %r7260, %r7251, %r7243; - and.b32 %r7261, %r7259, %r7260; - and.b32 %r7262, %r7251, %r7243; - or.b32 %r7263, %r7261, %r7262; - add.s32 %r7264, %r9124, %r66; - add.s32 %r7265, %r7264, %r7263; - add.s32 %r7266, %r7265, 1518500249; - shf.l.wrap.b32 %r7267, %r7266, %r7266, 13; - or.b32 %r7268, %r7259, %r7251; - and.b32 %r7269, %r7267, %r7268; - and.b32 %r7270, %r7259, %r7251; - or.b32 %r7271, %r7269, %r7270; - add.s32 %r7272, %r7243, %r77; - add.s32 %r7273, %r7272, %r7271; - add.s32 %r7274, %r7273, 1518500249; - shf.l.wrap.b32 %r7275, %r7274, %r7274, 3; - or.b32 %r7276, %r7267, %r7259; - and.b32 %r7277, %r7275, %r7276; - and.b32 %r7278, %r7267, %r7259; - or.b32 %r7279, %r7277, %r7278; - add.s32 %r7280, %r73, %r7251; - add.s32 %r7281, %r7280, %r7279; - add.s32 %r7282, %r7281, 1518500249; - shf.l.wrap.b32 %r7283, %r7282, %r7282, 5; - or.b32 %r7284, %r7275, %r7267; - and.b32 %r7285, %r7283, %r7284; - and.b32 %r7286, %r7275, %r7267; - or.b32 %r7287, %r7285, %r7286; - add.s32 %r7288, %r69, %r7259; - add.s32 %r7289, %r7288, %r7287; - add.s32 %r7290, %r7289, 1518500249; - shf.l.wrap.b32 %r7291, %r7290, %r7290, 
9; - or.b32 %r7292, %r7283, %r7275; - and.b32 %r7293, %r7291, %r7292; - and.b32 %r7294, %r7283, %r7275; - or.b32 %r7295, %r7293, %r7294; - add.s32 %r7296, %r65, %r7267; - add.s32 %r7297, %r7296, %r7295; - add.s32 %r7298, %r7297, 1518500249; - shf.l.wrap.b32 %r7299, %r7298, %r7298, 13; - or.b32 %r7300, %r7291, %r7283; - and.b32 %r7301, %r7299, %r7300; - and.b32 %r7302, %r7291, %r7283; - or.b32 %r7303, %r7301, %r7302; - add.s32 %r7304, %r76, %r7275; - add.s32 %r7305, %r7304, %r7303; - add.s32 %r7306, %r7305, 1518500249; - shf.l.wrap.b32 %r7307, %r7306, %r7306, 3; - or.b32 %r7308, %r7299, %r7291; - and.b32 %r7309, %r7307, %r7308; - and.b32 %r7310, %r7299, %r7291; - or.b32 %r7311, %r7309, %r7310; - add.s32 %r7312, %r72, %r7283; - add.s32 %r7313, %r7312, %r7311; - add.s32 %r7314, %r7313, 1518500249; - shf.l.wrap.b32 %r7315, %r7314, %r7314, 5; - or.b32 %r7316, %r7307, %r7299; - and.b32 %r7317, %r7315, %r7316; - and.b32 %r7318, %r7307, %r7299; - or.b32 %r7319, %r7317, %r7318; - add.s32 %r7320, %r68, %r7291; - add.s32 %r7321, %r7320, %r7319; - add.s32 %r7322, %r7321, 1518500249; - shf.l.wrap.b32 %r7323, %r7322, %r7322, 9; - or.b32 %r7324, %r7315, %r7307; - and.b32 %r7325, %r7323, %r7324; - and.b32 %r7326, %r7315, %r7307; - or.b32 %r7327, %r7325, %r7326; - add.s32 %r7328, %r64, %r7299; - add.s32 %r7329, %r7328, %r7327; - add.s32 %r7330, %r7329, 1518500249; - shf.l.wrap.b32 %r7331, %r7330, %r7330, 13; - or.b32 %r7332, %r7323, %r7315; - and.b32 %r7333, %r7331, %r7332; - and.b32 %r7334, %r7323, %r7315; - or.b32 %r7335, %r7333, %r7334; - add.s32 %r7336, %r75, %r7307; - add.s32 %r7337, %r7336, %r7335; - add.s32 %r7338, %r7337, 1518500249; - shf.l.wrap.b32 %r9129, %r7338, %r7338, 3; - or.b32 %r7339, %r7331, %r7323; - and.b32 %r7340, %r9129, %r7339; - and.b32 %r7341, %r7331, %r7323; - or.b32 %r7342, %r7340, %r7341; - add.s32 %r7343, %r71, %r7315; - add.s32 %r7344, %r7343, %r7342; - add.s32 %r7345, %r7344, 1518500249; - shf.l.wrap.b32 %r9126, %r7345, %r7345, 5; - or.b32 %r7346, 
%r9129, %r7331; - and.b32 %r7347, %r9126, %r7346; - and.b32 %r7348, %r9129, %r7331; - or.b32 %r7349, %r7347, %r7348; - add.s32 %r7350, %r67, %r7323; - add.s32 %r7351, %r7350, %r7349; - add.s32 %r7352, %r7351, 1518500249; - shf.l.wrap.b32 %r9127, %r7352, %r7352, 9; - or.b32 %r7353, %r9126, %r9129; - and.b32 %r7354, %r9127, %r7353; - and.b32 %r7355, %r9126, %r9129; - or.b32 %r7356, %r7354, %r7355; - add.s32 %r7357, %r7331, %r7356; - add.s32 %r7358, %r7357, 1518500249; - shf.l.wrap.b32 %r9128, %r7358, %r7358, 13; - @%p304 bra $L__BB1_437; - - xor.b32 %r7359, %r9127, %r9128; - xor.b32 %r7360, %r7359, %r9126; - add.s32 %r7361, %r9129, %r7360; - add.s32 %r7362, %r7361, %r78; - add.s32 %r7363, %r7362, 1859775393; - shf.l.wrap.b32 %r7364, %r7363, %r7363, 3; - xor.b32 %r7365, %r7364, %r7359; - add.s32 %r7366, %r9126, %r7365; - add.s32 %r7367, %r7366, %r70; - add.s32 %r7368, %r7367, 1859775393; - shf.l.wrap.b32 %r7369, %r7368, %r7368, 9; - xor.b32 %r7370, %r7364, %r9128; - xor.b32 %r7371, %r7370, %r7369; - add.s32 %r7372, %r9127, %r74; - add.s32 %r7373, %r7372, %r7371; - add.s32 %r7374, %r7373, 1859775393; - shf.l.wrap.b32 %r7375, %r7374, %r7374, 11; - xor.b32 %r7376, %r7369, %r7364; - xor.b32 %r7377, %r7376, %r7375; - add.s32 %r7378, %r9128, %r7377; - add.s32 %r7379, %r7378, %r66; - add.s32 %r7380, %r7379, 1859775393; - shf.l.wrap.b32 %r7381, %r7380, %r7380, 15; - xor.b32 %r7382, %r7375, %r7381; - xor.b32 %r7383, %r7382, %r7369; - add.s32 %r7384, %r7364, %r7383; - add.s32 %r7385, %r7384, %r76; - add.s32 %r7386, %r7385, 1859775393; - shf.l.wrap.b32 %r7387, %r7386, %r7386, 3; - xor.b32 %r7388, %r7387, %r7382; - add.s32 %r7389, %r7369, %r7388; - add.s32 %r7390, %r7389, %r68; - add.s32 %r7391, %r7390, 1859775393; - shf.l.wrap.b32 %r7392, %r7391, %r7391, 9; - xor.b32 %r7393, %r7387, %r7381; - xor.b32 %r7394, %r7393, %r7392; - add.s32 %r7395, %r7375, %r72; - add.s32 %r7396, %r7395, %r7394; - add.s32 %r7397, %r7396, 1859775393; - shf.l.wrap.b32 %r7398, %r7397, %r7397, 11; - 
xor.b32 %r7399, %r7392, %r7387; - xor.b32 %r7400, %r7399, %r7398; - add.s32 %r7401, %r7381, %r7400; - add.s32 %r7402, %r7401, %r64; - add.s32 %r7403, %r7402, 1859775393; - shf.l.wrap.b32 %r7404, %r7403, %r7403, 15; - xor.b32 %r7405, %r7398, %r7404; - xor.b32 %r7406, %r7405, %r7392; - add.s32 %r7407, %r7387, %r7406; - add.s32 %r7408, %r7407, %r77; - add.s32 %r7409, %r7408, 1859775393; - shf.l.wrap.b32 %r7410, %r7409, %r7409, 3; - xor.b32 %r7411, %r7410, %r7405; - add.s32 %r7412, %r7392, %r7411; - add.s32 %r7413, %r7412, %r69; - add.s32 %r7414, %r7413, 1859775393; - shf.l.wrap.b32 %r7415, %r7414, %r7414, 9; - xor.b32 %r7416, %r7410, %r7404; - xor.b32 %r7417, %r7416, %r7415; - add.s32 %r7418, %r7398, %r73; - add.s32 %r7419, %r7418, %r7417; - add.s32 %r7420, %r7419, 1859775393; - shf.l.wrap.b32 %r7421, %r7420, %r7420, 11; - xor.b32 %r7422, %r7415, %r7410; - xor.b32 %r7423, %r7422, %r7421; - add.s32 %r7424, %r7404, %r7423; - add.s32 %r7425, %r7424, %r65; - add.s32 %r7426, %r7425, 1859775393; - shf.l.wrap.b32 %r7427, %r7426, %r7426, 15; - xor.b32 %r7428, %r7421, %r7427; - xor.b32 %r7429, %r7428, %r7415; - add.s32 %r7430, %r7410, %r7429; - add.s32 %r7431, %r7430, %r75; - add.s32 %r7432, %r7431, 1859775393; - shf.l.wrap.b32 %r9129, %r7432, %r7432, 3; - xor.b32 %r7433, %r9129, %r7428; - add.s32 %r7434, %r7415, %r7433; - add.s32 %r7435, %r7434, %r67; - add.s32 %r7436, %r7435, 1859775393; - shf.l.wrap.b32 %r9126, %r7436, %r7436, 9; - xor.b32 %r7437, %r9129, %r7427; - xor.b32 %r7438, %r7437, %r9126; - add.s32 %r7439, %r7421, %r71; - add.s32 %r7440, %r7439, %r7438; - add.s32 %r7441, %r7440, 1859775393; - shf.l.wrap.b32 %r9127, %r7441, %r7441, 11; - xor.b32 %r7442, %r9126, %r9129; - xor.b32 %r7443, %r7442, %r9127; - add.s32 %r7444, %r7427, %r7443; - add.s32 %r7445, %r7444, 1859775393; - shf.l.wrap.b32 %r9128, %r7445, %r7445, 15; - -$L__BB1_437: - add.s32 %r9151, %r9129, 1732584193; - add.s32 %r9150, %r9128, -271733879; - add.s32 %r9149, %r9127, -1732584194; - add.s32 %r9148, 
%r9126, 271733878; - bra.uni $L__BB1_468; - -$L__BB1_246: - st.local.u64 [%rd1+96], %rd749; - mov.u64 %rd2261, 1; - { // callseq 28, 0 - .reg .b32 temp_param_reg; - .param .b64 param0; - st.param.b64 [param0+0], %rd765; - .param .b64 param1; - st.param.b64 [param1+0], %rd764; - .param .b64 param2; - st.param.b64 [param2+0], %rd2261; - call.uni - _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE, - ( - param0, - param1, - param2 - ); - } // callseq 28 - -$L__BB1_248: - st.local.u8 [%rd1+104], %rs2770; - ld.local.u32 %r775, [%rd1+8]; - shr.u32 %r776, %r775, 24; - shr.u32 %r777, %r775, 8; - and.b32 %r778, %r777, 65280; - or.b32 %r779, %r778, %r776; - shl.b32 %r780, %r775, 24; - shl.b32 %r781, %r775, 8; - and.b32 %r782, %r781, 16711680; - or.b32 %r783, %r780, %r782; - or.b32 %r784, %r783, %r779; - shr.u32 %r785, %r784, 8; - shr.u32 %r786, %r783, 16; - ld.local.u32 %r787, [%rd1+12]; - shr.u32 %r788, %r787, 24; - shr.u32 %r789, %r787, 8; - and.b32 %r790, %r789, 65280; - or.b32 %r791, %r790, %r788; - shl.b32 %r792, %r787, 24; - shl.b32 %r793, %r787, 8; - and.b32 %r794, %r793, 16711680; - or.b32 %r795, %r792, %r794; - or.b32 %r796, %r795, %r791; - shr.u32 %r797, %r796, 8; - shr.u32 %r798, %r795, 16; - ld.local.u32 %r799, [%rd1+16]; - shr.u32 %r800, %r799, 24; - shr.u32 %r801, %r799, 8; - and.b32 %r802, %r801, 65280; - or.b32 %r803, %r802, %r800; - shl.b32 %r804, %r799, 24; - shl.b32 %r805, %r799, 8; - and.b32 %r806, %r805, 16711680; - or.b32 %r807, %r804, %r806; - or.b32 %r808, %r807, %r803; - shr.u32 %r809, %r808, 8; - shr.u32 %r810, %r807, 16; - ld.local.u32 %r811, [%rd1+20]; - shr.u32 %r812, %r811, 24; - shr.u32 %r813, %r811, 8; - and.b32 %r814, %r813, 65280; - or.b32 %r815, %r814, %r812; - shl.b32 %r816, %r811, 24; - shl.b32 %r817, %r811, 8; - and.b32 %r818, %r817, 16711680; - or.b32 %r819, %r816, %r818; - or.b32 %r820, %r819, %r815; - shr.u32 %r821, %r820, 8; - shr.u32 %r822, %r819, 16; - ld.local.u32 %r823, [%rd1+24]; - shr.u32 %r824, %r823, 24; - shr.u32 %r825, 
%r823, 8; - and.b32 %r826, %r825, 65280; - or.b32 %r827, %r826, %r824; - shl.b32 %r828, %r823, 24; - shl.b32 %r829, %r823, 8; - and.b32 %r830, %r829, 16711680; - or.b32 %r831, %r828, %r830; - or.b32 %r832, %r831, %r827; - shr.u32 %r833, %r832, 8; - shr.u32 %r834, %r831, 16; - ld.local.u32 %r835, [%rd1+28]; - shr.u32 %r836, %r835, 24; - shr.u32 %r837, %r835, 8; - and.b32 %r838, %r837, 65280; - or.b32 %r839, %r838, %r836; - shl.b32 %r840, %r835, 24; - shl.b32 %r841, %r835, 8; - and.b32 %r842, %r841, 16711680; - or.b32 %r843, %r840, %r842; - or.b32 %r844, %r843, %r839; - shr.u32 %r845, %r844, 8; - shr.u32 %r846, %r843, 16; - ld.local.u32 %r847, [%rd1+32]; - shr.u32 %r848, %r847, 24; - shr.u32 %r849, %r847, 8; - and.b32 %r850, %r849, 65280; - or.b32 %r851, %r850, %r848; - shl.b32 %r852, %r847, 24; - shl.b32 %r853, %r847, 8; - and.b32 %r854, %r853, 16711680; - or.b32 %r855, %r852, %r854; - or.b32 %r856, %r855, %r851; - shr.u32 %r857, %r856, 8; - shr.u32 %r858, %r855, 16; - mov.u16 %rs2852, 28; - st.local.u16 [%rd12], %rs2852; - cvt.u16.u32 %rs2853, %r785; - cvt.u16.u32 %rs2854, %r776; - cvt.u16.u32 %rs2855, %r777; - and.b16 %rs2856, %rs2855, -256; - or.b16 %rs2857, %rs2856, %rs2854; - st.local.v2.u8 [%rd12+2], {%rs2857, %rs2853}; - cvt.u16.u32 %rs2858, %r786; - cvt.u16.u32 %rs2859, %r775; - and.b16 %rs2860, %rs2859, 255; - st.local.v2.u8 [%rd12+4], {%rs2858, %rs2860}; - cvt.u16.u32 %rs2861, %r797; - cvt.u16.u32 %rs2862, %r788; - cvt.u16.u32 %rs2863, %r789; - and.b16 %rs2864, %rs2863, -256; - or.b16 %rs2865, %rs2864, %rs2862; - st.local.v2.u8 [%rd12+6], {%rs2865, %rs2861}; - cvt.u16.u32 %rs2866, %r798; - cvt.u16.u32 %rs2867, %r787; - and.b16 %rs2868, %rs2867, 255; - st.local.v2.u8 [%rd12+8], {%rs2866, %rs2868}; - cvt.u16.u32 %rs2869, %r809; - cvt.u16.u32 %rs2870, %r800; - cvt.u16.u32 %rs2871, %r801; - and.b16 %rs2872, %rs2871, -256; - or.b16 %rs2873, %rs2872, %rs2870; - st.local.v2.u8 [%rd12+10], {%rs2873, %rs2869}; - cvt.u16.u32 %rs2874, %r810; - cvt.u16.u32 %rs2875, 
%r799; - and.b16 %rs2876, %rs2875, 255; - st.local.v2.u8 [%rd12+12], {%rs2874, %rs2876}; - cvt.u16.u32 %rs2877, %r821; - cvt.u16.u32 %rs2878, %r812; - cvt.u16.u32 %rs2879, %r813; - and.b16 %rs2880, %rs2879, -256; - or.b16 %rs2881, %rs2880, %rs2878; - st.local.v2.u8 [%rd12+14], {%rs2881, %rs2877}; - cvt.u16.u32 %rs2882, %r822; - cvt.u16.u32 %rs2883, %r811; - and.b16 %rs2884, %rs2883, 255; - st.local.v2.u8 [%rd12+16], {%rs2882, %rs2884}; - cvt.u16.u32 %rs2885, %r833; - cvt.u16.u32 %rs2886, %r824; - cvt.u16.u32 %rs2887, %r825; - and.b16 %rs2888, %rs2887, -256; - or.b16 %rs2889, %rs2888, %rs2886; - st.local.v2.u8 [%rd12+18], {%rs2889, %rs2885}; - cvt.u16.u32 %rs2890, %r834; - cvt.u16.u32 %rs2891, %r823; - and.b16 %rs2892, %rs2891, 255; - st.local.v2.u8 [%rd12+20], {%rs2890, %rs2892}; - cvt.u16.u32 %rs2893, %r845; - cvt.u16.u32 %rs2894, %r836; - cvt.u16.u32 %rs2895, %r837; - and.b16 %rs2896, %rs2895, -256; - or.b16 %rs2897, %rs2896, %rs2894; - st.local.v2.u8 [%rd12+22], {%rs2897, %rs2893}; - cvt.u16.u32 %rs2898, %r846; - cvt.u16.u32 %rs2899, %r835; - and.b16 %rs2900, %rs2899, 255; - st.local.v2.u8 [%rd12+24], {%rs2898, %rs2900}; - cvt.u16.u32 %rs2901, %r857; - cvt.u16.u32 %rs2902, %r848; - cvt.u16.u32 %rs2903, %r849; - and.b16 %rs2904, %rs2903, -256; - or.b16 %rs2905, %rs2904, %rs2902; - st.local.v2.u8 [%rd12+26], {%rs2905, %rs2901}; - cvt.u16.u32 %rs2906, %r858; - cvt.u16.u32 %rs2907, %r847; - and.b16 %rs2908, %rs2907, 255; - st.local.v2.u8 [%rd12+28], {%rs2906, %rs2908}; - st.local.v2.u8 [%rd12+30], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+32], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+34], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+36], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+38], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+40], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+42], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+44], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+46], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+48], {%rs2770, %rs2770}; - st.local.v2.u8 
[%rd12+50], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+52], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+54], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+56], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+58], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+60], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+62], {%rs2770, %rs2770}; - st.local.v2.u8 [%rd12+64], {%rs2770, %rs2770}; - bra.uni $L__BB1_549; - -$L__BB1_340: - st.local.u64 [%rd1+80], %rd853; - mov.pred %p241, 0; - mov.pred %p256, -1; - mov.u64 %rd4259, %rd4258; - -$L__BB1_341: - ld.local.u32 %rd3598, [%rd4259]; - shl.b64 %rd3599, %rd3598, 8; - mov.b64 {%r5363, %r5364}, %rd3599; - mov.b32 {%rs792, %rs3545}, %r5364; - mov.b32 {%rs788, %rs790}, %r5363; - shr.u16 %rs791, %rs790, 8; - shr.u16 %rs789, %rs788, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3600, [%rd4259+4]; - shl.b64 %rd3601, %rd3600, 8; - mov.b64 {%r5365, %r5366}, %rd3601; - mov.b32 {%rs797, %rs3546}, %r5366; - mov.b32 {%rs793, %rs795}, %r5365; - shr.u16 %rs796, %rs795, 8; - shr.u16 %rs794, %rs793, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3602, [%rd4259+8]; - shl.b64 %rd3603, %rd3602, 8; - mov.b64 {%r5367, %r5368}, %rd3603; - mov.b32 {%rs802, %rs3547}, %r5368; - mov.b32 {%rs798, %rs800}, %r5367; - shr.u16 %rs801, %rs800, 8; - shr.u16 %rs799, %rs798, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3604, [%rd4259+12]; - shl.b64 %rd3605, %rd3604, 8; - mov.b64 {%r5369, %r5370}, %rd3605; - mov.b32 {%rs807, %rs3548}, %r5370; - mov.b32 {%rs803, %rs805}, %r5369; - shr.u16 %rs806, %rs805, 8; - shr.u16 %rs804, %rs803, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3606, [%rd4259+16]; - shl.b64 %rd3607, %rd3606, 8; - mov.b64 {%r5371, %r5372}, %rd3607; - mov.b32 {%rs812, %rs3549}, %r5372; - mov.b32 {%rs808, %rs810}, %r5371; - shr.u16 %rs811, %rs810, 8; - shr.u16 %rs809, %rs808, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3608, [%rd4259+20]; - shl.b64 %rd3609, %rd3608, 8; - mov.b64 {%r5373, %r5374}, %rd3609; - mov.b32 {%rs817, %rs3550}, %r5374; - 
mov.b32 {%rs813, %rs815}, %r5373; - shr.u16 %rs816, %rs815, 8; - shr.u16 %rs814, %rs813, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3610, [%rd4259+24]; - shl.b64 %rd3611, %rd3610, 8; - mov.b64 {%r5375, %r5376}, %rd3611; - mov.b32 {%rs822, %rs3551}, %r5376; - mov.b32 {%rs818, %rs820}, %r5375; - shr.u16 %rs821, %rs820, 8; - shr.u16 %rs819, %rs818, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3612, [%rd4259+28]; - shl.b64 %rd3613, %rd3612, 8; - mov.b64 {%r5377, %r5378}, %rd3613; - mov.b32 {%rs827, %rs3552}, %r5378; - mov.b32 {%rs823, %rs825}, %r5377; - shr.u16 %rs826, %rs825, 8; - shr.u16 %rs824, %rs823, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3614, [%rd4259+32]; - shl.b64 %rd3615, %rd3614, 8; - mov.b64 {%r5379, %r5380}, %rd3615; - mov.b32 {%rs832, %rs3553}, %r5380; - mov.b32 {%rs828, %rs830}, %r5379; - shr.u16 %rs831, %rs830, 8; - shr.u16 %rs829, %rs828, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3616, [%rd4259+36]; - shl.b64 %rd3617, %rd3616, 8; - mov.b64 {%r5381, %r5382}, %rd3617; - mov.b32 {%rs837, %rs3554}, %r5382; - mov.b32 {%rs833, %rs835}, %r5381; - shr.u16 %rs836, %rs835, 8; - shr.u16 %rs834, %rs833, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3618, [%rd4259+40]; - shl.b64 %rd3619, %rd3618, 8; - mov.b64 {%r5383, %r5384}, %rd3619; - mov.b32 {%rs842, %rs3555}, %r5384; - mov.b32 {%rs838, %rs840}, %r5383; - shr.u16 %rs841, %rs840, 8; - shr.u16 %rs839, %rs838, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3620, [%rd4259+44]; - shl.b64 %rd3621, %rd3620, 8; - mov.b64 {%r5385, %r5386}, %rd3621; - mov.b32 {%rs847, %rs3556}, %r5386; - mov.b32 {%rs843, %rs845}, %r5385; - shr.u16 %rs846, %rs845, 8; - shr.u16 %rs844, %rs843, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3622, [%rd4259+48]; - shl.b64 %rd3623, %rd3622, 8; - mov.b64 {%r5387, %r5388}, %rd3623; - mov.b32 {%rs852, %rs3557}, %r5388; - mov.b32 {%rs848, %rs850}, %r5387; - shr.u16 %rs851, %rs850, 8; - shr.u16 %rs849, %rs848, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3624, 
[%rd4259+52]; - shl.b64 %rd3625, %rd3624, 8; - mov.b64 {%r5389, %r5390}, %rd3625; - mov.b32 {%rs857, %rs3558}, %r5390; - mov.b32 {%rs853, %rs855}, %r5389; - shr.u16 %rs856, %rs855, 8; - shr.u16 %rs854, %rs853, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3626, [%rd4259+56]; - shl.b64 %rd3627, %rd3626, 8; - mov.b64 {%r5391, %r5392}, %rd3627; - mov.b32 {%rs862, %rs3559}, %r5392; - mov.b32 {%rs858, %rs860}, %r5391; - shr.u16 %rs861, %rs860, 8; - shr.u16 %rs859, %rs858, 8; - @%p241 bra $L__BB1_357; - - ld.local.u32 %rd3628, [%rd4259+60]; - shl.b64 %rd3629, %rd3628, 8; - mov.b64 {%r5393, %r5394}, %rd3629; - mov.b32 {%rs867, %rs3560}, %r5394; - mov.b32 {%rs863, %rs865}, %r5393; - shr.u16 %rs866, %rs865, 8; - shr.u16 %rs864, %rs863, 8; - @%p256 bra $L__BB1_358; - bra.uni $L__BB1_357; - -$L__BB1_358: - add.s64 %rd4258, %rd4258, 64; - shl.b16 %rs3561, %rs860, 8; - or.b16 %rs3562, %rs859, %rs3561; - shl.b16 %rs3563, %rs862, 8; - or.b16 %rs3564, %rs861, %rs3563; - shl.b16 %rs3565, %rs865, 8; - or.b16 %rs3566, %rs864, %rs3565; - shl.b16 %rs3567, %rs867, 8; - or.b16 %rs3568, %rs866, %rs3567; - mov.b32 %r5395, {%rs3566, %rs3568}; - not.b32 %r5396, %r9107; - and.b32 %r5397, %r9105, %r5396; - and.b32 %r5398, %r9106, %r9107; - or.b32 %r5399, %r5397, %r5398; - add.s32 %r5400, %r9108, %r5399; - shl.b16 %rs3569, %rs790, 8; - or.b16 %rs3570, %rs789, %rs3569; - shl.b16 %rs3571, %rs792, 8; - or.b16 %rs3572, %rs791, %rs3571; - mov.b32 %r5401, {%rs3570, %rs3572}; - add.s32 %r5402, %r5400, %r5401; - add.s32 %r5403, %r5402, -680876936; - shf.l.wrap.b32 %r5404, %r5403, %r5403, 7; - add.s32 %r5405, %r5404, %r9107; - and.b32 %r5406, %r5405, %r9107; - not.b32 %r5407, %r5405; - and.b32 %r5408, %r9106, %r5407; - or.b32 %r5409, %r5408, %r5406; - shl.b16 %rs3573, %rs795, 8; - or.b16 %rs3574, %rs794, %rs3573; - shl.b16 %rs3575, %rs797, 8; - or.b16 %rs3576, %rs796, %rs3575; - mov.b32 %r5410, {%rs3574, %rs3576}; - add.s32 %r5411, %r9105, %r5410; - add.s32 %r5412, %r5411, %r5409; - add.s32 %r5413, 
%r5412, -389564586; - shf.l.wrap.b32 %r5414, %r5413, %r5413, 12; - add.s32 %r5415, %r5414, %r5405; - and.b32 %r5416, %r5415, %r5405; - not.b32 %r5417, %r5415; - and.b32 %r5418, %r9107, %r5417; - or.b32 %r5419, %r5418, %r5416; - shl.b16 %rs3577, %rs800, 8; - or.b16 %rs3578, %rs799, %rs3577; - shl.b16 %rs3579, %rs802, 8; - or.b16 %rs3580, %rs801, %rs3579; - mov.b32 %r5420, {%rs3578, %rs3580}; - add.s32 %r5421, %r9106, %r5420; - add.s32 %r5422, %r5421, %r5419; - add.s32 %r5423, %r5422, 606105819; - shf.l.wrap.b32 %r5424, %r5423, %r5423, 17; - add.s32 %r5425, %r5424, %r5415; - and.b32 %r5426, %r5425, %r5415; - not.b32 %r5427, %r5425; - and.b32 %r5428, %r5405, %r5427; - or.b32 %r5429, %r5428, %r5426; - shl.b16 %rs3581, %rs805, 8; - or.b16 %rs3582, %rs804, %rs3581; - shl.b16 %rs3583, %rs807, 8; - or.b16 %rs3584, %rs806, %rs3583; - mov.b32 %r5430, {%rs3582, %rs3584}; - add.s32 %r5431, %r9107, %r5430; - add.s32 %r5432, %r5431, %r5429; - add.s32 %r5433, %r5432, -1044525330; - shf.l.wrap.b32 %r5434, %r5433, %r5433, 22; - add.s32 %r5435, %r5434, %r5425; - and.b32 %r5436, %r5435, %r5425; - not.b32 %r5437, %r5435; - and.b32 %r5438, %r5415, %r5437; - or.b32 %r5439, %r5438, %r5436; - shl.b16 %rs3585, %rs810, 8; - or.b16 %rs3586, %rs809, %rs3585; - shl.b16 %rs3587, %rs812, 8; - or.b16 %rs3588, %rs811, %rs3587; - mov.b32 %r5440, {%rs3586, %rs3588}; - add.s32 %r5441, %r5405, %r5440; - add.s32 %r5442, %r5441, %r5439; - add.s32 %r5443, %r5442, -176418897; - shf.l.wrap.b32 %r5444, %r5443, %r5443, 7; - add.s32 %r5445, %r5444, %r5435; - and.b32 %r5446, %r5445, %r5435; - not.b32 %r5447, %r5445; - and.b32 %r5448, %r5425, %r5447; - or.b32 %r5449, %r5448, %r5446; - shl.b16 %rs3589, %rs815, 8; - or.b16 %rs3590, %rs814, %rs3589; - shl.b16 %rs3591, %rs817, 8; - or.b16 %rs3592, %rs816, %rs3591; - mov.b32 %r5450, {%rs3590, %rs3592}; - add.s32 %r5451, %r5450, %r5415; - add.s32 %r5452, %r5451, %r5449; - add.s32 %r5453, %r5452, 1200080426; - shf.l.wrap.b32 %r5454, %r5453, %r5453, 12; - add.s32 
%r5455, %r5454, %r5445; - and.b32 %r5456, %r5455, %r5445; - not.b32 %r5457, %r5455; - and.b32 %r5458, %r5435, %r5457; - or.b32 %r5459, %r5458, %r5456; - shl.b16 %rs3593, %rs820, 8; - or.b16 %rs3594, %rs819, %rs3593; - shl.b16 %rs3595, %rs822, 8; - or.b16 %rs3596, %rs821, %rs3595; - mov.b32 %r5460, {%rs3594, %rs3596}; - add.s32 %r5461, %r5460, %r5425; - add.s32 %r5462, %r5461, %r5459; - add.s32 %r5463, %r5462, -1473231341; - shf.l.wrap.b32 %r5464, %r5463, %r5463, 17; - add.s32 %r5465, %r5464, %r5455; - and.b32 %r5466, %r5465, %r5455; - not.b32 %r5467, %r5465; - and.b32 %r5468, %r5445, %r5467; - or.b32 %r5469, %r5468, %r5466; - shl.b16 %rs3597, %rs825, 8; - or.b16 %rs3598, %rs824, %rs3597; - shl.b16 %rs3599, %rs827, 8; - or.b16 %rs3600, %rs826, %rs3599; - mov.b32 %r5470, {%rs3598, %rs3600}; - add.s32 %r5471, %r5470, %r5435; - add.s32 %r5472, %r5471, %r5469; - add.s32 %r5473, %r5472, -45705983; - shf.l.wrap.b32 %r5474, %r5473, %r5473, 22; - add.s32 %r5475, %r5474, %r5465; - and.b32 %r5476, %r5475, %r5465; - not.b32 %r5477, %r5475; - and.b32 %r5478, %r5455, %r5477; - or.b32 %r5479, %r5478, %r5476; - shl.b16 %rs3601, %rs830, 8; - or.b16 %rs3602, %rs829, %rs3601; - shl.b16 %rs3603, %rs832, 8; - or.b16 %rs3604, %rs831, %rs3603; - mov.b32 %r5480, {%rs3602, %rs3604}; - add.s32 %r5481, %r5480, %r5445; - add.s32 %r5482, %r5481, %r5479; - add.s32 %r5483, %r5482, 1770035416; - shf.l.wrap.b32 %r5484, %r5483, %r5483, 7; - add.s32 %r5485, %r5484, %r5475; - and.b32 %r5486, %r5485, %r5475; - not.b32 %r5487, %r5485; - and.b32 %r5488, %r5465, %r5487; - or.b32 %r5489, %r5488, %r5486; - shl.b16 %rs3605, %rs835, 8; - or.b16 %rs3606, %rs834, %rs3605; - shl.b16 %rs3607, %rs837, 8; - or.b16 %rs3608, %rs836, %rs3607; - mov.b32 %r5490, {%rs3606, %rs3608}; - add.s32 %r5491, %r5490, %r5455; - add.s32 %r5492, %r5491, %r5489; - add.s32 %r5493, %r5492, -1958414417; - shf.l.wrap.b32 %r5494, %r5493, %r5493, 12; - add.s32 %r5495, %r5494, %r5485; - and.b32 %r5496, %r5495, %r5485; - not.b32 %r5497, 
%r5495; - and.b32 %r5498, %r5475, %r5497; - or.b32 %r5499, %r5498, %r5496; - shl.b16 %rs3609, %rs840, 8; - or.b16 %rs3610, %rs839, %rs3609; - shl.b16 %rs3611, %rs842, 8; - or.b16 %rs3612, %rs841, %rs3611; - mov.b32 %r5500, {%rs3610, %rs3612}; - add.s32 %r5501, %r5500, %r5465; - add.s32 %r5502, %r5501, %r5499; - add.s32 %r5503, %r5502, -42063; - shf.l.wrap.b32 %r5504, %r5503, %r5503, 17; - add.s32 %r5505, %r5504, %r5495; - and.b32 %r5506, %r5505, %r5495; - not.b32 %r5507, %r5505; - and.b32 %r5508, %r5485, %r5507; - or.b32 %r5509, %r5508, %r5506; - shl.b16 %rs3613, %rs845, 8; - or.b16 %rs3614, %rs844, %rs3613; - shl.b16 %rs3615, %rs847, 8; - or.b16 %rs3616, %rs846, %rs3615; - mov.b32 %r5510, {%rs3614, %rs3616}; - add.s32 %r5511, %r5510, %r5475; - add.s32 %r5512, %r5511, %r5509; - add.s32 %r5513, %r5512, -1990404162; - shf.l.wrap.b32 %r5514, %r5513, %r5513, 22; - add.s32 %r5515, %r5514, %r5505; - and.b32 %r5516, %r5515, %r5505; - not.b32 %r5517, %r5515; - and.b32 %r5518, %r5495, %r5517; - or.b32 %r5519, %r5518, %r5516; - shl.b16 %rs3617, %rs850, 8; - or.b16 %rs3618, %rs849, %rs3617; - shl.b16 %rs3619, %rs852, 8; - or.b16 %rs3620, %rs851, %rs3619; - mov.b32 %r5520, {%rs3618, %rs3620}; - add.s32 %r5521, %r5520, %r5485; - add.s32 %r5522, %r5521, %r5519; - add.s32 %r5523, %r5522, 1804603682; - shf.l.wrap.b32 %r5524, %r5523, %r5523, 7; - add.s32 %r5525, %r5524, %r5515; - and.b32 %r5526, %r5525, %r5515; - not.b32 %r5527, %r5525; - and.b32 %r5528, %r5505, %r5527; - or.b32 %r5529, %r5528, %r5526; - shl.b16 %rs3621, %rs855, 8; - or.b16 %rs3622, %rs854, %rs3621; - shl.b16 %rs3623, %rs857, 8; - or.b16 %rs3624, %rs856, %rs3623; - mov.b32 %r5530, {%rs3622, %rs3624}; - add.s32 %r5531, %r5530, %r5495; - add.s32 %r5532, %r5531, %r5529; - add.s32 %r5533, %r5532, -40341101; - shf.l.wrap.b32 %r5534, %r5533, %r5533, 12; - add.s32 %r5535, %r5534, %r5525; - mov.b32 %r5536, {%rs3562, %rs3564}; - and.b32 %r5537, %r5535, %r5525; - not.b32 %r5538, %r5535; - and.b32 %r5539, %r5515, %r5538; - 
or.b32 %r5540, %r5539, %r5537; - add.s32 %r5541, %r5536, %r5505; - add.s32 %r5542, %r5541, %r5540; - add.s32 %r5543, %r5542, -1502002290; - shf.l.wrap.b32 %r5544, %r5543, %r5543, 17; - add.s32 %r5545, %r5544, %r5535; - and.b32 %r5546, %r5545, %r5535; - not.b32 %r5547, %r5545; - and.b32 %r5548, %r5525, %r5547; - or.b32 %r5549, %r5548, %r5546; - add.s32 %r5550, %r5395, %r5515; - add.s32 %r5551, %r5550, %r5549; - add.s32 %r5552, %r5551, 1236535329; - shf.l.wrap.b32 %r5553, %r5552, %r5552, 22; - add.s32 %r5554, %r5553, %r5545; - and.b32 %r5555, %r5554, %r5535; - and.b32 %r5556, %r5545, %r5538; - or.b32 %r5557, %r5555, %r5556; - add.s32 %r5558, %r5410, %r5525; - add.s32 %r5559, %r5558, %r5557; - add.s32 %r5560, %r5559, -165796510; - shf.l.wrap.b32 %r5561, %r5560, %r5560, 5; - add.s32 %r5562, %r5561, %r5554; - and.b32 %r5563, %r5562, %r5545; - and.b32 %r5564, %r5554, %r5547; - or.b32 %r5565, %r5563, %r5564; - add.s32 %r5566, %r5460, %r5535; - add.s32 %r5567, %r5566, %r5565; - add.s32 %r5568, %r5567, -1069501632; - shf.l.wrap.b32 %r5569, %r5568, %r5568, 9; - add.s32 %r5570, %r5569, %r5562; - and.b32 %r5571, %r5570, %r5554; - not.b32 %r5572, %r5554; - and.b32 %r5573, %r5562, %r5572; - or.b32 %r5574, %r5571, %r5573; - add.s32 %r5575, %r5510, %r5545; - add.s32 %r5576, %r5575, %r5574; - add.s32 %r5577, %r5576, 643717713; - shf.l.wrap.b32 %r5578, %r5577, %r5577, 14; - add.s32 %r5579, %r5578, %r5570; - and.b32 %r5580, %r5579, %r5562; - not.b32 %r5581, %r5562; - and.b32 %r5582, %r5570, %r5581; - or.b32 %r5583, %r5580, %r5582; - add.s32 %r5584, %r5401, %r5554; - add.s32 %r5585, %r5584, %r5583; - add.s32 %r5586, %r5585, -373897302; - shf.l.wrap.b32 %r5587, %r5586, %r5586, 20; - add.s32 %r5588, %r5587, %r5579; - and.b32 %r5589, %r5588, %r5570; - not.b32 %r5590, %r5570; - and.b32 %r5591, %r5579, %r5590; - or.b32 %r5592, %r5589, %r5591; - add.s32 %r5593, %r5450, %r5562; - add.s32 %r5594, %r5593, %r5592; - add.s32 %r5595, %r5594, -701558691; - shf.l.wrap.b32 %r5596, %r5595, %r5595, 5; 
- add.s32 %r5597, %r5596, %r5588; - and.b32 %r5598, %r5597, %r5579; - not.b32 %r5599, %r5579; - and.b32 %r5600, %r5588, %r5599; - or.b32 %r5601, %r5598, %r5600; - add.s32 %r5602, %r5500, %r5570; - add.s32 %r5603, %r5602, %r5601; - add.s32 %r5604, %r5603, 38016083; - shf.l.wrap.b32 %r5605, %r5604, %r5604, 9; - add.s32 %r5606, %r5605, %r5597; - and.b32 %r5607, %r5606, %r5588; - not.b32 %r5608, %r5588; - and.b32 %r5609, %r5597, %r5608; - or.b32 %r5610, %r5607, %r5609; - add.s32 %r5611, %r5395, %r5579; - add.s32 %r5612, %r5611, %r5610; - add.s32 %r5613, %r5612, -660478335; - shf.l.wrap.b32 %r5614, %r5613, %r5613, 14; - add.s32 %r5615, %r5614, %r5606; - and.b32 %r5616, %r5615, %r5597; - not.b32 %r5617, %r5597; - and.b32 %r5618, %r5606, %r5617; - or.b32 %r5619, %r5616, %r5618; - add.s32 %r5620, %r5440, %r5588; - add.s32 %r5621, %r5620, %r5619; - add.s32 %r5622, %r5621, -405537848; - shf.l.wrap.b32 %r5623, %r5622, %r5622, 20; - add.s32 %r5624, %r5623, %r5615; - and.b32 %r5625, %r5624, %r5606; - not.b32 %r5626, %r5606; - and.b32 %r5627, %r5615, %r5626; - or.b32 %r5628, %r5625, %r5627; - add.s32 %r5629, %r5490, %r5597; - add.s32 %r5630, %r5629, %r5628; - add.s32 %r5631, %r5630, 568446438; - shf.l.wrap.b32 %r5632, %r5631, %r5631, 5; - add.s32 %r5633, %r5632, %r5624; - and.b32 %r5634, %r5633, %r5615; - not.b32 %r5635, %r5615; - and.b32 %r5636, %r5624, %r5635; - or.b32 %r5637, %r5634, %r5636; - add.s32 %r5638, %r5536, %r5606; - add.s32 %r5639, %r5638, %r5637; - add.s32 %r5640, %r5639, -1019803690; - shf.l.wrap.b32 %r5641, %r5640, %r5640, 9; - add.s32 %r5642, %r5641, %r5633; - and.b32 %r5643, %r5642, %r5624; - not.b32 %r5644, %r5624; - and.b32 %r5645, %r5633, %r5644; - or.b32 %r5646, %r5643, %r5645; - add.s32 %r5647, %r5430, %r5615; - add.s32 %r5648, %r5647, %r5646; - add.s32 %r5649, %r5648, -187363961; - shf.l.wrap.b32 %r5650, %r5649, %r5649, 14; - add.s32 %r5651, %r5650, %r5642; - and.b32 %r5652, %r5651, %r5633; - not.b32 %r5653, %r5633; - and.b32 %r5654, %r5642, %r5653; - 
or.b32 %r5655, %r5652, %r5654; - add.s32 %r5656, %r5480, %r5624; - add.s32 %r5657, %r5656, %r5655; - add.s32 %r5658, %r5657, 1163531501; - shf.l.wrap.b32 %r5659, %r5658, %r5658, 20; - add.s32 %r5660, %r5659, %r5651; - and.b32 %r5661, %r5660, %r5642; - not.b32 %r5662, %r5642; - and.b32 %r5663, %r5651, %r5662; - or.b32 %r5664, %r5661, %r5663; - add.s32 %r5665, %r5530, %r5633; - add.s32 %r5666, %r5665, %r5664; - add.s32 %r5667, %r5666, -1444681467; - shf.l.wrap.b32 %r5668, %r5667, %r5667, 5; - add.s32 %r5669, %r5668, %r5660; - and.b32 %r5670, %r5669, %r5651; - not.b32 %r5671, %r5651; - and.b32 %r5672, %r5660, %r5671; - or.b32 %r5673, %r5670, %r5672; - add.s32 %r5674, %r5420, %r5642; - add.s32 %r5675, %r5674, %r5673; - add.s32 %r5676, %r5675, -51403784; - shf.l.wrap.b32 %r5677, %r5676, %r5676, 9; - add.s32 %r5678, %r5677, %r5669; - and.b32 %r5679, %r5678, %r5660; - not.b32 %r5680, %r5660; - and.b32 %r5681, %r5669, %r5680; - or.b32 %r5682, %r5679, %r5681; - add.s32 %r5683, %r5470, %r5651; - add.s32 %r5684, %r5683, %r5682; - add.s32 %r5685, %r5684, 1735328473; - shf.l.wrap.b32 %r5686, %r5685, %r5685, 14; - add.s32 %r5687, %r5686, %r5678; - and.b32 %r5688, %r5687, %r5669; - not.b32 %r5689, %r5669; - and.b32 %r5690, %r5678, %r5689; - or.b32 %r5691, %r5688, %r5690; - add.s32 %r5692, %r5520, %r5660; - add.s32 %r5693, %r5692, %r5691; - add.s32 %r5694, %r5693, -1926607734; - shf.l.wrap.b32 %r5695, %r5694, %r5694, 20; - add.s32 %r5696, %r5695, %r5687; - xor.b32 %r5697, %r5696, %r5687; - xor.b32 %r5698, %r5697, %r5678; - add.s32 %r5699, %r5450, %r5669; - add.s32 %r5700, %r5699, %r5698; - add.s32 %r5701, %r5700, -378558; - shf.l.wrap.b32 %r5702, %r5701, %r5701, 4; - add.s32 %r5703, %r5702, %r5696; - xor.b32 %r5704, %r5703, %r5697; - add.s32 %r5705, %r5480, %r5678; - add.s32 %r5706, %r5705, %r5704; - add.s32 %r5707, %r5706, -2022574463; - shf.l.wrap.b32 %r5708, %r5707, %r5707, 11; - add.s32 %r5709, %r5708, %r5703; - xor.b32 %r5710, %r5709, %r5703; - xor.b32 %r5711, %r5710, %r5696; 
- add.s32 %r5712, %r5510, %r5687; - add.s32 %r5713, %r5712, %r5711; - add.s32 %r5714, %r5713, 1839030562; - shf.l.wrap.b32 %r5715, %r5714, %r5714, 16; - add.s32 %r5716, %r5715, %r5709; - xor.b32 %r5717, %r5716, %r5710; - add.s32 %r5718, %r5536, %r5696; - add.s32 %r5719, %r5718, %r5717; - add.s32 %r5720, %r5719, -35309556; - shf.l.wrap.b32 %r5721, %r5720, %r5720, 23; - add.s32 %r5722, %r5721, %r5716; - xor.b32 %r5723, %r5716, %r5709; - xor.b32 %r5724, %r5723, %r5722; - add.s32 %r5725, %r5410, %r5703; - add.s32 %r5726, %r5725, %r5724; - add.s32 %r5727, %r5726, -1530992060; - shf.l.wrap.b32 %r5728, %r5727, %r5727, 4; - add.s32 %r5729, %r5728, %r5722; - xor.b32 %r5730, %r5722, %r5716; - xor.b32 %r5731, %r5730, %r5729; - add.s32 %r5732, %r5440, %r5709; - add.s32 %r5733, %r5732, %r5731; - add.s32 %r5734, %r5733, 1272893353; - shf.l.wrap.b32 %r5735, %r5734, %r5734, 11; - add.s32 %r5736, %r5735, %r5729; - xor.b32 %r5737, %r5729, %r5722; - xor.b32 %r5738, %r5737, %r5736; - add.s32 %r5739, %r5470, %r5716; - add.s32 %r5740, %r5739, %r5738; - add.s32 %r5741, %r5740, -155497632; - shf.l.wrap.b32 %r5742, %r5741, %r5741, 16; - add.s32 %r5743, %r5742, %r5736; - xor.b32 %r5744, %r5736, %r5729; - xor.b32 %r5745, %r5744, %r5743; - add.s32 %r5746, %r5500, %r5722; - add.s32 %r5747, %r5746, %r5745; - add.s32 %r5748, %r5747, -1094730640; - shf.l.wrap.b32 %r5749, %r5748, %r5748, 23; - add.s32 %r5750, %r5749, %r5743; - xor.b32 %r5751, %r5743, %r5736; - xor.b32 %r5752, %r5751, %r5750; - add.s32 %r5753, %r5530, %r5729; - add.s32 %r5754, %r5753, %r5752; - add.s32 %r5755, %r5754, 681279174; - shf.l.wrap.b32 %r5756, %r5755, %r5755, 4; - add.s32 %r5757, %r5756, %r5750; - xor.b32 %r5758, %r5750, %r5743; - xor.b32 %r5759, %r5758, %r5757; - add.s32 %r5760, %r5401, %r5736; - add.s32 %r5761, %r5760, %r5759; - add.s32 %r5762, %r5761, -358537222; - shf.l.wrap.b32 %r5763, %r5762, %r5762, 11; - add.s32 %r5764, %r5763, %r5757; - xor.b32 %r5765, %r5757, %r5750; - xor.b32 %r5766, %r5765, %r5764; - add.s32 
%r5767, %r5430, %r5743; - add.s32 %r5768, %r5767, %r5766; - add.s32 %r5769, %r5768, -722521979; - shf.l.wrap.b32 %r5770, %r5769, %r5769, 16; - add.s32 %r5771, %r5770, %r5764; - xor.b32 %r5772, %r5764, %r5757; - xor.b32 %r5773, %r5772, %r5771; - add.s32 %r5774, %r5460, %r5750; - add.s32 %r5775, %r5774, %r5773; - add.s32 %r5776, %r5775, 76029189; - shf.l.wrap.b32 %r5777, %r5776, %r5776, 23; - add.s32 %r5778, %r5777, %r5771; - xor.b32 %r5779, %r5771, %r5764; - xor.b32 %r5780, %r5779, %r5778; - add.s32 %r5781, %r5490, %r5757; - add.s32 %r5782, %r5781, %r5780; - add.s32 %r5783, %r5782, -640364487; - shf.l.wrap.b32 %r5784, %r5783, %r5783, 4; - add.s32 %r5785, %r5784, %r5778; - xor.b32 %r5786, %r5778, %r5771; - xor.b32 %r5787, %r5786, %r5785; - add.s32 %r5788, %r5520, %r5764; - add.s32 %r5789, %r5788, %r5787; - add.s32 %r5790, %r5789, -421815835; - shf.l.wrap.b32 %r5791, %r5790, %r5790, 11; - add.s32 %r5792, %r5791, %r5785; - xor.b32 %r5793, %r5785, %r5778; - xor.b32 %r5794, %r5793, %r5792; - add.s32 %r5795, %r5395, %r5771; - add.s32 %r5796, %r5795, %r5794; - add.s32 %r5797, %r5796, 530742520; - shf.l.wrap.b32 %r5798, %r5797, %r5797, 16; - add.s32 %r5799, %r5798, %r5792; - xor.b32 %r5800, %r5792, %r5785; - xor.b32 %r5801, %r5800, %r5799; - add.s32 %r5802, %r5420, %r5778; - add.s32 %r5803, %r5802, %r5801; - add.s32 %r5804, %r5803, -995338651; - shf.l.wrap.b32 %r5805, %r5804, %r5804, 23; - add.s32 %r5806, %r5805, %r5799; - not.b32 %r5807, %r5792; - or.b32 %r5808, %r5806, %r5807; - xor.b32 %r5809, %r5808, %r5799; - add.s32 %r5810, %r5401, %r5785; - add.s32 %r5811, %r5810, %r5809; - add.s32 %r5812, %r5811, -198630844; - shf.l.wrap.b32 %r5813, %r5812, %r5812, 6; - add.s32 %r5814, %r5813, %r5806; - not.b32 %r5815, %r5799; - or.b32 %r5816, %r5814, %r5815; - xor.b32 %r5817, %r5816, %r5806; - add.s32 %r5818, %r5470, %r5792; - add.s32 %r5819, %r5818, %r5817; - add.s32 %r5820, %r5819, 1126891415; - shf.l.wrap.b32 %r5821, %r5820, %r5820, 10; - add.s32 %r5822, %r5821, %r5814; - 
not.b32 %r5823, %r5806; - or.b32 %r5824, %r5822, %r5823; - xor.b32 %r5825, %r5824, %r5814; - add.s32 %r5826, %r5536, %r5799; - add.s32 %r5827, %r5826, %r5825; - add.s32 %r5828, %r5827, -1416354905; - shf.l.wrap.b32 %r5829, %r5828, %r5828, 15; - add.s32 %r5830, %r5829, %r5822; - not.b32 %r5831, %r5814; - or.b32 %r5832, %r5830, %r5831; - xor.b32 %r5833, %r5832, %r5822; - add.s32 %r5834, %r5450, %r5806; - add.s32 %r5835, %r5834, %r5833; - add.s32 %r5836, %r5835, -57434055; - shf.l.wrap.b32 %r5837, %r5836, %r5836, 21; - add.s32 %r5838, %r5837, %r5830; - not.b32 %r5839, %r5822; - or.b32 %r5840, %r5838, %r5839; - xor.b32 %r5841, %r5840, %r5830; - add.s32 %r5842, %r5520, %r5814; - add.s32 %r5843, %r5842, %r5841; - add.s32 %r5844, %r5843, 1700485571; - shf.l.wrap.b32 %r5845, %r5844, %r5844, 6; - add.s32 %r5846, %r5845, %r5838; - not.b32 %r5847, %r5830; - or.b32 %r5848, %r5846, %r5847; - xor.b32 %r5849, %r5848, %r5838; - add.s32 %r5850, %r5430, %r5822; - add.s32 %r5851, %r5850, %r5849; - add.s32 %r5852, %r5851, -1894986606; - shf.l.wrap.b32 %r5853, %r5852, %r5852, 10; - add.s32 %r5854, %r5853, %r5846; - not.b32 %r5855, %r5838; - or.b32 %r5856, %r5854, %r5855; - xor.b32 %r5857, %r5856, %r5846; - add.s32 %r5858, %r5500, %r5830; - add.s32 %r5859, %r5858, %r5857; - add.s32 %r5860, %r5859, -1051523; - shf.l.wrap.b32 %r5861, %r5860, %r5860, 15; - add.s32 %r5862, %r5861, %r5854; - not.b32 %r5863, %r5846; - or.b32 %r5864, %r5862, %r5863; - xor.b32 %r5865, %r5864, %r5854; - add.s32 %r5866, %r5410, %r5838; - add.s32 %r5867, %r5866, %r5865; - add.s32 %r5868, %r5867, -2054922799; - shf.l.wrap.b32 %r5869, %r5868, %r5868, 21; - add.s32 %r5870, %r5869, %r5862; - not.b32 %r5871, %r5854; - or.b32 %r5872, %r5870, %r5871; - xor.b32 %r5873, %r5872, %r5862; - add.s32 %r5874, %r5480, %r5846; - add.s32 %r5875, %r5874, %r5873; - add.s32 %r5876, %r5875, 1873313359; - shf.l.wrap.b32 %r5877, %r5876, %r5876, 6; - add.s32 %r5878, %r5877, %r5870; - not.b32 %r5879, %r5862; - or.b32 %r5880, %r5878, 
%r5879; - xor.b32 %r5881, %r5880, %r5870; - add.s32 %r5882, %r5395, %r5854; - add.s32 %r5883, %r5882, %r5881; - add.s32 %r5884, %r5883, -30611744; - shf.l.wrap.b32 %r5885, %r5884, %r5884, 10; - add.s32 %r5886, %r5885, %r5878; - not.b32 %r5887, %r5870; - or.b32 %r5888, %r5886, %r5887; - xor.b32 %r5889, %r5888, %r5878; - add.s32 %r5890, %r5460, %r5862; - add.s32 %r5891, %r5890, %r5889; - add.s32 %r5892, %r5891, -1560198380; - shf.l.wrap.b32 %r5893, %r5892, %r5892, 15; - add.s32 %r5894, %r5893, %r5886; - not.b32 %r5895, %r5878; - or.b32 %r5896, %r5894, %r5895; - xor.b32 %r5897, %r5896, %r5886; - add.s32 %r5898, %r5530, %r5870; - add.s32 %r5899, %r5898, %r5897; - add.s32 %r5900, %r5899, 1309151649; - shf.l.wrap.b32 %r5901, %r5900, %r5900, 21; - add.s32 %r5902, %r5901, %r5894; - not.b32 %r5903, %r5886; - or.b32 %r5904, %r5902, %r5903; - xor.b32 %r5905, %r5904, %r5894; - add.s32 %r5906, %r5440, %r5878; - add.s32 %r5907, %r5906, %r5905; - add.s32 %r5908, %r5907, -145523070; - shf.l.wrap.b32 %r5909, %r5908, %r5908, 6; - add.s32 %r5910, %r5909, %r5902; - not.b32 %r5911, %r5894; - or.b32 %r5912, %r5910, %r5911; - xor.b32 %r5913, %r5912, %r5902; - add.s32 %r5914, %r5510, %r5886; - add.s32 %r5915, %r5914, %r5913; - add.s32 %r5916, %r5915, -1120210379; - shf.l.wrap.b32 %r5917, %r5916, %r5916, 10; - add.s32 %r5918, %r5917, %r5910; - not.b32 %r5919, %r5902; - or.b32 %r5920, %r5918, %r5919; - xor.b32 %r5921, %r5920, %r5910; - add.s32 %r5922, %r5420, %r5894; - add.s32 %r5923, %r5922, %r5921; - add.s32 %r5924, %r5923, 718787259; - shf.l.wrap.b32 %r5925, %r5924, %r5924, 15; - add.s32 %r5926, %r5925, %r5918; - not.b32 %r5927, %r5910; - or.b32 %r5928, %r5926, %r5927; - xor.b32 %r5929, %r5928, %r5918; - add.s32 %r5930, %r5490, %r5902; - add.s32 %r5931, %r5930, %r5929; - add.s32 %r5932, %r5931, -343485551; - shf.l.wrap.b32 %r5933, %r5932, %r5932, 21; - add.s32 %r9108, %r5910, %r9108; - add.s32 %r5934, %r5926, %r9107; - add.s32 %r9107, %r5934, %r5933; - add.s32 %r9106, %r5926, %r9106; - 
add.s32 %r9105, %r5918, %r9105; - setp.eq.s64 %p257, %rd4258, %rd854; - add.s64 %rd4259, %rd4259, 64; - @%p257 bra $L__BB1_397; - bra.uni $L__BB1_341; - -$L__BB1_397: - mov.u16 %rs4343, 0; - ld.param.u64 %rd4024, [_ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E_param_0]; - cvta.to.local.u64 %rd4023, %rd4024; - shr.u32 %r7083, %r9108, 8; - shr.u32 %r7084, %r9108, 16; - shr.u32 %r7085, %r9108, 24; - shr.u32 %r7086, %r9107, 8; - shr.u32 %r7087, %r9107, 16; - shr.u32 %r7088, %r9107, 24; - shr.u32 %r7089, %r9106, 8; - shr.u32 %r7090, %r9106, 16; - shr.u32 %r7091, %r9106, 24; - shr.u32 %r7092, %r9105, 8; - shr.u32 %r7093, %r9105, 16; - shr.u32 %r7094, %r9105, 24; - mov.u16 %rs3786, 16; - st.local.u16 [%rd4023], %rs3786; - cvt.u16.u32 %rs3787, %r9108; - cvt.u16.u32 %rs3788, %r7083; - st.local.v2.u8 [%rd4023+2], {%rs3787, %rs3788}; - cvt.u16.u32 %rs3789, %r7085; - cvt.u16.u32 %rs3790, %r7084; - st.local.v2.u8 [%rd4023+4], {%rs3790, %rs3789}; - cvt.u16.u32 %rs3791, %r9107; - cvt.u16.u32 %rs3792, %r7086; - st.local.v2.u8 [%rd4023+6], {%rs3791, %rs3792}; - cvt.u16.u32 %rs3793, %r7088; - cvt.u16.u32 %rs3794, %r7087; - st.local.v2.u8 [%rd4023+8], {%rs3794, %rs3793}; - cvt.u16.u32 %rs3795, %r9106; - cvt.u16.u32 %rs3796, %r7089; - st.local.v2.u8 [%rd4023+10], {%rs3795, %rs3796}; - cvt.u16.u32 %rs3797, %r7091; - cvt.u16.u32 %rs3798, %r7090; - st.local.v2.u8 [%rd4023+12], {%rs3798, %rs3797}; - cvt.u16.u32 %rs3799, %r9105; - cvt.u16.u32 %rs3800, %r7092; - st.local.v2.u8 [%rd4023+14], {%rs3799, %rs3800}; - cvt.u16.u32 %rs3801, %r7094; - cvt.u16.u32 %rs3802, %r7093; - st.local.v2.u8 [%rd4023+16], {%rs3802, %rs3801}; - st.local.v2.u8 [%rd4023+18], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+20], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+22], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+24], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+26], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+28], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+30], {%rs4343, %rs4343}; - 
st.local.v2.u8 [%rd4023+32], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+34], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+36], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+38], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+40], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+42], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+44], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+46], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+48], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+50], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+52], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+54], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+56], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+58], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+60], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+62], {%rs4343, %rs4343}; - st.local.v2.u8 [%rd4023+64], {%rs4343, %rs4343}; - bra.uni $L__BB1_549; - -$L__BB1_224: - st.local.u64 [%rd1+96], %rd706; - mov.u64 %rd2220, 1; - { // callseq 24, 0 - .reg .b32 temp_param_reg; - .param .b64 param0; - st.param.b64 [param0+0], %rd722; - .param .b64 param1; - st.param.b64 [param1+0], %rd721; - .param .b64 param2; - st.param.b64 [param2+0], %rd2220; - call.uni - _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE, - ( - param0, - param1, - param2 - ); - } // callseq 24 - -$L__BB1_226: - st.local.u8 [%rd1+104], %rs2623; - ld.local.u32 %r663, [%rd1+8]; - shr.u32 %r664, %r663, 24; - shr.u32 %r665, %r663, 8; - and.b32 %r666, %r665, 65280; - or.b32 %r667, %r666, %r664; - shl.b32 %r668, %r663, 24; - shl.b32 %r669, %r663, 8; - and.b32 %r670, %r669, 16711680; - or.b32 %r671, %r668, %r670; - or.b32 %r672, %r671, %r667; - shr.u32 %r673, %r672, 8; - shr.u32 %r674, %r671, 16; - ld.local.u32 %r675, [%rd1+12]; - shr.u32 %r676, %r675, 24; - shr.u32 %r677, %r675, 8; - and.b32 %r678, %r677, 65280; - or.b32 %r679, %r678, %r676; - shl.b32 %r680, %r675, 24; - shl.b32 %r681, %r675, 8; - and.b32 %r682, %r681, 16711680; - or.b32 %r683, %r680, %r682; - or.b32 %r684, %r683, 
%r679; - shr.u32 %r685, %r684, 8; - shr.u32 %r686, %r683, 16; - ld.local.u32 %r687, [%rd1+16]; - shr.u32 %r688, %r687, 24; - shr.u32 %r689, %r687, 8; - and.b32 %r690, %r689, 65280; - or.b32 %r691, %r690, %r688; - shl.b32 %r692, %r687, 24; - shl.b32 %r693, %r687, 8; - and.b32 %r694, %r693, 16711680; - or.b32 %r695, %r692, %r694; - or.b32 %r696, %r695, %r691; - shr.u32 %r697, %r696, 8; - shr.u32 %r698, %r695, 16; - ld.local.u32 %r699, [%rd1+20]; - shr.u32 %r700, %r699, 24; - shr.u32 %r701, %r699, 8; - and.b32 %r702, %r701, 65280; - or.b32 %r703, %r702, %r700; - shl.b32 %r704, %r699, 24; - shl.b32 %r705, %r699, 8; - and.b32 %r706, %r705, 16711680; - or.b32 %r707, %r704, %r706; - or.b32 %r708, %r707, %r703; - shr.u32 %r709, %r708, 8; - shr.u32 %r710, %r707, 16; - ld.local.u32 %r711, [%rd1+24]; - shr.u32 %r712, %r711, 24; - shr.u32 %r713, %r711, 8; - and.b32 %r714, %r713, 65280; - or.b32 %r715, %r714, %r712; - shl.b32 %r716, %r711, 24; - shl.b32 %r717, %r711, 8; - and.b32 %r718, %r717, 16711680; - or.b32 %r719, %r716, %r718; - or.b32 %r720, %r719, %r715; - shr.u32 %r721, %r720, 8; - shr.u32 %r722, %r719, 16; - ld.local.u32 %r723, [%rd1+28]; - shr.u32 %r724, %r723, 24; - shr.u32 %r725, %r723, 8; - and.b32 %r726, %r725, 65280; - or.b32 %r727, %r726, %r724; - shl.b32 %r728, %r723, 24; - shl.b32 %r729, %r723, 8; - and.b32 %r730, %r729, 16711680; - or.b32 %r731, %r728, %r730; - or.b32 %r732, %r731, %r727; - shr.u32 %r733, %r732, 8; - shr.u32 %r734, %r731, 16; - ld.local.u32 %r735, [%rd1+32]; - shr.u32 %r736, %r735, 24; - shr.u32 %r737, %r735, 8; - and.b32 %r738, %r737, 65280; - or.b32 %r739, %r738, %r736; - shl.b32 %r740, %r735, 24; - shl.b32 %r741, %r735, 8; - and.b32 %r742, %r741, 16711680; - or.b32 %r743, %r740, %r742; - or.b32 %r744, %r743, %r739; - shr.u32 %r745, %r744, 8; - shr.u32 %r746, %r743, 16; - ld.local.u32 %r747, [%rd1+36]; - shr.u32 %r748, %r747, 24; - shr.u32 %r749, %r747, 8; - and.b32 %r750, %r749, 65280; - or.b32 %r751, %r750, %r748; - shl.b32 %r752, %r747, 
24; - shl.b32 %r753, %r747, 8; - and.b32 %r754, %r753, 16711680; - or.b32 %r755, %r752, %r754; - or.b32 %r756, %r755, %r751; - shr.u32 %r757, %r756, 8; - shr.u32 %r758, %r755, 16; - mov.u16 %rs2705, 32; - st.local.u16 [%rd12], %rs2705; - cvt.u16.u32 %rs2706, %r673; - cvt.u16.u32 %rs2707, %r664; - cvt.u16.u32 %rs2708, %r665; - and.b16 %rs2709, %rs2708, -256; - or.b16 %rs2710, %rs2709, %rs2707; - st.local.v2.u8 [%rd12+2], {%rs2710, %rs2706}; - cvt.u16.u32 %rs2711, %r674; - cvt.u16.u32 %rs2712, %r663; - and.b16 %rs2713, %rs2712, 255; - st.local.v2.u8 [%rd12+4], {%rs2711, %rs2713}; - cvt.u16.u32 %rs2714, %r685; - cvt.u16.u32 %rs2715, %r676; - cvt.u16.u32 %rs2716, %r677; - and.b16 %rs2717, %rs2716, -256; - or.b16 %rs2718, %rs2717, %rs2715; - st.local.v2.u8 [%rd12+6], {%rs2718, %rs2714}; - cvt.u16.u32 %rs2719, %r686; - cvt.u16.u32 %rs2720, %r675; - and.b16 %rs2721, %rs2720, 255; - st.local.v2.u8 [%rd12+8], {%rs2719, %rs2721}; - cvt.u16.u32 %rs2722, %r697; - cvt.u16.u32 %rs2723, %r688; - cvt.u16.u32 %rs2724, %r689; - and.b16 %rs2725, %rs2724, -256; - or.b16 %rs2726, %rs2725, %rs2723; - st.local.v2.u8 [%rd12+10], {%rs2726, %rs2722}; - cvt.u16.u32 %rs2727, %r698; - cvt.u16.u32 %rs2728, %r687; - and.b16 %rs2729, %rs2728, 255; - st.local.v2.u8 [%rd12+12], {%rs2727, %rs2729}; - cvt.u16.u32 %rs2730, %r709; - cvt.u16.u32 %rs2731, %r700; - cvt.u16.u32 %rs2732, %r701; - and.b16 %rs2733, %rs2732, -256; - or.b16 %rs2734, %rs2733, %rs2731; - st.local.v2.u8 [%rd12+14], {%rs2734, %rs2730}; - cvt.u16.u32 %rs2735, %r710; - cvt.u16.u32 %rs2736, %r699; - and.b16 %rs2737, %rs2736, 255; - st.local.v2.u8 [%rd12+16], {%rs2735, %rs2737}; - cvt.u16.u32 %rs2738, %r721; - cvt.u16.u32 %rs2739, %r712; - cvt.u16.u32 %rs2740, %r713; - and.b16 %rs2741, %rs2740, -256; - or.b16 %rs2742, %rs2741, %rs2739; - st.local.v2.u8 [%rd12+18], {%rs2742, %rs2738}; - cvt.u16.u32 %rs2743, %r722; - cvt.u16.u32 %rs2744, %r711; - and.b16 %rs2745, %rs2744, 255; - st.local.v2.u8 [%rd12+20], {%rs2743, %rs2745}; - 
cvt.u16.u32 %rs2746, %r733; - cvt.u16.u32 %rs2747, %r724; - cvt.u16.u32 %rs2748, %r725; - and.b16 %rs2749, %rs2748, -256; - or.b16 %rs2750, %rs2749, %rs2747; - st.local.v2.u8 [%rd12+22], {%rs2750, %rs2746}; - cvt.u16.u32 %rs2751, %r734; - cvt.u16.u32 %rs2752, %r723; - and.b16 %rs2753, %rs2752, 255; - st.local.v2.u8 [%rd12+24], {%rs2751, %rs2753}; - cvt.u16.u32 %rs2754, %r745; - cvt.u16.u32 %rs2755, %r736; - cvt.u16.u32 %rs2756, %r737; - and.b16 %rs2757, %rs2756, -256; - or.b16 %rs2758, %rs2757, %rs2755; - st.local.v2.u8 [%rd12+26], {%rs2758, %rs2754}; - cvt.u16.u32 %rs2759, %r746; - cvt.u16.u32 %rs2760, %r735; - and.b16 %rs2761, %rs2760, 255; - st.local.v2.u8 [%rd12+28], {%rs2759, %rs2761}; - cvt.u16.u32 %rs2762, %r757; - cvt.u16.u32 %rs2763, %r748; - cvt.u16.u32 %rs2764, %r749; - and.b16 %rs2765, %rs2764, -256; - or.b16 %rs2766, %rs2765, %rs2763; - st.local.v2.u8 [%rd12+30], {%rs2766, %rs2762}; - cvt.u16.u32 %rs2767, %r758; - cvt.u16.u32 %rs2768, %r747; - and.b16 %rs2769, %rs2768, 255; - st.local.v2.u8 [%rd12+32], {%rs2767, %rs2769}; - st.local.v2.u8 [%rd12+34], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+36], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+38], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+40], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+42], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+44], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+46], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+48], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+50], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+52], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+54], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+56], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+58], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+60], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+62], {%rs2623, %rs2623}; - st.local.v2.u8 [%rd12+64], {%rs2623, %rs2623}; - bra.uni $L__BB1_549; - -$L__BB1_268: - st.local.u64 [%rd1+88], %rd792; - mov.pred %p178, 0; - mov.pred %p193, -1; - mov.u64 %rd4244, %rd4243; - -$L__BB1_269: - 
ld.local.u32 %rd2300, [%rd4244]; - shl.b64 %rd2301, %rd2300, 8; - mov.b64 {%r877, %r878}, %rd2301; - mov.b32 {%rs548, %rs2988}, %r878; - mov.b32 {%rs544, %rs546}, %r877; - shr.u16 %rs547, %rs546, 8; - shr.u16 %rs545, %rs544, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2302, [%rd4244+4]; - shl.b64 %rd2303, %rd2302, 8; - mov.b64 {%r879, %r880}, %rd2303; - mov.b32 {%rs553, %rs2989}, %r880; - mov.b32 {%rs549, %rs551}, %r879; - shr.u16 %rs552, %rs551, 8; - shr.u16 %rs550, %rs549, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2304, [%rd4244+8]; - shl.b64 %rd2305, %rd2304, 8; - mov.b64 {%r881, %r882}, %rd2305; - mov.b32 {%rs558, %rs2990}, %r882; - mov.b32 {%rs554, %rs556}, %r881; - shr.u16 %rs557, %rs556, 8; - shr.u16 %rs555, %rs554, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2306, [%rd4244+12]; - shl.b64 %rd2307, %rd2306, 8; - mov.b64 {%r883, %r884}, %rd2307; - mov.b32 {%rs563, %rs2991}, %r884; - mov.b32 {%rs559, %rs561}, %r883; - shr.u16 %rs562, %rs561, 8; - shr.u16 %rs560, %rs559, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2308, [%rd4244+16]; - shl.b64 %rd2309, %rd2308, 8; - mov.b64 {%r885, %r886}, %rd2309; - mov.b32 {%rs568, %rs2992}, %r886; - mov.b32 {%rs564, %rs566}, %r885; - shr.u16 %rs567, %rs566, 8; - shr.u16 %rs565, %rs564, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2310, [%rd4244+20]; - shl.b64 %rd2311, %rd2310, 8; - mov.b64 {%r887, %r888}, %rd2311; - mov.b32 {%rs573, %rs2993}, %r888; - mov.b32 {%rs569, %rs571}, %r887; - shr.u16 %rs572, %rs571, 8; - shr.u16 %rs570, %rs569, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2312, [%rd4244+24]; - shl.b64 %rd2313, %rd2312, 8; - mov.b64 {%r889, %r890}, %rd2313; - mov.b32 {%rs578, %rs2994}, %r890; - mov.b32 {%rs574, %rs576}, %r889; - shr.u16 %rs577, %rs576, 8; - shr.u16 %rs575, %rs574, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2314, [%rd4244+28]; - shl.b64 %rd2315, %rd2314, 8; - mov.b64 {%r891, %r892}, %rd2315; - mov.b32 {%rs583, %rs2995}, %r892; - mov.b32 {%rs579, %rs581}, %r891; - 
shr.u16 %rs582, %rs581, 8; - shr.u16 %rs580, %rs579, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2316, [%rd4244+32]; - shl.b64 %rd2317, %rd2316, 8; - mov.b64 {%r893, %r894}, %rd2317; - mov.b32 {%rs588, %rs2996}, %r894; - mov.b32 {%rs584, %rs586}, %r893; - shr.u16 %rs587, %rs586, 8; - shr.u16 %rs585, %rs584, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2318, [%rd4244+36]; - shl.b64 %rd2319, %rd2318, 8; - mov.b64 {%r895, %r896}, %rd2319; - mov.b32 {%rs593, %rs2997}, %r896; - mov.b32 {%rs589, %rs591}, %r895; - shr.u16 %rs592, %rs591, 8; - shr.u16 %rs590, %rs589, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2320, [%rd4244+40]; - shl.b64 %rd2321, %rd2320, 8; - mov.b64 {%r897, %r898}, %rd2321; - mov.b32 {%rs598, %rs2998}, %r898; - mov.b32 {%rs594, %rs596}, %r897; - shr.u16 %rs597, %rs596, 8; - shr.u16 %rs595, %rs594, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2322, [%rd4244+44]; - shl.b64 %rd2323, %rd2322, 8; - mov.b64 {%r899, %r900}, %rd2323; - mov.b32 {%rs603, %rs2999}, %r900; - mov.b32 {%rs599, %rs601}, %r899; - shr.u16 %rs602, %rs601, 8; - shr.u16 %rs600, %rs599, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2324, [%rd4244+48]; - shl.b64 %rd2325, %rd2324, 8; - mov.b64 {%r901, %r902}, %rd2325; - mov.b32 {%rs608, %rs3000}, %r902; - mov.b32 {%rs604, %rs606}, %r901; - shr.u16 %rs607, %rs606, 8; - shr.u16 %rs605, %rs604, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2326, [%rd4244+52]; - shl.b64 %rd2327, %rd2326, 8; - mov.b64 {%r903, %r904}, %rd2327; - mov.b32 {%rs613, %rs3001}, %r904; - mov.b32 {%rs609, %rs611}, %r903; - shr.u16 %rs612, %rs611, 8; - shr.u16 %rs610, %rs609, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2328, [%rd4244+56]; - shl.b64 %rd2329, %rd2328, 8; - mov.b64 {%r905, %r906}, %rd2329; - mov.b32 {%rs618, %rs3002}, %r906; - mov.b32 {%rs614, %rs616}, %r905; - shr.u16 %rs617, %rs616, 8; - shr.u16 %rs615, %rs614, 8; - @%p178 bra $L__BB1_285; - - ld.local.u32 %rd2330, [%rd4244+60]; - shl.b64 %rd2331, %rd2330, 8; - mov.b64 {%r907, 
%r908}, %rd2331; - mov.b32 {%rs623, %rs3003}, %r908; - mov.b32 {%rs619, %rs621}, %r907; - shr.u16 %rs622, %rs621, 8; - shr.u16 %rs620, %rs619, 8; - @%p193 bra $L__BB1_286; - bra.uni $L__BB1_285; - -$L__BB1_286: - add.s64 %rd4243, %rd4243, 64; - shl.b16 %rs3004, %rs546, 8; - or.b16 %rs3005, %rs545, %rs3004; - shl.b16 %rs3006, %rs548, 8; - or.b16 %rs3007, %rs547, %rs3006; - mov.b32 %r909, {%rs3005, %rs3007}; - shr.u32 %r910, %r909, 24; - shr.u32 %r911, %r909, 8; - and.b32 %r912, %r911, 65280; - or.b32 %r913, %r912, %r910; - shl.b32 %r914, %r909, 24; - shl.b32 %r915, %r909, 8; - and.b32 %r916, %r915, 16711680; - or.b32 %r917, %r914, %r916; - or.b32 %r918, %r917, %r913; - shl.b16 %rs3008, %rs551, 8; - or.b16 %rs3009, %rs550, %rs3008; - shl.b16 %rs3010, %rs553, 8; - or.b16 %rs3011, %rs552, %rs3010; - mov.b32 %r919, {%rs3009, %rs3011}; - shr.u32 %r920, %r919, 24; - shr.u32 %r921, %r919, 8; - and.b32 %r922, %r921, 65280; - or.b32 %r923, %r922, %r920; - shl.b32 %r924, %r919, 24; - shl.b32 %r925, %r919, 8; - and.b32 %r926, %r925, 16711680; - or.b32 %r927, %r924, %r926; - or.b32 %r928, %r927, %r923; - shl.b16 %rs3012, %rs556, 8; - or.b16 %rs3013, %rs555, %rs3012; - shl.b16 %rs3014, %rs558, 8; - or.b16 %rs3015, %rs557, %rs3014; - mov.b32 %r929, {%rs3013, %rs3015}; - shr.u32 %r930, %r929, 24; - shr.u32 %r931, %r929, 8; - and.b32 %r932, %r931, 65280; - or.b32 %r933, %r932, %r930; - shl.b32 %r934, %r929, 24; - shl.b32 %r935, %r929, 8; - and.b32 %r936, %r935, 16711680; - or.b32 %r937, %r934, %r936; - or.b32 %r938, %r937, %r933; - xor.b16 %rs3016, %rs555, %rs545; - xor.b16 %rs3017, %rs556, %rs546; - shl.b16 %rs3018, %rs3017, 8; - or.b16 %rs3019, %rs3016, %rs3018; - xor.b16 %rs3020, %rs557, %rs547; - xor.b16 %rs3021, %rs558, %rs548; - shl.b16 %rs3022, %rs3021, 8; - or.b16 %rs3023, %rs3020, %rs3022; - mov.b32 %r939, {%rs3019, %rs3023}; - shl.b16 %rs3024, %rs561, 8; - or.b16 %rs3025, %rs560, %rs3024; - shl.b16 %rs3026, %rs563, 8; - or.b16 %rs3027, %rs562, %rs3026; - mov.b32 %r940, 
{%rs3025, %rs3027}; - shr.u32 %r941, %r940, 24; - shr.u32 %r942, %r940, 8; - and.b32 %r943, %r942, 65280; - or.b32 %r944, %r943, %r941; - shl.b32 %r945, %r940, 24; - shl.b32 %r946, %r940, 8; - and.b32 %r947, %r946, 16711680; - or.b32 %r948, %r945, %r947; - or.b32 %r949, %r948, %r944; - xor.b16 %rs3028, %rs560, %rs550; - xor.b16 %rs3029, %rs561, %rs551; - shl.b16 %rs3030, %rs3029, 8; - or.b16 %rs3031, %rs3028, %rs3030; - xor.b16 %rs3032, %rs562, %rs552; - xor.b16 %rs3033, %rs563, %rs553; - shl.b16 %rs3034, %rs3033, 8; - or.b16 %rs3035, %rs3032, %rs3034; - mov.b32 %r950, {%rs3031, %rs3035}; - shl.b16 %rs3036, %rs566, 8; - or.b16 %rs3037, %rs565, %rs3036; - shl.b16 %rs3038, %rs568, 8; - or.b16 %rs3039, %rs567, %rs3038; - mov.b32 %r951, {%rs3037, %rs3039}; - shr.u32 %r952, %r951, 24; - shr.u32 %r953, %r951, 8; - and.b32 %r954, %r953, 65280; - or.b32 %r955, %r954, %r952; - shl.b32 %r956, %r951, 24; - shl.b32 %r957, %r951, 8; - and.b32 %r958, %r957, 16711680; - or.b32 %r959, %r956, %r958; - or.b32 %r960, %r959, %r955; - xor.b16 %rs3040, %rs565, %rs555; - xor.b16 %rs3041, %rs566, %rs556; - shl.b16 %rs3042, %rs3041, 8; - or.b16 %rs3043, %rs3040, %rs3042; - xor.b16 %rs3044, %rs567, %rs557; - xor.b16 %rs3045, %rs568, %rs558; - shl.b16 %rs3046, %rs3045, 8; - or.b16 %rs3047, %rs3044, %rs3046; - mov.b32 %r961, {%rs3043, %rs3047}; - shl.b16 %rs3048, %rs571, 8; - or.b16 %rs3049, %rs570, %rs3048; - shl.b16 %rs3050, %rs573, 8; - or.b16 %rs3051, %rs572, %rs3050; - mov.b32 %r962, {%rs3049, %rs3051}; - shr.u32 %r963, %r962, 24; - shr.u32 %r964, %r962, 8; - and.b32 %r965, %r964, 65280; - or.b32 %r966, %r965, %r963; - shl.b32 %r967, %r962, 24; - shl.b32 %r968, %r962, 8; - and.b32 %r969, %r968, 16711680; - or.b32 %r970, %r967, %r969; - or.b32 %r971, %r970, %r966; - xor.b16 %rs3052, %rs570, %rs560; - xor.b16 %rs3053, %rs571, %rs561; - shl.b16 %rs3054, %rs3053, 8; - or.b16 %rs3055, %rs3052, %rs3054; - xor.b16 %rs3056, %rs572, %rs562; - xor.b16 %rs3057, %rs573, %rs563; - shl.b16 %rs3058, 
%rs3057, 8; - or.b16 %rs3059, %rs3056, %rs3058; - mov.b32 %r972, {%rs3055, %rs3059}; - shl.b16 %rs3060, %rs576, 8; - or.b16 %rs3061, %rs575, %rs3060; - shl.b16 %rs3062, %rs578, 8; - or.b16 %rs3063, %rs577, %rs3062; - mov.b32 %r973, {%rs3061, %rs3063}; - shr.u32 %r974, %r973, 24; - shr.u32 %r975, %r973, 8; - and.b32 %r976, %r975, 65280; - or.b32 %r977, %r976, %r974; - shl.b32 %r978, %r973, 24; - shl.b32 %r979, %r973, 8; - and.b32 %r980, %r979, 16711680; - or.b32 %r981, %r978, %r980; - or.b32 %r982, %r981, %r977; - xor.b16 %rs3064, %rs575, %rs565; - xor.b16 %rs3065, %rs576, %rs566; - shl.b16 %rs3066, %rs3065, 8; - or.b16 %rs3067, %rs3064, %rs3066; - xor.b16 %rs3068, %rs577, %rs567; - xor.b16 %rs3069, %rs578, %rs568; - shl.b16 %rs3070, %rs3069, 8; - or.b16 %rs3071, %rs3068, %rs3070; - mov.b32 %r983, {%rs3067, %rs3071}; - shl.b16 %rs3072, %rs581, 8; - or.b16 %rs3073, %rs580, %rs3072; - shl.b16 %rs3074, %rs583, 8; - or.b16 %rs3075, %rs582, %rs3074; - mov.b32 %r984, {%rs3073, %rs3075}; - shr.u32 %r985, %r984, 24; - shr.u32 %r986, %r984, 8; - and.b32 %r987, %r986, 65280; - or.b32 %r988, %r987, %r985; - shl.b32 %r989, %r984, 24; - shl.b32 %r990, %r984, 8; - and.b32 %r991, %r990, 16711680; - or.b32 %r992, %r989, %r991; - or.b32 %r993, %r992, %r988; - xor.b16 %rs3076, %rs580, %rs570; - xor.b16 %rs3077, %rs581, %rs571; - shl.b16 %rs3078, %rs3077, 8; - or.b16 %rs3079, %rs3076, %rs3078; - xor.b16 %rs3080, %rs582, %rs572; - xor.b16 %rs3081, %rs583, %rs573; - shl.b16 %rs3082, %rs3081, 8; - or.b16 %rs3083, %rs3080, %rs3082; - mov.b32 %r994, {%rs3079, %rs3083}; - shl.b16 %rs3084, %rs616, 8; - or.b16 %rs3085, %rs615, %rs3084; - shl.b16 %rs3086, %rs618, 8; - or.b16 %rs3087, %rs617, %rs3086; - mov.b32 %r995, {%rs3085, %rs3087}; - shr.u32 %r996, %r995, 24; - shr.u32 %r997, %r995, 8; - and.b32 %r998, %r997, 65280; - or.b32 %r999, %r998, %r996; - shl.b32 %r1000, %r995, 24; - shl.b32 %r1001, %r995, 8; - and.b32 %r1002, %r1001, 16711680; - or.b32 %r1003, %r1000, %r1002; - or.b32 %r1004, 
%r1003, %r999; - shl.b16 %rs3088, %rs621, 8; - or.b16 %rs3089, %rs620, %rs3088; - shl.b16 %rs3090, %rs623, 8; - or.b16 %rs3091, %rs622, %rs3090; - mov.b32 %r1005, {%rs3089, %rs3091}; - shr.u32 %r1006, %r1005, 24; - shr.u32 %r1007, %r1005, 8; - and.b32 %r1008, %r1007, 65280; - or.b32 %r1009, %r1008, %r1006; - shl.b32 %r1010, %r1005, 24; - shl.b32 %r1011, %r1005, 8; - and.b32 %r1012, %r1011, 16711680; - or.b32 %r1013, %r1010, %r1012; - or.b32 %r1014, %r1013, %r1009; - xor.b32 %r1015, %r9088, %r9087; - and.b32 %r1016, %r1015, %r9086; - xor.b32 %r1017, %r1016, %r9088; - shf.l.wrap.b32 %r1018, %r9085, %r9085, 5; - add.s32 %r1019, %r1018, %r9089; - add.s32 %r1020, %r1019, %r1017; - add.s32 %r1021, %r1020, %r918; - add.s32 %r1022, %r1021, 1518500249; - shf.l.wrap.b32 %r1023, %r1022, %r1022, 5; - shf.l.wrap.b32 %r1024, %r9086, %r9086, 30; - xor.b32 %r1025, %r1024, %r9087; - and.b32 %r1026, %r1025, %r9085; - xor.b32 %r1027, %r1026, %r9087; - add.s32 %r1028, %r9088, %r1027; - add.s32 %r1029, %r1028, %r928; - add.s32 %r1030, %r1029, %r1023; - add.s32 %r1031, %r1030, 1518500249; - shf.l.wrap.b32 %r1032, %r1031, %r1031, 5; - shf.l.wrap.b32 %r1033, %r9085, %r9085, 30; - xor.b32 %r1034, %r1024, %r1033; - and.b32 %r1035, %r1022, %r1034; - xor.b32 %r1036, %r1035, %r1024; - add.s32 %r1037, %r9087, %r938; - add.s32 %r1038, %r1037, %r1036; - add.s32 %r1039, %r1038, %r1032; - add.s32 %r1040, %r1039, 1518500249; - shf.l.wrap.b32 %r1041, %r1022, %r1022, 30; - shf.l.wrap.b32 %r1042, %r1040, %r1040, 5; - xor.b32 %r1043, %r1041, %r1033; - and.b32 %r1044, %r1031, %r1043; - xor.b32 %r1045, %r1044, %r1033; - add.s32 %r1046, %r1024, %r949; - add.s32 %r1047, %r1046, %r1045; - add.s32 %r1048, %r1047, %r1042; - add.s32 %r1049, %r1048, 1518500249; - shf.l.wrap.b32 %r1050, %r1031, %r1031, 30; - shf.l.wrap.b32 %r1051, %r1049, %r1049, 5; - xor.b32 %r1052, %r1050, %r1041; - and.b32 %r1053, %r1052, %r1040; - xor.b32 %r1054, %r1053, %r1041; - add.s32 %r1055, %r1033, %r960; - add.s32 %r1056, %r1055, 
%r1054; - add.s32 %r1057, %r1056, %r1051; - add.s32 %r1058, %r1057, 1518500249; - shf.l.wrap.b32 %r1059, %r1040, %r1040, 30; - shf.l.wrap.b32 %r1060, %r1058, %r1058, 5; - xor.b32 %r1061, %r1059, %r1050; - and.b32 %r1062, %r1061, %r1049; - xor.b32 %r1063, %r1062, %r1050; - add.s32 %r1064, %r1041, %r971; - add.s32 %r1065, %r1064, %r1063; - add.s32 %r1066, %r1065, %r1060; - add.s32 %r1067, %r1066, 1518500249; - shf.l.wrap.b32 %r1068, %r1049, %r1049, 30; - shf.l.wrap.b32 %r1069, %r1067, %r1067, 5; - xor.b32 %r1070, %r1068, %r1059; - and.b32 %r1071, %r1058, %r1070; - xor.b32 %r1072, %r1071, %r1059; - add.s32 %r1073, %r1050, %r982; - add.s32 %r1074, %r1073, %r1072; - add.s32 %r1075, %r1074, %r1069; - add.s32 %r1076, %r1075, 1518500249; - shf.l.wrap.b32 %r1077, %r1058, %r1058, 30; - shf.l.wrap.b32 %r1078, %r1076, %r1076, 5; - xor.b32 %r1079, %r1077, %r1068; - and.b32 %r1080, %r1067, %r1079; - xor.b32 %r1081, %r1080, %r1068; - add.s32 %r1082, %r1059, %r993; - add.s32 %r1083, %r1082, %r1081; - add.s32 %r1084, %r1083, %r1078; - add.s32 %r1085, %r1084, 1518500249; - shf.l.wrap.b32 %r1086, %r1067, %r1067, 30; - cvt.u64.u32 %rd2332, %r1077; - cvt.u64.u32 %rd2333, %r1086; - cvt.u64.u32 %rd2334, %r1076; - cvt.u64.u32 %rd2335, %r1085; - bfi.b64 %rd2336, %rd2334, %rd2335, 32, 32; - bfi.b64 %rd2337, %rd2332, %rd2333, 32, 32; - mov.b64 {%r1087, %r1088}, %rd2336; - mov.b64 {%r1089, %r1090}, %rd2337; - shl.b16 %rs3092, %rs601, 8; - or.b16 %rs3093, %rs600, %rs3092; - shl.b16 %rs3094, %rs603, 8; - or.b16 %rs3095, %rs602, %rs3094; - mov.b32 %r1091, {%rs3093, %rs3095}; - shr.u32 %r1092, %r1091, 24; - shr.u32 %r1093, %r1091, 8; - and.b32 %r1094, %r1093, 65280; - or.b32 %r1095, %r1094, %r1092; - shl.b32 %r1096, %r1091, 24; - shl.b32 %r1097, %r1091, 8; - and.b32 %r1098, %r1097, 16711680; - or.b32 %r1099, %r1096, %r1098; - or.b32 %r1100, %r1099, %r1095; - cvt.u64.u32 %rd2338, %r1100; - shl.b16 %rs3096, %rs596, 8; - or.b16 %rs3097, %rs595, %rs3096; - shl.b16 %rs3098, %rs598, 8; - or.b16 
%rs3099, %rs597, %rs3098; - mov.b32 %r1101, {%rs3097, %rs3099}; - shr.u32 %r1102, %r1101, 24; - shr.u32 %r1103, %r1101, 8; - and.b32 %r1104, %r1103, 65280; - or.b32 %r1105, %r1104, %r1102; - shl.b32 %r1106, %r1101, 24; - shl.b32 %r1107, %r1101, 8; - and.b32 %r1108, %r1107, 16711680; - or.b32 %r1109, %r1106, %r1108; - or.b32 %r1110, %r1109, %r1105; - shl.b16 %rs3100, %rs591, 8; - or.b16 %rs3101, %rs590, %rs3100; - shl.b16 %rs3102, %rs593, 8; - or.b16 %rs3103, %rs592, %rs3102; - mov.b32 %r1111, {%rs3101, %rs3103}; - shr.u32 %r1112, %r1111, 24; - shr.u32 %r1113, %r1111, 8; - and.b32 %r1114, %r1113, 65280; - or.b32 %r1115, %r1114, %r1112; - shl.b32 %r1116, %r1111, 24; - shl.b32 %r1117, %r1111, 8; - and.b32 %r1118, %r1117, 16711680; - or.b32 %r1119, %r1116, %r1118; - or.b32 %r1120, %r1119, %r1115; - cvt.u64.u32 %rd2339, %r1120; - shl.b16 %rs3104, %rs586, 8; - or.b16 %rs3105, %rs585, %rs3104; - shl.b16 %rs3106, %rs588, 8; - or.b16 %rs3107, %rs587, %rs3106; - mov.b32 %r1121, {%rs3105, %rs3107}; - shr.u32 %r1122, %r1121, 24; - shr.u32 %r1123, %r1121, 8; - and.b32 %r1124, %r1123, 65280; - or.b32 %r1125, %r1124, %r1122; - shl.b32 %r1126, %r1121, 24; - shl.b32 %r1127, %r1121, 8; - and.b32 %r1128, %r1127, 16711680; - or.b32 %r1129, %r1126, %r1128; - or.b32 %r1130, %r1129, %r1125; - cvt.u64.u32 %rd2340, %r1130; - cvt.u64.u32 %rd2341, %r1110; - bfi.b64 %rd2342, %rd2338, %rd2341, 32, 32; - bfi.b64 %rd2343, %rd2339, %rd2340, 32, 32; - mov.b64 {%r1131, %r1132}, %rd2343; - mov.b64 {%r1133, %r1134}, %rd2342; - cvt.u64.u32 %rd2344, %r1090; - cvt.u64.u32 %rd2345, %r1088; - cvt.u64.u32 %rd2346, %r1089; - bfi.b64 %rd2347, %rd2345, %rd2335, 32, 32; - bfi.b64 %rd2348, %rd2344, %rd2346, 32, 32; - mov.b64 {%r1135, %r1136}, %rd2347; - mov.b64 {%r1137, %r1138}, %rd2348; - shf.l.wrap.b32 %r1139, %r1135, %r1135, 5; - xor.b32 %r1140, %r1138, %r1137; - and.b32 %r1141, %r1140, %r1136; - xor.b32 %r1142, %r1141, %r1138; - add.s32 %r1143, %r1068, %r1131; - add.s32 %r1144, %r1143, %r1139; - add.s32 
%r1145, %r1144, %r1142; - add.s32 %r1146, %r1145, 1518500249; - shf.l.wrap.b32 %r1147, %r1136, %r1136, 30; - shf.l.wrap.b32 %r1148, %r1146, %r1146, 5; - xor.b32 %r1149, %r1147, %r1137; - and.b32 %r1150, %r1149, %r1135; - xor.b32 %r1151, %r1150, %r1137; - add.s32 %r1152, %r1132, %r1138; - add.s32 %r1153, %r1152, %r1151; - add.s32 %r1154, %r1153, %r1148; - add.s32 %r1155, %r1154, 1518500249; - shf.l.wrap.b32 %r1156, %r1135, %r1135, 30; - shf.l.wrap.b32 %r1157, %r1155, %r1155, 5; - xor.b32 %r1158, %r1147, %r1156; - and.b32 %r1159, %r1146, %r1158; - xor.b32 %r1160, %r1159, %r1147; - add.s32 %r1161, %r1133, %r1137; - add.s32 %r1162, %r1161, %r1160; - add.s32 %r1163, %r1162, %r1157; - add.s32 %r1164, %r1163, 1518500249; - shf.l.wrap.b32 %r1165, %r1146, %r1146, 30; - shf.l.wrap.b32 %r1166, %r1164, %r1164, 5; - xor.b32 %r1167, %r1165, %r1156; - and.b32 %r1168, %r1155, %r1167; - xor.b32 %r1169, %r1168, %r1156; - add.s32 %r1170, %r1134, %r1147; - add.s32 %r1171, %r1170, %r1169; - add.s32 %r1172, %r1171, %r1166; - add.s32 %r1173, %r1172, 1518500249; - shf.l.wrap.b32 %r1174, %r1155, %r1155, 30; - cvt.u64.u32 %rd2349, %r1014; - shl.b16 %rs3108, %rs611, 8; - or.b16 %rs3109, %rs610, %rs3108; - shl.b16 %rs3110, %rs613, 8; - or.b16 %rs3111, %rs612, %rs3110; - mov.b32 %r1175, {%rs3109, %rs3111}; - shr.u32 %r1176, %r1175, 24; - shr.u32 %r1177, %r1175, 8; - and.b32 %r1178, %r1177, 65280; - or.b32 %r1179, %r1178, %r1176; - shl.b32 %r1180, %r1175, 24; - shl.b32 %r1181, %r1175, 8; - and.b32 %r1182, %r1181, 16711680; - or.b32 %r1183, %r1180, %r1182; - or.b32 %r1184, %r1183, %r1179; - cvt.u64.u32 %rd2350, %r1184; - shl.b16 %rs3112, %rs606, 8; - or.b16 %rs3113, %rs605, %rs3112; - shl.b16 %rs3114, %rs608, 8; - or.b16 %rs3115, %rs607, %rs3114; - mov.b32 %r1185, {%rs3113, %rs3115}; - shr.u32 %r1186, %r1185, 24; - shr.u32 %r1187, %r1185, 8; - and.b32 %r1188, %r1187, 65280; - or.b32 %r1189, %r1188, %r1186; - shl.b32 %r1190, %r1185, 24; - shl.b32 %r1191, %r1185, 8; - and.b32 %r1192, %r1191, 
16711680; - or.b32 %r1193, %r1190, %r1192; - or.b32 %r1194, %r1193, %r1189; - cvt.u64.u32 %rd2351, %r1194; - cvt.u64.u32 %rd2352, %r1004; - bfi.b64 %rd2353, %rd2349, %rd2352, 32, 32; - bfi.b64 %rd2354, %rd2350, %rd2351, 32, 32; - mov.b64 {%r1195, %r1196}, %rd2354; - mov.b64 {%r1197, %r1198}, %rd2353; - shf.l.wrap.b32 %r1199, %r1173, %r1173, 5; - xor.b32 %r1200, %r1174, %r1165; - and.b32 %r1201, %r1200, %r1164; - xor.b32 %r1202, %r1201, %r1165; - add.s32 %r1203, %r1195, %r1156; - add.s32 %r1204, %r1203, %r1202; - add.s32 %r1205, %r1204, %r1199; - add.s32 %r1206, %r1205, 1518500249; - shf.l.wrap.b32 %r1207, %r1164, %r1164, 30; - shf.l.wrap.b32 %r1208, %r1206, %r1206, 5; - xor.b32 %r1209, %r1207, %r1174; - and.b32 %r1210, %r1209, %r1173; - xor.b32 %r1211, %r1210, %r1174; - add.s32 %r1212, %r1196, %r1165; - add.s32 %r1213, %r1212, %r1211; - add.s32 %r1214, %r1213, %r1208; - add.s32 %r1215, %r1214, 1518500249; - shf.l.wrap.b32 %r1216, %r1173, %r1173, 30; - shf.l.wrap.b32 %r1217, %r1215, %r1215, 5; - xor.b32 %r1218, %r1216, %r1207; - and.b32 %r1219, %r1206, %r1218; - xor.b32 %r1220, %r1219, %r1207; - add.s32 %r1221, %r1197, %r1174; - add.s32 %r1222, %r1221, %r1220; - add.s32 %r1223, %r1222, %r1217; - add.s32 %r1224, %r1223, 1518500249; - shf.l.wrap.b32 %r1225, %r1206, %r1206, 30; - shf.l.wrap.b32 %r1226, %r1224, %r1224, 5; - xor.b32 %r1227, %r1225, %r1216; - and.b32 %r1228, %r1215, %r1227; - xor.b32 %r1229, %r1228, %r1216; - add.s32 %r1230, %r1198, %r1207; - add.s32 %r1231, %r1230, %r1229; - add.s32 %r1232, %r1231, %r1226; - add.s32 %r1233, %r1232, 1518500249; - shf.l.wrap.b32 %r1234, %r1215, %r1215, 30; - cvt.u64.u32 %rd2355, %r1225; - cvt.u64.u32 %rd2356, %r1234; - cvt.u64.u32 %rd2357, %r1224; - cvt.u64.u32 %rd2358, %r1233; - bfi.b64 %rd2359, %rd2357, %rd2358, 32, 32; - bfi.b64 %rd2360, %rd2355, %rd2356, 32, 32; - mov.b64 {%r1235, %r1236}, %rd2359; - mov.b64 {%r1237, %r1238}, %rd2360; - shr.u32 %r1239, %r972, 24; - shr.u32 %r1240, %r972, 8; - and.b32 %r1241, %r1240, 
65280; - or.b32 %r1242, %r1241, %r1239; - shl.b32 %r1243, %r972, 24; - shl.b32 %r1244, %r972, 8; - and.b32 %r1245, %r1244, 16711680; - or.b32 %r1246, %r1243, %r1245; - or.b32 %r1247, %r1246, %r1242; - cvt.u64.u32 %rd2361, %r1247; - shr.u32 %r1248, %r961, 24; - shr.u32 %r1249, %r961, 8; - and.b32 %r1250, %r1249, 65280; - or.b32 %r1251, %r1250, %r1248; - shl.b32 %r1252, %r961, 24; - shl.b32 %r1253, %r961, 8; - and.b32 %r1254, %r1253, 16711680; - or.b32 %r1255, %r1252, %r1254; - or.b32 %r1256, %r1255, %r1251; - shr.u32 %r1257, %r950, 24; - shr.u32 %r1258, %r950, 8; - and.b32 %r1259, %r1258, 65280; - or.b32 %r1260, %r1259, %r1257; - shl.b32 %r1261, %r950, 24; - shl.b32 %r1262, %r950, 8; - and.b32 %r1263, %r1262, 16711680; - or.b32 %r1264, %r1261, %r1263; - or.b32 %r1265, %r1264, %r1260; - cvt.u64.u32 %rd2362, %r1265; - shr.u32 %r1266, %r939, 24; - shr.u32 %r1267, %r939, 8; - and.b32 %r1268, %r1267, 65280; - or.b32 %r1269, %r1268, %r1266; - shl.b32 %r1270, %r939, 24; - shl.b32 %r1271, %r939, 8; - and.b32 %r1272, %r1271, 16711680; - or.b32 %r1273, %r1270, %r1272; - or.b32 %r1274, %r1273, %r1269; - cvt.u64.u32 %rd2363, %r1274; - cvt.u64.u32 %rd2364, %r1256; - bfi.b64 %rd2365, %rd2361, %rd2364, 32, 32; - bfi.b64 %rd2366, %rd2362, %rd2363, 32, 32; - mov.b64 {%r1275, %r1276}, %rd2366; - mov.b64 {%r1277, %r1278}, %rd2365; - xor.b16 %rs3116, %rs585, %rs3016; - xor.b16 %rs3117, %rs586, %rs3017; - shl.b16 %rs3118, %rs3117, 8; - or.b16 %rs3119, %rs3116, %rs3118; - xor.b16 %rs3120, %rs587, %rs3020; - xor.b16 %rs3121, %rs588, %rs3021; - shl.b16 %rs3122, %rs3121, 8; - or.b16 %rs3123, %rs3120, %rs3122; - mov.b32 %r1279, {%rs3119, %rs3123}; - shr.u32 %r1280, %r1279, 24; - shr.u32 %r1281, %r1279, 8; - and.b32 %r1282, %r1281, 65280; - or.b32 %r1283, %r1282, %r1280; - shl.b32 %r1284, %r1279, 24; - shl.b32 %r1285, %r1279, 8; - and.b32 %r1286, %r1285, 16711680; - or.b32 %r1287, %r1284, %r1286; - or.b32 %r1288, %r1287, %r1283; - xor.b32 %r1289, %r1132, %r1276; - xor.b32 %r1290, %r1133, 
%r1277; - xor.b32 %r1291, %r1134, %r1278; - xor.b32 %r1292, %r1196, %r1288; - xor.b32 %r1293, %r1289, %r1197; - shf.l.wrap.b32 %r1294, %r1293, %r1293, 1; - xor.b32 %r1295, %r1290, %r1198; - shf.l.wrap.b32 %r1296, %r1295, %r1295, 1; - shf.l.wrap.b32 %r1297, %r1292, %r1292, 1; - xor.b32 %r1298, %r1291, %r1297; - shf.l.wrap.b32 %r1299, %r1298, %r1298, 1; - cvt.u64.u32 %rd2367, %r1299; - cvt.u64.u32 %rd2368, %r1294; - cvt.u64.u32 %rd2369, %r1297; - cvt.u64.u32 %rd2370, %r1296; - bfi.b64 %rd2371, %rd2367, %rd2370, 32, 32; - bfi.b64 %rd2372, %rd2368, %rd2369, 32, 32; - mov.b64 {%r1300, %r1301}, %rd2372; - mov.b64 {%r1302, %r1303}, %rd2371; - cvt.u64.u32 %rd2373, %r1238; - cvt.u64.u32 %rd2374, %r1236; - cvt.u64.u32 %rd2375, %r1237; - bfi.b64 %rd2376, %rd2374, %rd2358, 32, 32; - bfi.b64 %rd2377, %rd2373, %rd2375, 32, 32; - mov.b64 {%r1304, %r1305}, %rd2376; - mov.b64 {%r1306, %r1307}, %rd2377; - shf.l.wrap.b32 %r1308, %r1304, %r1304, 5; - xor.b32 %r1309, %r1307, %r1306; - and.b32 %r1310, %r1309, %r1305; - xor.b32 %r1311, %r1310, %r1307; - add.s32 %r1312, %r1300, %r1216; - add.s32 %r1313, %r1312, %r1308; - add.s32 %r1314, %r1313, %r1311; - add.s32 %r1315, %r1314, 1518500249; - shf.l.wrap.b32 %r1316, %r1305, %r1305, 30; - shf.l.wrap.b32 %r1317, %r1315, %r1315, 5; - xor.b32 %r1318, %r1316, %r1306; - and.b32 %r1319, %r1318, %r1304; - xor.b32 %r1320, %r1319, %r1306; - add.s32 %r1321, %r1301, %r1307; - add.s32 %r1322, %r1321, %r1320; - add.s32 %r1323, %r1322, %r1317; - add.s32 %r1324, %r1323, 1518500249; - shf.l.wrap.b32 %r1325, %r1304, %r1304, 30; - shf.l.wrap.b32 %r1326, %r1324, %r1324, 5; - xor.b32 %r1327, %r1316, %r1325; - and.b32 %r1328, %r1315, %r1327; - xor.b32 %r1329, %r1328, %r1316; - add.s32 %r1330, %r1302, %r1306; - add.s32 %r1331, %r1330, %r1329; - add.s32 %r1332, %r1331, %r1326; - add.s32 %r1333, %r1332, 1518500249; - shf.l.wrap.b32 %r1334, %r1315, %r1315, 30; - shf.l.wrap.b32 %r1335, %r1333, %r1333, 5; - xor.b32 %r1336, %r1334, %r1325; - and.b32 %r1337, %r1324, 
%r1336; - xor.b32 %r1338, %r1337, %r1325; - add.s32 %r1339, %r1303, %r1316; - add.s32 %r1340, %r1339, %r1338; - add.s32 %r1341, %r1340, %r1335; - add.s32 %r1342, %r1341, 1518500249; - shf.l.wrap.b32 %r1343, %r1324, %r1324, 30; - xor.b32 %r1344, %r1131, %r982; - xor.b32 %r1345, %r1132, %r993; - cvt.u64.u32 %rd2378, %r1345; - shr.u32 %r1346, %r994, 24; - shr.u32 %r1347, %r994, 8; - and.b32 %r1348, %r1347, 65280; - or.b32 %r1349, %r1348, %r1346; - shl.b32 %r1350, %r994, 24; - shl.b32 %r1351, %r994, 8; - and.b32 %r1352, %r1351, 16711680; - or.b32 %r1353, %r1350, %r1352; - or.b32 %r1354, %r1353, %r1349; - cvt.u64.u32 %rd2379, %r1354; - shr.u32 %r1355, %r983, 24; - shr.u32 %r1356, %r983, 8; - and.b32 %r1357, %r1356, 65280; - or.b32 %r1358, %r1357, %r1355; - shl.b32 %r1359, %r983, 24; - shl.b32 %r1360, %r983, 8; - and.b32 %r1361, %r1360, 16711680; - or.b32 %r1362, %r1359, %r1361; - or.b32 %r1363, %r1362, %r1358; - cvt.u64.u32 %rd2380, %r1363; - cvt.u64.u32 %rd2381, %r1344; - bfi.b64 %rd2382, %rd2378, %rd2381, 32, 32; - bfi.b64 %rd2383, %rd2379, %rd2380, 32, 32; - mov.b64 {%r1364, %r1365}, %rd2383; - mov.b64 {%r1366, %r1367}, %rd2382; - xor.b16 %rs3124, %rs3064, %rs605; - xor.b16 %rs3125, %rs3065, %rs606; - shl.b16 %rs3126, %rs3125, 8; - or.b16 %rs3127, %rs3124, %rs3126; - xor.b16 %rs3128, %rs3068, %rs607; - xor.b16 %rs3129, %rs3069, %rs608; - shl.b16 %rs3130, %rs3129, 8; - or.b16 %rs3131, %rs3128, %rs3130; - mov.b32 %r1368, {%rs3127, %rs3131}; - shr.u32 %r1369, %r1368, 24; - shr.u32 %r1370, %r1368, 8; - and.b32 %r1371, %r1370, 65280; - or.b32 %r1372, %r1371, %r1369; - shl.b32 %r1373, %r1368, 24; - shl.b32 %r1374, %r1368, 8; - and.b32 %r1375, %r1374, 16711680; - or.b32 %r1376, %r1373, %r1375; - or.b32 %r1377, %r1376, %r1372; - xor.b32 %r1378, %r1365, %r1196; - xor.b32 %r1379, %r1366, %r1197; - xor.b32 %r1380, %r1367, %r1198; - xor.b32 %r1381, %r1301, %r1377; - xor.b32 %r1382, %r1378, %r1302; - shf.l.wrap.b32 %r1383, %r1382, %r1382, 1; - xor.b32 %r1384, %r1379, %r1303; - 
shf.l.wrap.b32 %r1385, %r1384, %r1384, 1; - shf.l.wrap.b32 %r1386, %r1381, %r1381, 1; - xor.b32 %r1387, %r1380, %r1386; - shf.l.wrap.b32 %r1388, %r1387, %r1387, 1; - cvt.u64.u32 %rd2384, %r1388; - cvt.u64.u32 %rd2385, %r1383; - cvt.u64.u32 %rd2386, %r1385; - bfi.b64 %rd2387, %rd2384, %rd2386, 32, 32; - cvt.u64.u32 %rd2388, %r1386; - bfi.b64 %rd2389, %rd2385, %rd2388, 32, 32; - mov.b64 {%r1389, %r1390}, %rd2389; - mov.b64 {%r1391, %r1392}, %rd2387; - cvt.u64.u32 %rd2390, %r1392; - cvt.u64.u32 %rd2391, %r1390; - cvt.u64.u32 %rd2392, %r1391; - bfi.b64 %rd2393, %rd2390, %rd2392, 32, 32; - bfi.b64 %rd2394, %rd2391, %rd2388, 32, 32; - mov.b64 {%r1393, %r1394}, %rd2394; - mov.b64 {%r1395, %r1396}, %rd2393; - shf.l.wrap.b32 %r1397, %r1342, %r1342, 5; - xor.b32 %r1398, %r1343, %r1334; - xor.b32 %r1399, %r1398, %r1333; - add.s32 %r1400, %r1393, %r1325; - add.s32 %r1401, %r1400, %r1399; - add.s32 %r1402, %r1401, %r1397; - add.s32 %r1403, %r1402, 1859775393; - shf.l.wrap.b32 %r1404, %r1333, %r1333, 30; - shf.l.wrap.b32 %r1405, %r1403, %r1403, 5; - xor.b32 %r1406, %r1404, %r1343; - xor.b32 %r1407, %r1406, %r1342; - add.s32 %r1408, %r1394, %r1334; - add.s32 %r1409, %r1408, %r1407; - add.s32 %r1410, %r1409, %r1405; - add.s32 %r1411, %r1410, 1859775393; - shf.l.wrap.b32 %r1412, %r1342, %r1342, 30; - shf.l.wrap.b32 %r1413, %r1411, %r1411, 5; - xor.b32 %r1414, %r1412, %r1404; - xor.b32 %r1415, %r1414, %r1403; - add.s32 %r1416, %r1395, %r1343; - add.s32 %r1417, %r1416, %r1415; - add.s32 %r1418, %r1417, %r1413; - add.s32 %r1419, %r1418, 1859775393; - shf.l.wrap.b32 %r1420, %r1403, %r1403, 30; - shf.l.wrap.b32 %r1421, %r1419, %r1419, 5; - xor.b32 %r1422, %r1420, %r1412; - xor.b32 %r1423, %r1422, %r1411; - add.s32 %r1424, %r1396, %r1404; - add.s32 %r1425, %r1424, %r1423; - add.s32 %r1426, %r1425, %r1421; - add.s32 %r1427, %r1426, 1859775393; - shf.l.wrap.b32 %r1428, %r1411, %r1411, 30; - cvt.u64.u32 %rd2395, %r1420; - cvt.u64.u32 %rd2396, %r1428; - cvt.u64.u32 %rd2397, %r1419; - 
cvt.u64.u32 %rd2398, %r1427; - bfi.b64 %rd2399, %rd2397, %rd2398, 32, 32; - bfi.b64 %rd2400, %rd2395, %rd2396, 32, 32; - mov.b64 {%r1429, %r1430}, %rd2399; - mov.b64 {%r1431, %r1432}, %rd2400; - xor.b32 %r1433, %r1134, %r1132; - xor.b32 %r1434, %r1195, %r1133; - xor.b32 %r1435, %r1196, %r1134; - cvt.u64.u32 %rd2401, %r1435; - cvt.u64.u32 %rd2402, %r1433; - xor.b32 %r1436, %r1133, %r1131; - cvt.u64.u32 %rd2403, %r1436; - cvt.u64.u32 %rd2404, %r1434; - bfi.b64 %rd2405, %rd2401, %rd2404, 32, 32; - bfi.b64 %rd2406, %rd2402, %rd2403, 32, 32; - mov.b64 {%r1437, %r1438}, %rd2406; - mov.b64 {%r1439, %r1440}, %rd2405; - xor.b32 %r1441, %r1297, %r1436; - xor.b32 %r1442, %r1301, %r1438; - xor.b32 %r1443, %r1302, %r1439; - xor.b32 %r1444, %r1303, %r1440; - xor.b32 %r1445, %r1394, %r1441; - xor.b32 %r1446, %r1442, %r1395; - shf.l.wrap.b32 %r1447, %r1446, %r1446, 1; - xor.b32 %r1448, %r1443, %r1396; - shf.l.wrap.b32 %r1449, %r1448, %r1448, 1; - shf.l.wrap.b32 %r1450, %r1445, %r1445, 1; - xor.b32 %r1451, %r1444, %r1450; - shf.l.wrap.b32 %r1452, %r1451, %r1451, 1; - cvt.u64.u32 %rd2407, %r1452; - cvt.u64.u32 %rd2408, %r1447; - cvt.u64.u32 %rd2409, %r1449; - bfi.b64 %rd2410, %rd2407, %rd2409, 32, 32; - cvt.u64.u32 %rd2411, %r1450; - bfi.b64 %rd2412, %rd2408, %rd2411, 32, 32; - mov.b64 {%r1453, %r1454}, %rd2412; - mov.b64 {%r1455, %r1456}, %rd2410; - cvt.u64.u32 %rd2413, %r1456; - cvt.u64.u32 %rd2414, %r1454; - cvt.u64.u32 %rd2415, %r1455; - bfi.b64 %rd2416, %rd2413, %rd2415, 32, 32; - bfi.b64 %rd2417, %rd2414, %rd2411, 32, 32; - mov.b64 {%r1457, %r1458}, %rd2417; - mov.b64 {%r1459, %r1460}, %rd2416; - cvt.u64.u32 %rd2418, %r1432; - cvt.u64.u32 %rd2419, %r1430; - cvt.u64.u32 %rd2420, %r1431; - bfi.b64 %rd2421, %rd2419, %rd2398, 32, 32; - bfi.b64 %rd2422, %rd2418, %rd2420, 32, 32; - mov.b64 {%r1461, %r1462}, %rd2421; - mov.b64 {%r1463, %r1464}, %rd2422; - shf.l.wrap.b32 %r1465, %r1461, %r1461, 5; - xor.b32 %r1466, %r1463, %r1462; - xor.b32 %r1467, %r1466, %r1464; - add.s32 %r1468, 
%r1457, %r1412; - add.s32 %r1469, %r1468, %r1465; - add.s32 %r1470, %r1469, %r1467; - add.s32 %r1471, %r1470, 1859775393; - shf.l.wrap.b32 %r1472, %r1462, %r1462, 30; - shf.l.wrap.b32 %r1473, %r1471, %r1471, 5; - xor.b32 %r1474, %r1463, %r1461; - xor.b32 %r1475, %r1474, %r1472; - add.s32 %r1476, %r1458, %r1464; - add.s32 %r1477, %r1476, %r1475; - add.s32 %r1478, %r1477, %r1473; - add.s32 %r1479, %r1478, 1859775393; - shf.l.wrap.b32 %r1480, %r1461, %r1461, 30; - shf.l.wrap.b32 %r1481, %r1479, %r1479, 5; - xor.b32 %r1482, %r1472, %r1480; - xor.b32 %r1483, %r1482, %r1471; - add.s32 %r1484, %r1459, %r1463; - add.s32 %r1485, %r1484, %r1483; - add.s32 %r1486, %r1485, %r1481; - add.s32 %r1487, %r1486, 1859775393; - shf.l.wrap.b32 %r1488, %r1471, %r1471, 30; - shf.l.wrap.b32 %r1489, %r1487, %r1487, 5; - xor.b32 %r1490, %r1488, %r1480; - xor.b32 %r1491, %r1490, %r1479; - add.s32 %r1492, %r1460, %r1472; - add.s32 %r1493, %r1492, %r1491; - add.s32 %r1494, %r1493, %r1489; - add.s32 %r1495, %r1494, 1859775393; - shf.l.wrap.b32 %r1496, %r1479, %r1479, 30; - xor.b32 %r1497, %r1198, %r1196; - xor.b32 %r1498, %r1300, %r1197; - xor.b32 %r1499, %r1301, %r1198; - cvt.u64.u32 %rd2423, %r1499; - cvt.u64.u32 %rd2424, %r1497; - xor.b32 %r1500, %r1197, %r1195; - cvt.u64.u32 %rd2425, %r1500; - cvt.u64.u32 %rd2426, %r1498; - bfi.b64 %rd2427, %rd2423, %rd2426, 32, 32; - bfi.b64 %rd2428, %rd2424, %rd2425, 32, 32; - mov.b64 {%r1501, %r1502}, %rd2428; - mov.b64 {%r1503, %r1504}, %rd2427; - xor.b32 %r1505, %r1386, %r1500; - xor.b32 %r1506, %r1394, %r1502; - xor.b32 %r1507, %r1395, %r1503; - xor.b32 %r1508, %r1396, %r1504; - xor.b32 %r1509, %r1458, %r1505; - xor.b32 %r1510, %r1506, %r1459; - shf.l.wrap.b32 %r1511, %r1510, %r1510, 1; - xor.b32 %r1512, %r1507, %r1460; - shf.l.wrap.b32 %r1513, %r1512, %r1512, 1; - shf.l.wrap.b32 %r1514, %r1509, %r1509, 1; - xor.b32 %r1515, %r1508, %r1514; - shf.l.wrap.b32 %r1516, %r1515, %r1515, 1; - cvt.u64.u32 %rd2429, %r1516; - cvt.u64.u32 %rd2430, %r1511; - 
cvt.u64.u32 %rd2431, %r1513; - bfi.b64 %rd2432, %rd2429, %rd2431, 32, 32; - cvt.u64.u32 %rd2433, %r1514; - bfi.b64 %rd2434, %rd2430, %rd2433, 32, 32; - mov.b64 {%r1517, %r1518}, %rd2434; - mov.b64 {%r1519, %r1520}, %rd2432; - cvt.u64.u32 %rd2435, %r1520; - cvt.u64.u32 %rd2436, %r1518; - cvt.u64.u32 %rd2437, %r1519; - bfi.b64 %rd2438, %rd2435, %rd2437, 32, 32; - bfi.b64 %rd2439, %rd2436, %rd2433, 32, 32; - mov.b64 {%r1521, %r1522}, %rd2439; - mov.b64 {%r1523, %r1524}, %rd2438; - shf.l.wrap.b32 %r1525, %r1495, %r1495, 5; - xor.b32 %r1526, %r1496, %r1488; - xor.b32 %r1527, %r1526, %r1487; - add.s32 %r1528, %r1521, %r1480; - add.s32 %r1529, %r1528, %r1527; - add.s32 %r1530, %r1529, %r1525; - add.s32 %r1531, %r1530, 1859775393; - shf.l.wrap.b32 %r1532, %r1487, %r1487, 30; - shf.l.wrap.b32 %r1533, %r1531, %r1531, 5; - xor.b32 %r1534, %r1532, %r1496; - xor.b32 %r1535, %r1534, %r1495; - add.s32 %r1536, %r1522, %r1488; - add.s32 %r1537, %r1536, %r1535; - add.s32 %r1538, %r1537, %r1533; - add.s32 %r1539, %r1538, 1859775393; - shf.l.wrap.b32 %r1540, %r1495, %r1495, 30; - shf.l.wrap.b32 %r1541, %r1539, %r1539, 5; - xor.b32 %r1542, %r1540, %r1532; - xor.b32 %r1543, %r1542, %r1531; - add.s32 %r1544, %r1523, %r1496; - add.s32 %r1545, %r1544, %r1543; - add.s32 %r1546, %r1545, %r1541; - add.s32 %r1547, %r1546, 1859775393; - shf.l.wrap.b32 %r1548, %r1531, %r1531, 30; - shf.l.wrap.b32 %r1549, %r1547, %r1547, 5; - xor.b32 %r1550, %r1548, %r1540; - xor.b32 %r1551, %r1550, %r1539; - add.s32 %r1552, %r1524, %r1532; - add.s32 %r1553, %r1552, %r1551; - add.s32 %r1554, %r1553, %r1549; - add.s32 %r1555, %r1554, 1859775393; - shf.l.wrap.b32 %r1556, %r1539, %r1539, 30; - cvt.u64.u32 %rd2440, %r1548; - cvt.u64.u32 %rd2441, %r1556; - cvt.u64.u32 %rd2442, %r1547; - cvt.u64.u32 %rd2443, %r1555; - bfi.b64 %rd2444, %rd2442, %rd2443, 32, 32; - bfi.b64 %rd2445, %rd2440, %rd2441, 32, 32; - mov.b64 {%r1557, %r1558}, %rd2444; - mov.b64 {%r1559, %r1560}, %rd2445; - xor.b32 %r1561, %r1303, %r1301; - 
xor.b32 %r1562, %r1393, %r1302; - xor.b32 %r1563, %r1394, %r1303; - cvt.u64.u32 %rd2446, %r1563; - cvt.u64.u32 %rd2447, %r1561; - xor.b32 %r1564, %r1302, %r1300; - cvt.u64.u32 %rd2448, %r1564; - cvt.u64.u32 %rd2449, %r1562; - bfi.b64 %rd2450, %rd2446, %rd2449, 32, 32; - bfi.b64 %rd2451, %rd2447, %rd2448, 32, 32; - mov.b64 {%r1565, %r1566}, %rd2451; - mov.b64 {%r1567, %r1568}, %rd2450; - xor.b32 %r1569, %r1450, %r1564; - xor.b32 %r1570, %r1458, %r1566; - xor.b32 %r1571, %r1459, %r1567; - xor.b32 %r1572, %r1460, %r1568; - xor.b32 %r1573, %r1522, %r1569; - xor.b32 %r1574, %r1570, %r1523; - shf.l.wrap.b32 %r1575, %r1574, %r1574, 1; - xor.b32 %r1576, %r1571, %r1524; - shf.l.wrap.b32 %r1577, %r1576, %r1576, 1; - shf.l.wrap.b32 %r1578, %r1573, %r1573, 1; - xor.b32 %r1579, %r1572, %r1578; - shf.l.wrap.b32 %r1580, %r1579, %r1579, 1; - cvt.u64.u32 %rd2452, %r1580; - cvt.u64.u32 %rd2453, %r1575; - cvt.u64.u32 %rd2454, %r1577; - bfi.b64 %rd2455, %rd2452, %rd2454, 32, 32; - cvt.u64.u32 %rd2456, %r1578; - bfi.b64 %rd2457, %rd2453, %rd2456, 32, 32; - mov.b64 {%r1581, %r1582}, %rd2457; - mov.b64 {%r1583, %r1584}, %rd2455; - cvt.u64.u32 %rd2458, %r1584; - cvt.u64.u32 %rd2459, %r1582; - cvt.u64.u32 %rd2460, %r1583; - bfi.b64 %rd2461, %rd2458, %rd2460, 32, 32; - bfi.b64 %rd2462, %rd2459, %rd2456, 32, 32; - mov.b64 {%r1585, %r1586}, %rd2462; - mov.b64 {%r1587, %r1588}, %rd2461; - cvt.u64.u32 %rd2463, %r1560; - cvt.u64.u32 %rd2464, %r1558; - cvt.u64.u32 %rd2465, %r1559; - bfi.b64 %rd2466, %rd2464, %rd2443, 32, 32; - bfi.b64 %rd2467, %rd2463, %rd2465, 32, 32; - mov.b64 {%r1589, %r1590}, %rd2466; - mov.b64 {%r1591, %r1592}, %rd2467; - shf.l.wrap.b32 %r1593, %r1589, %r1589, 5; - xor.b32 %r1594, %r1591, %r1590; - xor.b32 %r1595, %r1594, %r1592; - add.s32 %r1596, %r1585, %r1540; - add.s32 %r1597, %r1596, %r1593; - add.s32 %r1598, %r1597, %r1595; - add.s32 %r1599, %r1598, 1859775393; - shf.l.wrap.b32 %r1600, %r1590, %r1590, 30; - shf.l.wrap.b32 %r1601, %r1599, %r1599, 5; - xor.b32 %r1602, 
%r1591, %r1589; - xor.b32 %r1603, %r1602, %r1600; - add.s32 %r1604, %r1586, %r1592; - add.s32 %r1605, %r1604, %r1603; - add.s32 %r1606, %r1605, %r1601; - add.s32 %r1607, %r1606, 1859775393; - shf.l.wrap.b32 %r1608, %r1589, %r1589, 30; - shf.l.wrap.b32 %r1609, %r1607, %r1607, 5; - xor.b32 %r1610, %r1600, %r1608; - xor.b32 %r1611, %r1610, %r1599; - add.s32 %r1612, %r1587, %r1591; - add.s32 %r1613, %r1612, %r1611; - add.s32 %r1614, %r1613, %r1609; - add.s32 %r1615, %r1614, 1859775393; - shf.l.wrap.b32 %r1616, %r1599, %r1599, 30; - shf.l.wrap.b32 %r1617, %r1615, %r1615, 5; - xor.b32 %r1618, %r1616, %r1608; - xor.b32 %r1619, %r1618, %r1607; - add.s32 %r1620, %r1588, %r1600; - add.s32 %r1621, %r1620, %r1619; - add.s32 %r1622, %r1621, %r1617; - add.s32 %r1623, %r1622, 1859775393; - shf.l.wrap.b32 %r1624, %r1607, %r1607, 30; - xor.b32 %r1625, %r1396, %r1394; - xor.b32 %r1626, %r1457, %r1395; - xor.b32 %r1627, %r1458, %r1396; - cvt.u64.u32 %rd2468, %r1627; - cvt.u64.u32 %rd2469, %r1625; - xor.b32 %r1628, %r1395, %r1393; - cvt.u64.u32 %rd2470, %r1628; - cvt.u64.u32 %rd2471, %r1626; - bfi.b64 %rd2472, %rd2468, %rd2471, 32, 32; - bfi.b64 %rd2473, %rd2469, %rd2470, 32, 32; - mov.b64 {%r1629, %r1630}, %rd2473; - mov.b64 {%r1631, %r1632}, %rd2472; - xor.b32 %r1633, %r1514, %r1628; - xor.b32 %r1634, %r1522, %r1630; - xor.b32 %r1635, %r1523, %r1631; - xor.b32 %r1636, %r1524, %r1632; - xor.b32 %r1637, %r1586, %r1633; - xor.b32 %r1638, %r1634, %r1587; - shf.l.wrap.b32 %r1639, %r1638, %r1638, 1; - xor.b32 %r1640, %r1635, %r1588; - shf.l.wrap.b32 %r1641, %r1640, %r1640, 1; - shf.l.wrap.b32 %r1642, %r1637, %r1637, 1; - xor.b32 %r1643, %r1636, %r1642; - shf.l.wrap.b32 %r1644, %r1643, %r1643, 1; - cvt.u64.u32 %rd2474, %r1644; - cvt.u64.u32 %rd2475, %r1639; - cvt.u64.u32 %rd2476, %r1642; - cvt.u64.u32 %rd2477, %r1641; - bfi.b64 %rd2478, %rd2474, %rd2477, 32, 32; - bfi.b64 %rd2479, %rd2475, %rd2476, 32, 32; - mov.b64 {%r1645, %r1646}, %rd2479; - mov.b64 {%r1647, %r1648}, %rd2478; - 
shf.l.wrap.b32 %r1649, %r1623, %r1623, 5; - xor.b32 %r1650, %r1624, %r1616; - xor.b32 %r1651, %r1650, %r1615; - add.s32 %r1652, %r1645, %r1608; - add.s32 %r1653, %r1652, %r1651; - add.s32 %r1654, %r1653, %r1649; - add.s32 %r1655, %r1654, 1859775393; - shf.l.wrap.b32 %r1656, %r1615, %r1615, 30; - shf.l.wrap.b32 %r1657, %r1655, %r1655, 5; - xor.b32 %r1658, %r1656, %r1624; - xor.b32 %r1659, %r1658, %r1623; - add.s32 %r1660, %r1646, %r1616; - add.s32 %r1661, %r1660, %r1659; - add.s32 %r1662, %r1661, %r1657; - add.s32 %r1663, %r1662, 1859775393; - shf.l.wrap.b32 %r1664, %r1623, %r1623, 30; - shf.l.wrap.b32 %r1665, %r1663, %r1663, 5; - xor.b32 %r1666, %r1664, %r1656; - xor.b32 %r1667, %r1666, %r1655; - add.s32 %r1668, %r1647, %r1624; - add.s32 %r1669, %r1668, %r1667; - add.s32 %r1670, %r1669, %r1665; - add.s32 %r1671, %r1670, 1859775393; - shf.l.wrap.b32 %r1672, %r1655, %r1655, 30; - shf.l.wrap.b32 %r1673, %r1671, %r1671, 5; - xor.b32 %r1674, %r1672, %r1664; - xor.b32 %r1675, %r1674, %r1663; - add.s32 %r1676, %r1648, %r1656; - add.s32 %r1677, %r1676, %r1675; - add.s32 %r1678, %r1677, %r1673; - add.s32 %r1679, %r1678, 1859775393; - shf.l.wrap.b32 %r1680, %r1663, %r1663, 30; - cvt.u64.u32 %rd2480, %r1672; - cvt.u64.u32 %rd2481, %r1680; - cvt.u64.u32 %rd2482, %r1671; - cvt.u64.u32 %rd2483, %r1679; - bfi.b64 %rd2484, %rd2482, %rd2483, 32, 32; - bfi.b64 %rd2485, %rd2480, %rd2481, 32, 32; - mov.b64 {%r1681, %r1682}, %rd2484; - mov.b64 {%r1683, %r1684}, %rd2485; - xor.b32 %r1685, %r1460, %r1458; - xor.b32 %r1686, %r1521, %r1459; - xor.b32 %r1687, %r1522, %r1460; - cvt.u64.u32 %rd2486, %r1687; - cvt.u64.u32 %rd2487, %r1685; - xor.b32 %r1688, %r1459, %r1457; - cvt.u64.u32 %rd2488, %r1688; - cvt.u64.u32 %rd2489, %r1686; - bfi.b64 %rd2490, %rd2486, %rd2489, 32, 32; - bfi.b64 %rd2491, %rd2487, %rd2488, 32, 32; - mov.b64 {%r1689, %r1690}, %rd2491; - mov.b64 {%r1691, %r1692}, %rd2490; - xor.b32 %r1693, %r1578, %r1688; - xor.b32 %r1694, %r1586, %r1690; - xor.b32 %r1695, %r1587, %r1691; 
- xor.b32 %r1696, %r1588, %r1692; - xor.b32 %r1697, %r1646, %r1693; - xor.b32 %r1698, %r1694, %r1647; - shf.l.wrap.b32 %r1699, %r1698, %r1698, 1; - xor.b32 %r1700, %r1695, %r1648; - shf.l.wrap.b32 %r1701, %r1700, %r1700, 1; - shf.l.wrap.b32 %r1702, %r1697, %r1697, 1; - xor.b32 %r1703, %r1696, %r1702; - shf.l.wrap.b32 %r1704, %r1703, %r1703, 1; - cvt.u64.u32 %rd2492, %r1704; - cvt.u64.u32 %rd2493, %r1699; - cvt.u64.u32 %rd2494, %r1701; - bfi.b64 %rd2495, %rd2492, %rd2494, 32, 32; - cvt.u64.u32 %rd2496, %r1702; - bfi.b64 %rd2497, %rd2493, %rd2496, 32, 32; - mov.b64 {%r1705, %r1706}, %rd2497; - mov.b64 {%r1707, %r1708}, %rd2495; - cvt.u64.u32 %rd2498, %r1708; - cvt.u64.u32 %rd2499, %r1706; - cvt.u64.u32 %rd2500, %r1707; - bfi.b64 %rd2501, %rd2498, %rd2500, 32, 32; - bfi.b64 %rd2502, %rd2499, %rd2496, 32, 32; - mov.b64 {%r1709, %r1710}, %rd2502; - mov.b64 {%r1711, %r1712}, %rd2501; - cvt.u64.u32 %rd2503, %r1684; - cvt.u64.u32 %rd2504, %r1682; - cvt.u64.u32 %rd2505, %r1683; - bfi.b64 %rd2506, %rd2504, %rd2483, 32, 32; - bfi.b64 %rd2507, %rd2503, %rd2505, 32, 32; - mov.b64 {%r1713, %r1714}, %rd2506; - mov.b64 {%r1715, %r1716}, %rd2507; - shf.l.wrap.b32 %r1717, %r1713, %r1713, 5; - xor.b32 %r1718, %r1716, %r1715; - and.b32 %r1719, %r1718, %r1714; - and.b32 %r1720, %r1716, %r1715; - xor.b32 %r1721, %r1719, %r1720; - add.s32 %r1722, %r1709, %r1664; - add.s32 %r1723, %r1722, %r1717; - add.s32 %r1724, %r1723, %r1721; - add.s32 %r1725, %r1724, -1894007588; - shf.l.wrap.b32 %r1726, %r1714, %r1714, 30; - shf.l.wrap.b32 %r1727, %r1725, %r1725, 5; - xor.b32 %r1728, %r1726, %r1715; - and.b32 %r1729, %r1728, %r1713; - and.b32 %r1730, %r1726, %r1715; - xor.b32 %r1731, %r1729, %r1730; - add.s32 %r1732, %r1710, %r1716; - add.s32 %r1733, %r1732, %r1731; - add.s32 %r1734, %r1733, %r1727; - add.s32 %r1735, %r1734, -1894007588; - shf.l.wrap.b32 %r1736, %r1713, %r1713, 30; - shf.l.wrap.b32 %r1737, %r1735, %r1735, 5; - xor.b32 %r1738, %r1726, %r1736; - and.b32 %r1739, %r1725, %r1738; - 
and.b32 %r1740, %r1726, %r1736; - xor.b32 %r1741, %r1739, %r1740; - add.s32 %r1742, %r1711, %r1715; - add.s32 %r1743, %r1742, %r1741; - add.s32 %r1744, %r1743, %r1737; - add.s32 %r1745, %r1744, -1894007588; - shf.l.wrap.b32 %r1746, %r1725, %r1725, 30; - shf.l.wrap.b32 %r1747, %r1745, %r1745, 5; - xor.b32 %r1748, %r1746, %r1736; - and.b32 %r1749, %r1735, %r1748; - and.b32 %r1750, %r1746, %r1736; - xor.b32 %r1751, %r1749, %r1750; - add.s32 %r1752, %r1712, %r1726; - add.s32 %r1753, %r1752, %r1751; - add.s32 %r1754, %r1753, %r1747; - add.s32 %r1755, %r1754, -1894007588; - shf.l.wrap.b32 %r1756, %r1735, %r1735, 30; - xor.b32 %r1757, %r1524, %r1522; - xor.b32 %r1758, %r1585, %r1523; - xor.b32 %r1759, %r1586, %r1524; - cvt.u64.u32 %rd2508, %r1759; - cvt.u64.u32 %rd2509, %r1757; - xor.b32 %r1760, %r1523, %r1521; - cvt.u64.u32 %rd2510, %r1760; - cvt.u64.u32 %rd2511, %r1758; - bfi.b64 %rd2512, %rd2508, %rd2511, 32, 32; - bfi.b64 %rd2513, %rd2509, %rd2510, 32, 32; - mov.b64 {%r1761, %r1762}, %rd2513; - mov.b64 {%r1763, %r1764}, %rd2512; - xor.b32 %r1765, %r1642, %r1760; - xor.b32 %r1766, %r1646, %r1762; - xor.b32 %r1767, %r1647, %r1763; - xor.b32 %r1768, %r1648, %r1764; - xor.b32 %r1769, %r1710, %r1765; - xor.b32 %r1770, %r1766, %r1711; - shf.l.wrap.b32 %r1771, %r1770, %r1770, 1; - xor.b32 %r1772, %r1767, %r1712; - shf.l.wrap.b32 %r1773, %r1772, %r1772, 1; - shf.l.wrap.b32 %r1774, %r1769, %r1769, 1; - xor.b32 %r1775, %r1768, %r1774; - shf.l.wrap.b32 %r1776, %r1775, %r1775, 1; - cvt.u64.u32 %rd2514, %r1776; - cvt.u64.u32 %rd2515, %r1771; - cvt.u64.u32 %rd2516, %r1773; - bfi.b64 %rd2517, %rd2514, %rd2516, 32, 32; - cvt.u64.u32 %rd2518, %r1774; - bfi.b64 %rd2519, %rd2515, %rd2518, 32, 32; - mov.b64 {%r1777, %r1778}, %rd2519; - mov.b64 {%r1779, %r1780}, %rd2517; - cvt.u64.u32 %rd2520, %r1780; - cvt.u64.u32 %rd2521, %r1778; - cvt.u64.u32 %rd2522, %r1779; - bfi.b64 %rd2523, %rd2520, %rd2522, 32, 32; - bfi.b64 %rd2524, %rd2521, %rd2518, 32, 32; - mov.b64 {%r1781, %r1782}, %rd2524; - 
mov.b64 {%r1783, %r1784}, %rd2523; - shf.l.wrap.b32 %r1785, %r1755, %r1755, 5; - xor.b32 %r1786, %r1756, %r1746; - and.b32 %r1787, %r1786, %r1745; - and.b32 %r1788, %r1756, %r1746; - xor.b32 %r1789, %r1787, %r1788; - add.s32 %r1790, %r1781, %r1736; - add.s32 %r1791, %r1790, %r1789; - add.s32 %r1792, %r1791, %r1785; - add.s32 %r1793, %r1792, -1894007588; - shf.l.wrap.b32 %r1794, %r1745, %r1745, 30; - shf.l.wrap.b32 %r1795, %r1793, %r1793, 5; - xor.b32 %r1796, %r1794, %r1756; - and.b32 %r1797, %r1796, %r1755; - and.b32 %r1798, %r1794, %r1756; - xor.b32 %r1799, %r1797, %r1798; - add.s32 %r1800, %r1782, %r1746; - add.s32 %r1801, %r1800, %r1799; - add.s32 %r1802, %r1801, %r1795; - add.s32 %r1803, %r1802, -1894007588; - shf.l.wrap.b32 %r1804, %r1755, %r1755, 30; - shf.l.wrap.b32 %r1805, %r1803, %r1803, 5; - xor.b32 %r1806, %r1804, %r1794; - and.b32 %r1807, %r1793, %r1806; - and.b32 %r1808, %r1804, %r1794; - xor.b32 %r1809, %r1807, %r1808; - add.s32 %r1810, %r1783, %r1756; - add.s32 %r1811, %r1810, %r1809; - add.s32 %r1812, %r1811, %r1805; - add.s32 %r1813, %r1812, -1894007588; - shf.l.wrap.b32 %r1814, %r1793, %r1793, 30; - shf.l.wrap.b32 %r1815, %r1813, %r1813, 5; - xor.b32 %r1816, %r1814, %r1804; - and.b32 %r1817, %r1803, %r1816; - and.b32 %r1818, %r1814, %r1804; - xor.b32 %r1819, %r1817, %r1818; - add.s32 %r1820, %r1784, %r1794; - add.s32 %r1821, %r1820, %r1819; - add.s32 %r1822, %r1821, %r1815; - add.s32 %r1823, %r1822, -1894007588; - shf.l.wrap.b32 %r1824, %r1803, %r1803, 30; - cvt.u64.u32 %rd2525, %r1814; - cvt.u64.u32 %rd2526, %r1824; - cvt.u64.u32 %rd2527, %r1813; - cvt.u64.u32 %rd2528, %r1823; - bfi.b64 %rd2529, %rd2527, %rd2528, 32, 32; - bfi.b64 %rd2530, %rd2525, %rd2526, 32, 32; - mov.b64 {%r1825, %r1826}, %rd2529; - mov.b64 {%r1827, %r1828}, %rd2530; - xor.b32 %r1829, %r1588, %r1586; - xor.b32 %r1830, %r1645, %r1587; - xor.b32 %r1831, %r1646, %r1588; - cvt.u64.u32 %rd2531, %r1831; - cvt.u64.u32 %rd2532, %r1829; - xor.b32 %r1832, %r1587, %r1585; - cvt.u64.u32 
%rd2533, %r1832; - cvt.u64.u32 %rd2534, %r1830; - bfi.b64 %rd2535, %rd2531, %rd2534, 32, 32; - bfi.b64 %rd2536, %rd2532, %rd2533, 32, 32; - mov.b64 {%r1833, %r1834}, %rd2536; - mov.b64 {%r1835, %r1836}, %rd2535; - xor.b32 %r1837, %r1702, %r1832; - xor.b32 %r1838, %r1710, %r1834; - xor.b32 %r1839, %r1711, %r1835; - xor.b32 %r1840, %r1712, %r1836; - xor.b32 %r1841, %r1782, %r1837; - xor.b32 %r1842, %r1838, %r1783; - shf.l.wrap.b32 %r1843, %r1842, %r1842, 1; - xor.b32 %r1844, %r1839, %r1784; - shf.l.wrap.b32 %r1845, %r1844, %r1844, 1; - shf.l.wrap.b32 %r1846, %r1841, %r1841, 1; - xor.b32 %r1847, %r1840, %r1846; - shf.l.wrap.b32 %r1848, %r1847, %r1847, 1; - cvt.u64.u32 %rd2537, %r1848; - cvt.u64.u32 %rd2538, %r1843; - cvt.u64.u32 %rd2539, %r1845; - bfi.b64 %rd2540, %rd2537, %rd2539, 32, 32; - cvt.u64.u32 %rd2541, %r1846; - bfi.b64 %rd2542, %rd2538, %rd2541, 32, 32; - mov.b64 {%r1849, %r1850}, %rd2542; - mov.b64 {%r1851, %r1852}, %rd2540; - cvt.u64.u32 %rd2543, %r1852; - cvt.u64.u32 %rd2544, %r1850; - cvt.u64.u32 %rd2545, %r1851; - bfi.b64 %rd2546, %rd2543, %rd2545, 32, 32; - bfi.b64 %rd2547, %rd2544, %rd2541, 32, 32; - mov.b64 {%r1853, %r1854}, %rd2547; - mov.b64 {%r1855, %r1856}, %rd2546; - cvt.u64.u32 %rd2548, %r1828; - cvt.u64.u32 %rd2549, %r1826; - cvt.u64.u32 %rd2550, %r1827; - bfi.b64 %rd2551, %rd2549, %rd2528, 32, 32; - bfi.b64 %rd2552, %rd2548, %rd2550, 32, 32; - mov.b64 {%r1857, %r1858}, %rd2551; - mov.b64 {%r1859, %r1860}, %rd2552; - shf.l.wrap.b32 %r1861, %r1857, %r1857, 5; - xor.b32 %r1862, %r1860, %r1859; - and.b32 %r1863, %r1862, %r1858; - and.b32 %r1864, %r1860, %r1859; - xor.b32 %r1865, %r1863, %r1864; - add.s32 %r1866, %r1853, %r1804; - add.s32 %r1867, %r1866, %r1861; - add.s32 %r1868, %r1867, %r1865; - add.s32 %r1869, %r1868, -1894007588; - shf.l.wrap.b32 %r1870, %r1858, %r1858, 30; - shf.l.wrap.b32 %r1871, %r1869, %r1869, 5; - xor.b32 %r1872, %r1870, %r1859; - and.b32 %r1873, %r1872, %r1857; - and.b32 %r1874, %r1870, %r1859; - xor.b32 %r1875, %r1873, 
%r1874; - add.s32 %r1876, %r1854, %r1860; - add.s32 %r1877, %r1876, %r1875; - add.s32 %r1878, %r1877, %r1871; - add.s32 %r1879, %r1878, -1894007588; - shf.l.wrap.b32 %r1880, %r1857, %r1857, 30; - shf.l.wrap.b32 %r1881, %r1879, %r1879, 5; - xor.b32 %r1882, %r1870, %r1880; - and.b32 %r1883, %r1869, %r1882; - and.b32 %r1884, %r1870, %r1880; - xor.b32 %r1885, %r1883, %r1884; - add.s32 %r1886, %r1855, %r1859; - add.s32 %r1887, %r1886, %r1885; - add.s32 %r1888, %r1887, %r1881; - add.s32 %r1889, %r1888, -1894007588; - shf.l.wrap.b32 %r1890, %r1869, %r1869, 30; - shf.l.wrap.b32 %r1891, %r1889, %r1889, 5; - xor.b32 %r1892, %r1890, %r1880; - and.b32 %r1893, %r1879, %r1892; - and.b32 %r1894, %r1890, %r1880; - xor.b32 %r1895, %r1893, %r1894; - add.s32 %r1896, %r1856, %r1870; - add.s32 %r1897, %r1896, %r1895; - add.s32 %r1898, %r1897, %r1891; - add.s32 %r1899, %r1898, -1894007588; - shf.l.wrap.b32 %r1900, %r1879, %r1879, 30; - xor.b32 %r1901, %r1648, %r1646; - xor.b32 %r1902, %r1709, %r1647; - xor.b32 %r1903, %r1710, %r1648; - cvt.u64.u32 %rd2553, %r1903; - cvt.u64.u32 %rd2554, %r1901; - xor.b32 %r1904, %r1647, %r1645; - cvt.u64.u32 %rd2555, %r1904; - cvt.u64.u32 %rd2556, %r1902; - bfi.b64 %rd2557, %rd2553, %rd2556, 32, 32; - bfi.b64 %rd2558, %rd2554, %rd2555, 32, 32; - mov.b64 {%r1905, %r1906}, %rd2558; - mov.b64 {%r1907, %r1908}, %rd2557; - xor.b32 %r1909, %r1774, %r1904; - xor.b32 %r1910, %r1782, %r1906; - xor.b32 %r1911, %r1783, %r1907; - xor.b32 %r1912, %r1784, %r1908; - xor.b32 %r1913, %r1854, %r1909; - xor.b32 %r1914, %r1910, %r1855; - shf.l.wrap.b32 %r1915, %r1914, %r1914, 1; - xor.b32 %r1916, %r1911, %r1856; - shf.l.wrap.b32 %r1917, %r1916, %r1916, 1; - shf.l.wrap.b32 %r1918, %r1913, %r1913, 1; - xor.b32 %r1919, %r1912, %r1918; - shf.l.wrap.b32 %r1920, %r1919, %r1919, 1; - cvt.u64.u32 %rd2559, %r1920; - cvt.u64.u32 %rd2560, %r1915; - cvt.u64.u32 %rd2561, %r1917; - bfi.b64 %rd2562, %rd2559, %rd2561, 32, 32; - cvt.u64.u32 %rd2563, %r1918; - bfi.b64 %rd2564, %rd2560, 
%rd2563, 32, 32; - mov.b64 {%r1921, %r1922}, %rd2564; - mov.b64 {%r1923, %r1924}, %rd2562; - cvt.u64.u32 %rd2565, %r1924; - cvt.u64.u32 %rd2566, %r1922; - cvt.u64.u32 %rd2567, %r1923; - bfi.b64 %rd2568, %rd2565, %rd2567, 32, 32; - bfi.b64 %rd2569, %rd2566, %rd2563, 32, 32; - mov.b64 {%r1925, %r1926}, %rd2569; - mov.b64 {%r1927, %r1928}, %rd2568; - shf.l.wrap.b32 %r1929, %r1899, %r1899, 5; - xor.b32 %r1930, %r1900, %r1890; - and.b32 %r1931, %r1930, %r1889; - and.b32 %r1932, %r1900, %r1890; - xor.b32 %r1933, %r1931, %r1932; - add.s32 %r1934, %r1925, %r1880; - add.s32 %r1935, %r1934, %r1933; - add.s32 %r1936, %r1935, %r1929; - add.s32 %r1937, %r1936, -1894007588; - shf.l.wrap.b32 %r1938, %r1889, %r1889, 30; - shf.l.wrap.b32 %r1939, %r1937, %r1937, 5; - xor.b32 %r1940, %r1938, %r1900; - and.b32 %r1941, %r1940, %r1899; - and.b32 %r1942, %r1938, %r1900; - xor.b32 %r1943, %r1941, %r1942; - add.s32 %r1944, %r1926, %r1890; - add.s32 %r1945, %r1944, %r1943; - add.s32 %r1946, %r1945, %r1939; - add.s32 %r1947, %r1946, -1894007588; - shf.l.wrap.b32 %r1948, %r1899, %r1899, 30; - shf.l.wrap.b32 %r1949, %r1947, %r1947, 5; - xor.b32 %r1950, %r1948, %r1938; - and.b32 %r1951, %r1937, %r1950; - and.b32 %r1952, %r1948, %r1938; - xor.b32 %r1953, %r1951, %r1952; - add.s32 %r1954, %r1927, %r1900; - add.s32 %r1955, %r1954, %r1953; - add.s32 %r1956, %r1955, %r1949; - add.s32 %r1957, %r1956, -1894007588; - shf.l.wrap.b32 %r1958, %r1937, %r1937, 30; - shf.l.wrap.b32 %r1959, %r1957, %r1957, 5; - xor.b32 %r1960, %r1958, %r1948; - and.b32 %r1961, %r1947, %r1960; - and.b32 %r1962, %r1958, %r1948; - xor.b32 %r1963, %r1961, %r1962; - add.s32 %r1964, %r1928, %r1938; - add.s32 %r1965, %r1964, %r1963; - add.s32 %r1966, %r1965, %r1959; - add.s32 %r1967, %r1966, -1894007588; - shf.l.wrap.b32 %r1968, %r1947, %r1947, 30; - cvt.u64.u32 %rd2570, %r1958; - cvt.u64.u32 %rd2571, %r1968; - cvt.u64.u32 %rd2572, %r1957; - cvt.u64.u32 %rd2573, %r1967; - bfi.b64 %rd2574, %rd2572, %rd2573, 32, 32; - bfi.b64 %rd2575, 
%rd2570, %rd2571, 32, 32; - mov.b64 {%r1969, %r1970}, %rd2574; - mov.b64 {%r1971, %r1972}, %rd2575; - xor.b32 %r1973, %r1712, %r1710; - xor.b32 %r1974, %r1781, %r1711; - xor.b32 %r1975, %r1782, %r1712; - cvt.u64.u32 %rd2576, %r1975; - cvt.u64.u32 %rd2577, %r1973; - xor.b32 %r1976, %r1711, %r1709; - cvt.u64.u32 %rd2578, %r1976; - cvt.u64.u32 %rd2579, %r1974; - bfi.b64 %rd2580, %rd2576, %rd2579, 32, 32; - bfi.b64 %rd2581, %rd2577, %rd2578, 32, 32; - mov.b64 {%r1977, %r1978}, %rd2581; - mov.b64 {%r1979, %r1980}, %rd2580; - xor.b32 %r1981, %r1846, %r1976; - xor.b32 %r1982, %r1854, %r1978; - xor.b32 %r1983, %r1855, %r1979; - xor.b32 %r1984, %r1856, %r1980; - xor.b32 %r1985, %r1926, %r1981; - xor.b32 %r1986, %r1982, %r1927; - shf.l.wrap.b32 %r1987, %r1986, %r1986, 1; - xor.b32 %r1988, %r1983, %r1928; - shf.l.wrap.b32 %r1989, %r1988, %r1988, 1; - shf.l.wrap.b32 %r1990, %r1985, %r1985, 1; - xor.b32 %r1991, %r1984, %r1990; - shf.l.wrap.b32 %r1992, %r1991, %r1991, 1; - cvt.u64.u32 %rd2582, %r1992; - cvt.u64.u32 %rd2583, %r1987; - cvt.u64.u32 %rd2584, %r1990; - cvt.u64.u32 %rd2585, %r1989; - bfi.b64 %rd2586, %rd2582, %rd2585, 32, 32; - bfi.b64 %rd2587, %rd2583, %rd2584, 32, 32; - mov.b64 {%r1993, %r1994}, %rd2587; - mov.b64 {%r1995, %r1996}, %rd2586; - cvt.u64.u32 %rd2588, %r1972; - cvt.u64.u32 %rd2589, %r1970; - cvt.u64.u32 %rd2590, %r1971; - bfi.b64 %rd2591, %rd2589, %rd2573, 32, 32; - bfi.b64 %rd2592, %rd2588, %rd2590, 32, 32; - mov.b64 {%r1997, %r1998}, %rd2591; - mov.b64 {%r1999, %r2000}, %rd2592; - shf.l.wrap.b32 %r2001, %r1997, %r1997, 5; - xor.b32 %r2002, %r2000, %r1999; - and.b32 %r2003, %r2002, %r1998; - and.b32 %r2004, %r2000, %r1999; - xor.b32 %r2005, %r2003, %r2004; - add.s32 %r2006, %r1993, %r1948; - add.s32 %r2007, %r2006, %r2001; - add.s32 %r2008, %r2007, %r2005; - add.s32 %r2009, %r2008, -1894007588; - shf.l.wrap.b32 %r2010, %r1998, %r1998, 30; - shf.l.wrap.b32 %r2011, %r2009, %r2009, 5; - xor.b32 %r2012, %r2010, %r1999; - and.b32 %r2013, %r2012, %r1997; - 
and.b32 %r2014, %r2010, %r1999; - xor.b32 %r2015, %r2013, %r2014; - add.s32 %r2016, %r1994, %r2000; - add.s32 %r2017, %r2016, %r2015; - add.s32 %r2018, %r2017, %r2011; - add.s32 %r2019, %r2018, -1894007588; - shf.l.wrap.b32 %r2020, %r1997, %r1997, 30; - shf.l.wrap.b32 %r2021, %r2019, %r2019, 5; - xor.b32 %r2022, %r2010, %r2020; - and.b32 %r2023, %r2009, %r2022; - and.b32 %r2024, %r2010, %r2020; - xor.b32 %r2025, %r2023, %r2024; - add.s32 %r2026, %r1995, %r1999; - add.s32 %r2027, %r2026, %r2025; - add.s32 %r2028, %r2027, %r2021; - add.s32 %r2029, %r2028, -1894007588; - shf.l.wrap.b32 %r2030, %r2009, %r2009, 30; - shf.l.wrap.b32 %r2031, %r2029, %r2029, 5; - xor.b32 %r2032, %r2030, %r2020; - and.b32 %r2033, %r2019, %r2032; - and.b32 %r2034, %r2030, %r2020; - xor.b32 %r2035, %r2033, %r2034; - add.s32 %r2036, %r1996, %r2010; - add.s32 %r2037, %r2036, %r2035; - add.s32 %r2038, %r2037, %r2031; - add.s32 %r2039, %r2038, -1894007588; - shf.l.wrap.b32 %r2040, %r2019, %r2019, 30; - xor.b32 %r2041, %r1784, %r1782; - xor.b32 %r2042, %r1853, %r1783; - xor.b32 %r2043, %r1854, %r1784; - cvt.u64.u32 %rd2593, %r2043; - cvt.u64.u32 %rd2594, %r2041; - xor.b32 %r2044, %r1783, %r1781; - cvt.u64.u32 %rd2595, %r2044; - cvt.u64.u32 %rd2596, %r2042; - bfi.b64 %rd2597, %rd2593, %rd2596, 32, 32; - bfi.b64 %rd2598, %rd2594, %rd2595, 32, 32; - mov.b64 {%r2045, %r2046}, %rd2598; - mov.b64 {%r2047, %r2048}, %rd2597; - xor.b32 %r2049, %r1918, %r2044; - xor.b32 %r2050, %r1926, %r2046; - xor.b32 %r2051, %r1927, %r2047; - xor.b32 %r2052, %r1928, %r2048; - xor.b32 %r2053, %r1994, %r2049; - xor.b32 %r2054, %r2050, %r1995; - shf.l.wrap.b32 %r2055, %r2054, %r2054, 1; - xor.b32 %r2056, %r2051, %r1996; - shf.l.wrap.b32 %r2057, %r2056, %r2056, 1; - shf.l.wrap.b32 %r2058, %r2053, %r2053, 1; - xor.b32 %r2059, %r2052, %r2058; - shf.l.wrap.b32 %r2060, %r2059, %r2059, 1; - cvt.u64.u32 %rd2599, %r2060; - cvt.u64.u32 %rd2600, %r2055; - cvt.u64.u32 %rd2601, %r2057; - bfi.b64 %rd2602, %rd2599, %rd2601, 32, 32; - 
cvt.u64.u32 %rd2603, %r2058; - bfi.b64 %rd2604, %rd2600, %rd2603, 32, 32; - mov.b64 {%r2061, %r2062}, %rd2604; - mov.b64 {%r2063, %r2064}, %rd2602; - cvt.u64.u32 %rd2605, %r2064; - cvt.u64.u32 %rd2606, %r2062; - cvt.u64.u32 %rd2607, %r2063; - bfi.b64 %rd2608, %rd2605, %rd2607, 32, 32; - bfi.b64 %rd2609, %rd2606, %rd2603, 32, 32; - mov.b64 {%r2065, %r2066}, %rd2609; - mov.b64 {%r2067, %r2068}, %rd2608; - shf.l.wrap.b32 %r2069, %r2039, %r2039, 5; - xor.b32 %r2070, %r2040, %r2030; - xor.b32 %r2071, %r2070, %r2029; - add.s32 %r2072, %r2065, %r2020; - add.s32 %r2073, %r2072, %r2071; - add.s32 %r2074, %r2073, %r2069; - add.s32 %r2075, %r2074, -899497514; - shf.l.wrap.b32 %r2076, %r2029, %r2029, 30; - shf.l.wrap.b32 %r2077, %r2075, %r2075, 5; - xor.b32 %r2078, %r2076, %r2040; - xor.b32 %r2079, %r2078, %r2039; - add.s32 %r2080, %r2066, %r2030; - add.s32 %r2081, %r2080, %r2079; - add.s32 %r2082, %r2081, %r2077; - add.s32 %r2083, %r2082, -899497514; - shf.l.wrap.b32 %r2084, %r2039, %r2039, 30; - shf.l.wrap.b32 %r2085, %r2083, %r2083, 5; - xor.b32 %r2086, %r2084, %r2076; - xor.b32 %r2087, %r2086, %r2075; - add.s32 %r2088, %r2067, %r2040; - add.s32 %r2089, %r2088, %r2087; - add.s32 %r2090, %r2089, %r2085; - add.s32 %r2091, %r2090, -899497514; - shf.l.wrap.b32 %r2092, %r2075, %r2075, 30; - shf.l.wrap.b32 %r2093, %r2091, %r2091, 5; - xor.b32 %r2094, %r2092, %r2084; - xor.b32 %r2095, %r2094, %r2083; - add.s32 %r2096, %r2068, %r2076; - add.s32 %r2097, %r2096, %r2095; - add.s32 %r2098, %r2097, %r2093; - add.s32 %r2099, %r2098, -899497514; - shf.l.wrap.b32 %r2100, %r2083, %r2083, 30; - cvt.u64.u32 %rd2610, %r2092; - cvt.u64.u32 %rd2611, %r2100; - cvt.u64.u32 %rd2612, %r2091; - cvt.u64.u32 %rd2613, %r2099; - bfi.b64 %rd2614, %rd2612, %rd2613, 32, 32; - bfi.b64 %rd2615, %rd2610, %rd2611, 32, 32; - mov.b64 {%r2101, %r2102}, %rd2614; - mov.b64 {%r2103, %r2104}, %rd2615; - xor.b32 %r2105, %r1856, %r1854; - xor.b32 %r2106, %r1925, %r1855; - xor.b32 %r2107, %r1926, %r1856; - cvt.u64.u32 
%rd2616, %r2107; - cvt.u64.u32 %rd2617, %r2105; - xor.b32 %r2108, %r1855, %r1853; - cvt.u64.u32 %rd2618, %r2108; - cvt.u64.u32 %rd2619, %r2106; - bfi.b64 %rd2620, %rd2616, %rd2619, 32, 32; - bfi.b64 %rd2621, %rd2617, %rd2618, 32, 32; - mov.b64 {%r2109, %r2110}, %rd2621; - mov.b64 {%r2111, %r2112}, %rd2620; - xor.b32 %r2113, %r1990, %r2108; - xor.b32 %r2114, %r1994, %r2110; - xor.b32 %r2115, %r1995, %r2111; - xor.b32 %r2116, %r1996, %r2112; - xor.b32 %r2117, %r2066, %r2113; - xor.b32 %r2118, %r2114, %r2067; - shf.l.wrap.b32 %r2119, %r2118, %r2118, 1; - xor.b32 %r2120, %r2115, %r2068; - shf.l.wrap.b32 %r2121, %r2120, %r2120, 1; - shf.l.wrap.b32 %r2122, %r2117, %r2117, 1; - xor.b32 %r2123, %r2116, %r2122; - shf.l.wrap.b32 %r2124, %r2123, %r2123, 1; - cvt.u64.u32 %rd2622, %r2124; - cvt.u64.u32 %rd2623, %r2119; - cvt.u64.u32 %rd2624, %r2121; - bfi.b64 %rd2625, %rd2622, %rd2624, 32, 32; - cvt.u64.u32 %rd2626, %r2122; - bfi.b64 %rd2627, %rd2623, %rd2626, 32, 32; - mov.b64 {%r2125, %r2126}, %rd2627; - mov.b64 {%r2127, %r2128}, %rd2625; - cvt.u64.u32 %rd2628, %r2128; - cvt.u64.u32 %rd2629, %r2126; - cvt.u64.u32 %rd2630, %r2127; - bfi.b64 %rd2631, %rd2628, %rd2630, 32, 32; - bfi.b64 %rd2632, %rd2629, %rd2626, 32, 32; - mov.b64 {%r2129, %r2130}, %rd2632; - mov.b64 {%r2131, %r2132}, %rd2631; - cvt.u64.u32 %rd2633, %r2104; - cvt.u64.u32 %rd2634, %r2102; - cvt.u64.u32 %rd2635, %r2103; - bfi.b64 %rd2636, %rd2634, %rd2613, 32, 32; - bfi.b64 %rd2637, %rd2633, %rd2635, 32, 32; - mov.b64 {%r2133, %r2134}, %rd2636; - mov.b64 {%r2135, %r2136}, %rd2637; - shf.l.wrap.b32 %r2137, %r2133, %r2133, 5; - xor.b32 %r2138, %r2135, %r2134; - xor.b32 %r2139, %r2138, %r2136; - add.s32 %r2140, %r2129, %r2084; - add.s32 %r2141, %r2140, %r2137; - add.s32 %r2142, %r2141, %r2139; - add.s32 %r2143, %r2142, -899497514; - shf.l.wrap.b32 %r2144, %r2134, %r2134, 30; - shf.l.wrap.b32 %r2145, %r2143, %r2143, 5; - xor.b32 %r2146, %r2135, %r2133; - xor.b32 %r2147, %r2146, %r2144; - add.s32 %r2148, %r2130, 
%r2136; - add.s32 %r2149, %r2148, %r2147; - add.s32 %r2150, %r2149, %r2145; - add.s32 %r2151, %r2150, -899497514; - shf.l.wrap.b32 %r2152, %r2133, %r2133, 30; - shf.l.wrap.b32 %r2153, %r2151, %r2151, 5; - xor.b32 %r2154, %r2144, %r2152; - xor.b32 %r2155, %r2154, %r2143; - add.s32 %r2156, %r2131, %r2135; - add.s32 %r2157, %r2156, %r2155; - add.s32 %r2158, %r2157, %r2153; - add.s32 %r2159, %r2158, -899497514; - shf.l.wrap.b32 %r2160, %r2143, %r2143, 30; - shf.l.wrap.b32 %r2161, %r2159, %r2159, 5; - xor.b32 %r2162, %r2160, %r2152; - xor.b32 %r2163, %r2162, %r2151; - add.s32 %r2164, %r2132, %r2144; - add.s32 %r2165, %r2164, %r2163; - add.s32 %r2166, %r2165, %r2161; - add.s32 %r2167, %r2166, -899497514; - shf.l.wrap.b32 %r2168, %r2151, %r2151, 30; - xor.b32 %r2169, %r1928, %r1926; - xor.b32 %r2170, %r1993, %r1927; - xor.b32 %r2171, %r1994, %r1928; - cvt.u64.u32 %rd2638, %r2171; - cvt.u64.u32 %rd2639, %r2169; - xor.b32 %r2172, %r1927, %r1925; - cvt.u64.u32 %rd2640, %r2172; - cvt.u64.u32 %rd2641, %r2170; - bfi.b64 %rd2642, %rd2638, %rd2641, 32, 32; - bfi.b64 %rd2643, %rd2639, %rd2640, 32, 32; - mov.b64 {%r2173, %r2174}, %rd2643; - mov.b64 {%r2175, %r2176}, %rd2642; - xor.b32 %r2177, %r2058, %r2172; - xor.b32 %r2178, %r2066, %r2174; - xor.b32 %r2179, %r2067, %r2175; - xor.b32 %r2180, %r2068, %r2176; - xor.b32 %r2181, %r2130, %r2177; - xor.b32 %r2182, %r2178, %r2131; - shf.l.wrap.b32 %r2183, %r2182, %r2182, 1; - xor.b32 %r2184, %r2179, %r2132; - shf.l.wrap.b32 %r2185, %r2184, %r2184, 1; - shf.l.wrap.b32 %r2186, %r2181, %r2181, 1; - xor.b32 %r2187, %r2180, %r2186; - shf.l.wrap.b32 %r2188, %r2187, %r2187, 1; - cvt.u64.u32 %rd2644, %r2188; - cvt.u64.u32 %rd2645, %r2183; - cvt.u64.u32 %rd2646, %r2185; - bfi.b64 %rd2647, %rd2644, %rd2646, 32, 32; - cvt.u64.u32 %rd2648, %r2186; - bfi.b64 %rd2649, %rd2645, %rd2648, 32, 32; - mov.b64 {%r2189, %r2190}, %rd2649; - mov.b64 {%r2191, %r2192}, %rd2647; - cvt.u64.u32 %rd2650, %r2192; - cvt.u64.u32 %rd2651, %r2190; - cvt.u64.u32 %rd2652, 
%r2191; - bfi.b64 %rd2653, %rd2650, %rd2652, 32, 32; - bfi.b64 %rd2654, %rd2651, %rd2648, 32, 32; - mov.b64 {%r2193, %r2194}, %rd2654; - mov.b64 {%r2195, %r2196}, %rd2653; - shf.l.wrap.b32 %r2197, %r2167, %r2167, 5; - xor.b32 %r2198, %r2168, %r2160; - xor.b32 %r2199, %r2198, %r2159; - add.s32 %r2200, %r2193, %r2152; - add.s32 %r2201, %r2200, %r2199; - add.s32 %r2202, %r2201, %r2197; - add.s32 %r2203, %r2202, -899497514; - shf.l.wrap.b32 %r2204, %r2159, %r2159, 30; - shf.l.wrap.b32 %r2205, %r2203, %r2203, 5; - xor.b32 %r2206, %r2204, %r2168; - xor.b32 %r2207, %r2206, %r2167; - add.s32 %r2208, %r2194, %r2160; - add.s32 %r2209, %r2208, %r2207; - add.s32 %r2210, %r2209, %r2205; - add.s32 %r2211, %r2210, -899497514; - shf.l.wrap.b32 %r2212, %r2167, %r2167, 30; - shf.l.wrap.b32 %r2213, %r2211, %r2211, 5; - xor.b32 %r2214, %r2212, %r2204; - xor.b32 %r2215, %r2214, %r2203; - add.s32 %r2216, %r2195, %r2168; - add.s32 %r2217, %r2216, %r2215; - add.s32 %r2218, %r2217, %r2213; - add.s32 %r2219, %r2218, -899497514; - shf.l.wrap.b32 %r2220, %r2203, %r2203, 30; - shf.l.wrap.b32 %r2221, %r2219, %r2219, 5; - xor.b32 %r2222, %r2220, %r2212; - xor.b32 %r2223, %r2222, %r2211; - add.s32 %r2224, %r2196, %r2204; - add.s32 %r2225, %r2224, %r2223; - add.s32 %r2226, %r2225, %r2221; - add.s32 %r2227, %r2226, -899497514; - shf.l.wrap.b32 %r2228, %r2211, %r2211, 30; - cvt.u64.u32 %rd2655, %r2220; - cvt.u64.u32 %rd2656, %r2228; - cvt.u64.u32 %rd2657, %r2219; - cvt.u64.u32 %rd2658, %r2227; - bfi.b64 %rd2659, %rd2657, %rd2658, 32, 32; - bfi.b64 %rd2660, %rd2655, %rd2656, 32, 32; - mov.b64 {%r2229, %r2230}, %rd2659; - mov.b64 {%r2231, %r2232}, %rd2660; - xor.b32 %r2233, %r1996, %r1994; - xor.b32 %r2234, %r2065, %r1995; - xor.b32 %r2235, %r2066, %r1996; - cvt.u64.u32 %rd2661, %r2235; - cvt.u64.u32 %rd2662, %r2233; - xor.b32 %r2236, %r1995, %r1993; - cvt.u64.u32 %rd2663, %r2236; - cvt.u64.u32 %rd2664, %r2234; - bfi.b64 %rd2665, %rd2661, %rd2664, 32, 32; - bfi.b64 %rd2666, %rd2662, %rd2663, 32, 32; - 
mov.b64 {%r2237, %r2238}, %rd2666; - mov.b64 {%r2239, %r2240}, %rd2665; - xor.b32 %r2241, %r2122, %r2236; - xor.b32 %r2242, %r2130, %r2238; - xor.b32 %r2243, %r2131, %r2239; - xor.b32 %r2244, %r2132, %r2240; - xor.b32 %r2245, %r2194, %r2241; - shf.l.wrap.b32 %r2246, %r2245, %r2245, 1; - xor.b32 %r2247, %r2242, %r2195; - shf.l.wrap.b32 %r2248, %r2247, %r2247, 1; - xor.b32 %r2249, %r2243, %r2196; - shf.l.wrap.b32 %r2250, %r2249, %r2249, 1; - xor.b32 %r2251, %r2244, %r2246; - shf.l.wrap.b32 %r2252, %r2251, %r2251, 1; - cvt.u64.u32 %rd2667, %r2252; - cvt.u64.u32 %rd2668, %r2248; - cvt.u64.u32 %rd2669, %r2250; - bfi.b64 %rd2670, %rd2667, %rd2669, 32, 32; - cvt.u64.u32 %rd2671, %r2246; - bfi.b64 %rd2672, %rd2668, %rd2671, 32, 32; - mov.b64 {%r2253, %r2254}, %rd2672; - mov.b64 {%r2255, %r2256}, %rd2670; - cvt.u64.u32 %rd2673, %r2256; - cvt.u64.u32 %rd2674, %r2254; - cvt.u64.u32 %rd2675, %r2255; - bfi.b64 %rd2676, %rd2673, %rd2675, 32, 32; - bfi.b64 %rd2677, %rd2674, %rd2671, 32, 32; - mov.b64 {%r2257, %r2258}, %rd2677; - mov.b64 {%r2259, %r2260}, %rd2676; - cvt.u64.u32 %rd2678, %r2232; - cvt.u64.u32 %rd2679, %r2230; - cvt.u64.u32 %rd2680, %r2231; - bfi.b64 %rd2681, %rd2679, %rd2658, 32, 32; - bfi.b64 %rd2682, %rd2678, %rd2680, 32, 32; - mov.b64 {%r2261, %r2262}, %rd2681; - mov.b64 {%r2263, %r2264}, %rd2682; - shf.l.wrap.b32 %r2265, %r2261, %r2261, 5; - xor.b32 %r2266, %r2263, %r2262; - xor.b32 %r2267, %r2266, %r2264; - add.s32 %r2268, %r2212, %r2257; - add.s32 %r2269, %r2268, %r2265; - add.s32 %r2270, %r2269, %r2267; - add.s32 %r2271, %r2270, -899497514; - shf.l.wrap.b32 %r2272, %r2262, %r2262, 30; - shf.l.wrap.b32 %r2273, %r2271, %r2271, 5; - xor.b32 %r2274, %r2263, %r2261; - xor.b32 %r2275, %r2274, %r2272; - add.s32 %r2276, %r2258, %r2264; - add.s32 %r2277, %r2276, %r2275; - add.s32 %r2278, %r2277, %r2273; - add.s32 %r2279, %r2278, -899497514; - shf.l.wrap.b32 %r2280, %r2261, %r2261, 30; - shf.l.wrap.b32 %r2281, %r2279, %r2279, 5; - xor.b32 %r2282, %r2272, %r2280; - 
xor.b32 %r2283, %r2282, %r2271; - add.s32 %r2284, %r2259, %r2263; - add.s32 %r2285, %r2284, %r2283; - add.s32 %r2286, %r2285, %r2281; - add.s32 %r2287, %r2286, -899497514; - shf.l.wrap.b32 %r2288, %r2271, %r2271, 30; - shf.l.wrap.b32 %r2289, %r2287, %r2287, 5; - xor.b32 %r2290, %r2288, %r2280; - xor.b32 %r2291, %r2290, %r2279; - add.s32 %r2292, %r2260, %r2272; - add.s32 %r2293, %r2292, %r2291; - add.s32 %r2294, %r2293, %r2289; - add.s32 %r2295, %r2294, -899497514; - shf.l.wrap.b32 %r2296, %r2279, %r2279, 30; - xor.b32 %r2297, %r2068, %r2066; - xor.b32 %r2298, %r2129, %r2067; - xor.b32 %r2299, %r2130, %r2068; - cvt.u64.u32 %rd2683, %r2299; - cvt.u64.u32 %rd2684, %r2297; - xor.b32 %r2300, %r2067, %r2065; - cvt.u64.u32 %rd2685, %r2300; - cvt.u64.u32 %rd2686, %r2298; - bfi.b64 %rd2687, %rd2683, %rd2686, 32, 32; - bfi.b64 %rd2688, %rd2684, %rd2685, 32, 32; - mov.b64 {%r2301, %r2302}, %rd2688; - mov.b64 {%r2303, %r2304}, %rd2687; - xor.b32 %r2305, %r2186, %r2300; - xor.b32 %r2306, %r2194, %r2302; - xor.b32 %r2307, %r2195, %r2303; - xor.b32 %r2308, %r2196, %r2304; - xor.b32 %r2309, %r2258, %r2305; - shf.l.wrap.b32 %r2310, %r2309, %r2309, 1; - xor.b32 %r2311, %r2306, %r2259; - shf.l.wrap.b32 %r2312, %r2311, %r2311, 1; - xor.b32 %r2313, %r2307, %r2260; - shf.l.wrap.b32 %r2314, %r2313, %r2313, 1; - xor.b32 %r2315, %r2308, %r2310; - shf.l.wrap.b32 %r2316, %r2315, %r2315, 1; - shf.l.wrap.b32 %r2317, %r2295, %r2295, 5; - xor.b32 %r2318, %r2296, %r2288; - xor.b32 %r2319, %r2318, %r2287; - add.s32 %r2320, %r2310, %r2280; - add.s32 %r2321, %r2320, %r2319; - add.s32 %r2322, %r2321, %r2317; - add.s32 %r2323, %r2322, -899497514; - shf.l.wrap.b32 %r2324, %r2287, %r2287, 30; - shf.l.wrap.b32 %r2325, %r2323, %r2323, 5; - xor.b32 %r2326, %r2324, %r2296; - xor.b32 %r2327, %r2326, %r2295; - add.s32 %r2328, %r2312, %r2288; - add.s32 %r2329, %r2328, %r2327; - add.s32 %r2330, %r2329, %r2325; - add.s32 %r2331, %r2330, -899497514; - shf.l.wrap.b32 %r2332, %r2295, %r2295, 30; - shf.l.wrap.b32 
%r2333, %r2331, %r2331, 5; - xor.b32 %r2334, %r2332, %r2324; - xor.b32 %r2335, %r2334, %r2323; - add.s32 %r2336, %r2314, %r2296; - add.s32 %r2337, %r2336, %r2335; - add.s32 %r2338, %r2337, %r2333; - add.s32 %r2339, %r2338, -899497514; - shf.l.wrap.b32 %r2340, %r2323, %r2323, 30; - shf.l.wrap.b32 %r2341, %r2339, %r2339, 5; - xor.b32 %r2342, %r2340, %r2332; - xor.b32 %r2343, %r2342, %r2331; - shf.l.wrap.b32 %r2344, %r2331, %r2331, 30; - add.s32 %r2345, %r9085, %r2316; - add.s32 %r2346, %r2345, %r2324; - add.s32 %r2347, %r2346, %r2343; - add.s32 %r2348, %r2347, %r2341; - add.s32 %r9085, %r2348, -899497514; - add.s32 %r9086, %r2339, %r9086; - add.s32 %r9087, %r2344, %r9087; - add.s32 %r9088, %r2340, %r9088; - add.s32 %r9089, %r2332, %r9089; - setp.eq.s64 %p194, %rd4243, %rd793; - add.s64 %rd4244, %rd4244, 64; - @%p194 bra $L__BB1_325; - bra.uni $L__BB1_269; - -$L__BB1_325: - mov.u16 %rs4345, 0; - ld.param.u64 %rd4026, [_ZN16cugparck_commons8HashType4hash17hb62948cbb849e285E_param_0]; - cvta.to.local.u64 %rd4025, %rd4026; - shr.u32 %r5298, %r9089, 24; - shr.u32 %r5299, %r9089, 8; - and.b32 %r5300, %r5299, 65280; - or.b32 %r5301, %r5300, %r5298; - shl.b32 %r5302, %r9089, 24; - shl.b32 %r5303, %r9089, 8; - and.b32 %r5304, %r5303, 16711680; - or.b32 %r5305, %r5302, %r5304; - or.b32 %r5306, %r5305, %r5301; - shr.u32 %r5307, %r5306, 8; - shr.u32 %r5308, %r5305, 16; - shr.u32 %r5309, %r9085, 24; - shr.u32 %r5310, %r9085, 8; - and.b32 %r5311, %r5310, 65280; - or.b32 %r5312, %r5311, %r5309; - shl.b32 %r5313, %r9085, 24; - shl.b32 %r5314, %r9085, 8; - and.b32 %r5315, %r5314, 16711680; - or.b32 %r5316, %r5313, %r5315; - or.b32 %r5317, %r5316, %r5312; - shr.u32 %r5318, %r5317, 8; - shr.u32 %r5319, %r5316, 16; - shr.u32 %r5320, %r9086, 24; - shr.u32 %r5321, %r9086, 8; - and.b32 %r5322, %r5321, 65280; - or.b32 %r5323, %r5322, %r5320; - shl.b32 %r5324, %r9086, 24; - shl.b32 %r5325, %r9086, 8; - and.b32 %r5326, %r5325, 16711680; - or.b32 %r5327, %r5324, %r5326; - or.b32 %r5328, 
%r5327, %r5323; - shr.u32 %r5329, %r5328, 8; - shr.u32 %r5330, %r5327, 16; - shr.u32 %r5331, %r9087, 24; - shr.u32 %r5332, %r9087, 8; - and.b32 %r5333, %r5332, 65280; - or.b32 %r5334, %r5333, %r5331; - shl.b32 %r5335, %r9087, 24; - shl.b32 %r5336, %r9087, 8; - and.b32 %r5337, %r5336, 16711680; - or.b32 %r5338, %r5335, %r5337; - or.b32 %r5339, %r5338, %r5334; - shr.u32 %r5340, %r5339, 8; - shr.u32 %r5341, %r5338, 16; - shr.u32 %r5342, %r9088, 24; - shr.u32 %r5343, %r9088, 8; - and.b32 %r5344, %r5343, 65280; - or.b32 %r5345, %r5344, %r5342; - shl.b32 %r5346, %r9088, 24; - shl.b32 %r5347, %r9088, 8; - and.b32 %r5348, %r5347, 16711680; - or.b32 %r5349, %r5346, %r5348; - or.b32 %r5350, %r5349, %r5345; - shr.u32 %r5351, %r5350, 8; - shr.u32 %r5352, %r5349, 16; - mov.u16 %rs3421, 20; - st.local.u16 [%rd4025], %rs3421; - cvt.u16.u32 %rs3422, %r5318; - cvt.u16.u32 %rs3423, %r5309; - cvt.u16.u32 %rs3424, %r5310; - and.b16 %rs3425, %rs3424, -256; - or.b16 %rs3426, %rs3425, %rs3423; - st.local.v2.u8 [%rd4025+2], {%rs3426, %rs3422}; - cvt.u16.u32 %rs3427, %r5319; - cvt.u16.u32 %rs3428, %r9085; - and.b16 %rs3429, %rs3428, 255; - st.local.v2.u8 [%rd4025+4], {%rs3427, %rs3429}; - cvt.u16.u32 %rs3430, %r5329; - cvt.u16.u32 %rs3431, %r5320; - cvt.u16.u32 %rs3432, %r5321; - and.b16 %rs3433, %rs3432, -256; - or.b16 %rs3434, %rs3433, %rs3431; - st.local.v2.u8 [%rd4025+6], {%rs3434, %rs3430}; - cvt.u16.u32 %rs3435, %r5330; - cvt.u16.u32 %rs3436, %r9086; - and.b16 %rs3437, %rs3436, 255; - st.local.v2.u8 [%rd4025+8], {%rs3435, %rs3437}; - cvt.u16.u32 %rs3438, %r5340; - cvt.u16.u32 %rs3439, %r5331; - cvt.u16.u32 %rs3440, %r5332; - and.b16 %rs3441, %rs3440, -256; - or.b16 %rs3442, %rs3441, %rs3439; - st.local.v2.u8 [%rd4025+10], {%rs3442, %rs3438}; - cvt.u16.u32 %rs3443, %r5341; - cvt.u16.u32 %rs3444, %r9087; - and.b16 %rs3445, %rs3444, 255; - st.local.v2.u8 [%rd4025+12], {%rs3443, %rs3445}; - cvt.u16.u32 %rs3446, %r5351; - cvt.u16.u32 %rs3447, %r5342; - cvt.u16.u32 %rs3448, %r5343; - 
and.b16 %rs3449, %rs3448, -256; - or.b16 %rs3450, %rs3449, %rs3447; - st.local.v2.u8 [%rd4025+14], {%rs3450, %rs3446}; - cvt.u16.u32 %rs3451, %r5352; - cvt.u16.u32 %rs3452, %r9088; - and.b16 %rs3453, %rs3452, 255; - st.local.v2.u8 [%rd4025+16], {%rs3451, %rs3453}; - cvt.u16.u32 %rs3454, %r5307; - cvt.u16.u32 %rs3455, %r5298; - cvt.u16.u32 %rs3456, %r5299; - and.b16 %rs3457, %rs3456, -256; - or.b16 %rs3458, %rs3457, %rs3455; - st.local.v2.u8 [%rd4025+18], {%rs3458, %rs3454}; - cvt.u16.u32 %rs3460, %r5308; - cvt.u16.u32 %rs3461, %r9089; - and.b16 %rs3462, %rs3461, 255; - st.local.v2.u8 [%rd4025+20], {%rs3460, %rs3462}; - st.local.v2.u8 [%rd4025+22], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+24], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+26], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+28], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+30], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+32], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+34], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+36], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+38], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+40], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+42], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+44], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+46], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+48], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+50], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+52], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+54], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+56], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+58], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+60], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+62], {%rs4345, %rs4345}; - st.local.v2.u8 [%rd4025+64], {%rs4345, %rs4345}; - bra.uni $L__BB1_549; - -$L__BB1_19: - setp.eq.s16 %p7, %rs1380, 6; - @%p7 bra $L__BB1_208; - - setp.eq.s16 %p8, %rs1380, 7; - @%p8 bra $L__BB1_21; - -$L__BB1_470: - setp.gt.u16 %p343, %rs1, 10; - @%p343 bra $L__BB1_550; - - add.u64 %rd3892, %SP, 504; 
- add.u64 %rd4274, %SPL, 504; - mov.u64 %rd4273, 0; - mov.u16 %rs4068, 0; - st.local.v4.u8 [%rd4274], {%rs4068, %rs4068, %rs4068, %rs4068}; - add.s64 %rd929, %rd3892, 4; - cvta.to.local.u64 %rd3894, %rd929; - st.local.v4.u8 [%rd3894], {%rs4068, %rs4068, %rs4068, %rs4068}; - add.s64 %rd3895, %rd3892, 8; - cvta.to.local.u64 %rd3896, %rd3895; - st.local.v4.u8 [%rd3896], {%rs4068, %rs4068, %rs4068, %rs4068}; - add.s64 %rd3897, %rd3892, 12; - cvta.to.local.u64 %rd3898, %rd3897; - st.local.v4.u8 [%rd3898], {%rs4068, %rs4068, %rs4068, %rs4068}; - add.s64 %rd3899, %rd3892, 16; - cvta.to.local.u64 %rd3900, %rd3899; - st.local.v4.u8 [%rd3900], {%rs4068, %rs4068, %rs4068, %rs4068}; - setp.eq.s16 %p344, %rs1, 0; - mov.u16 %rs4356, %rs4068; - @%p344 bra $L__BB1_483; - - shr.u16 %rs1200, %rs1382, 8; - mov.b32 {%rs1201, %rs1203}, %r304; - shr.u16 %rs1204, %rs1203, 8; - shr.u16 %rs1202, %rs1201, 8; - mov.b32 {%rs1205, %rs1207}, %r302; - shr.u16 %rs1208, %rs1207, 8; - shr.u16 %rs1206, %rs1205, 8; - mov.u64 %rd4273, 2; - mov.u16 %rs4069, 0; - st.local.v2.u8 [%rd4274], {%rs1382, %rs4069}; - and.b16 %rs4356, %rs1382, 255; - setp.eq.s16 %p345, %rs1, 1; - @%p345 bra $L__BB1_483; - - or.b64 %rd3906, %rd3892, 2; - cvta.to.local.u64 %rd3907, %rd3906; - st.local.v2.u8 [%rd3907], {%rs1200, %rs4069}; - setp.eq.s16 %p346, %rs1, 2; - mov.u64 %rd4273, 4; - @%p346 bra $L__BB1_483; - - st.local.v2.u8 [%rd3894], {%rs1201, %rs4069}; - setp.eq.s16 %p347, %rs1, 3; - mov.u64 %rd4273, 6; - @%p347 bra $L__BB1_483; - - add.s64 %rd3912, %rd3892, 6; - cvta.to.local.u64 %rd3913, %rd3912; - st.local.v2.u8 [%rd3913], {%rs1202, %rs4069}; - setp.eq.s16 %p348, %rs1, 4; - mov.u64 %rd4273, 8; - @%p348 bra $L__BB1_483; - - add.s64 %rd3915, %rd929, 4; - cvta.to.local.u64 %rd3916, %rd3915; - st.local.v2.u8 [%rd3916], {%rs1203, %rs4069}; - setp.eq.s16 %p349, %rs1, 5; - mov.u64 %rd4273, 10; - @%p349 bra $L__BB1_483; - - add.s64 %rd3919, %rd3892, 10; - cvta.to.local.u64 %rd3920, %rd3919; - st.local.v2.u8 [%rd3920], 
{%rs1204, %rs4069}; - setp.eq.s16 %p350, %rs1, 6; - mov.u64 %rd4273, 12; - @%p350 bra $L__BB1_483; - - add.s64 %rd3922, %rd929, 8; - cvta.to.local.u64 %rd3923, %rd3922; - st.local.v2.u8 [%rd3923], {%rs1205, %rs4069}; - setp.eq.s16 %p351, %rs1, 7; - mov.u64 %rd4273, 14; - @%p351 bra $L__BB1_483; - - add.s64 %rd3926, %rd3892, 14; - cvta.to.local.u64 %rd3927, %rd3926; - st.local.v2.u8 [%rd3927], {%rs1206, %rs4069}; - setp.eq.s16 %p352, %rs1, 8; - mov.u64 %rd4273, 16; - @%p352 bra $L__BB1_483; - - add.s64 %rd3929, %rd929, 12; - cvta.to.local.u64 %rd3930, %rd3929; - st.local.v2.u8 [%rd3930], {%rs1207, %rs4069}; - setp.eq.s16 %p353, %rs1, 9; - mov.u64 %rd4273, 18; - @%p353 bra $L__BB1_483; - - add.s64 %rd3933, %rd3892, 18; - cvta.to.local.u64 %rd3934, %rd3933; - st.local.v2.u8 [%rd3934], {%rs1208, %rs4069}; - setp.eq.s16 %p354, %rs1, 10; - mov.u64 %rd4273, 20; - @%p354 bra $L__BB1_483; - bra.uni $L__BB1_482; - -$L__BB1_483: - add.u64 %rd3935, %SP, 352; - add.u64 %rd931, %SPL, 352; - st.local.v4.u16 [%rd931], {%rs4068, %rs4068, %rs4068, %rs4068}; - add.s64 %rd3936, %rd3935, 8; - cvta.to.local.u64 %rd932, %rd3936; - st.local.v4.u16 [%rd932], {%rs4068, %rs4068, %rs4068, %rs4068}; - add.s64 %rd3937, %rd3935, 16; - cvta.to.local.u64 %rd933, %rd3937; - st.local.v4.u16 [%rd933], {%rs4068, %rs4068, %rs4068, %rs4068}; - add.s64 %rd3938, %rd3935, 24; - cvta.to.local.u64 %rd934, %rd3938; - st.local.v4.u16 [%rd934], {%rs4068, %rs4068, %rs4068, %rs4068}; - add.s64 %rd3939, %rd3935, 32; - cvta.to.local.u64 %rd935, %rd3939; - st.local.v4.u16 [%rd935], {%rs4068, %rs4068, %rs4068, %rs4068}; - add.s64 %rd3940, %rd3935, 40; - cvta.to.local.u64 %rd936, %rd3940; - st.local.v4.u16 [%rd936], {%rs4068, %rs4068, %rs4068, %rs4068}; - add.s64 %rd3941, %rd3935, 48; - cvta.to.local.u64 %rd937, %rd3941; - st.local.v4.u16 [%rd937], {%rs4068, %rs4068, %rs4068, %rs4068}; - add.s64 %rd3942, %rd3935, 56; - cvta.to.local.u64 %rd938, %rd3942; - st.local.v4.u16 [%rd938], {%rs4068, %rs4068, %rs4068, %rs4068}; 
- add.s64 %rd939, %rd3935, 64; - cvta.to.local.u64 %rd940, %rd939; - st.local.u8 [%rd940], %rs4068; - setp.eq.s64 %p355, %rd4273, 0; - @%p355 bra $L__BB1_487; - - shr.u64 %rd943, %rd4273, 1; - mov.u64 %rd4276, 1; - mov.u64 %rd4275, %rd931; - bra.uni $L__BB1_485; - -$L__BB1_486: - add.s64 %rd947, %rd4274, 2; - ld.local.u16 %rs4356, [%rd4274+2]; - add.s64 %rd4276, %rd4276, 1; - add.s64 %rd4275, %rd4275, 2; - mov.u64 %rd4274, %rd947; - -$L__BB1_485: - st.local.u16 [%rd4275], %rs4356; - setp.ge.u64 %p356, %rd4276, %rd943; - @%p356 bra $L__BB1_487; - bra.uni $L__BB1_486; - -$L__BB1_487: - mov.u64 %rd3946, 0; - st.local.u8 [%rd940], %rd4273; - ld.local.v4.u16 {%rs4080, %rs4081, %rs4082, %rs4083}, [%rd931]; - ld.local.v4.u16 {%rs4088, %rs4089, %rs4090, %rs4091}, [%rd932]; - ld.local.v4.u16 {%rs4096, %rs4097, %rs4098, %rs4099}, [%rd933]; - ld.local.v4.u16 {%rs4104, %rs4105, %rs4106, %rs4107}, [%rd934]; - ld.local.v4.u16 {%rs4112, %rs4113, %rs4114, %rs4115}, [%rd935]; - ld.local.v4.u16 {%rs4120, %rs4121, %rs4122, %rs4123}, [%rd936]; - ld.local.v4.u16 {%rs4128, %rs4129, %rs4130, %rs4131}, [%rd937]; - ld.local.v4.u16 {%rs4136, %rs4137, %rs4138, %rs4139}, [%rd938]; - shr.u16 %rs4142, %rs4137, 8; - ld.local.v4.u16 {%rs4143, %rs4144, %rs4145, %rs4146}, [%rd940]; - and.b16 %rs4147, %rs4143, 255; - shr.u16 %rs4149, %rs4144, 8; - shr.u16 %rs4152, %rs4146, 8; - st.local.u64 [%rd1], %rd3946; - mov.u32 %r9155, -271733879; - mov.u32 %r8090, 1732584193; - st.local.v2.u32 [%rd1+8], {%r8090, %r9155}; - mov.u32 %r9152, 271733878; - mov.u32 %r9154, -1732584194; - st.local.v2.u32 [%rd1+16], {%r9154, %r9152}; - st.local.v4.u16 [%rd1+24], {%rs4080, %rs4081, %rs4082, %rs4083}; - st.local.v4.u16 [%rd1+32], {%rs4088, %rs4089, %rs4090, %rs4091}; - st.local.v4.u16 [%rd1+40], {%rs4096, %rs4097, %rs4098, %rs4099}; - st.local.v4.u16 [%rd1+48], {%rs4104, %rs4105, %rs4106, %rs4107}; - st.local.v4.u16 [%rd1+56], {%rs4112, %rs4113, %rs4114, %rs4115}; - st.local.v4.u16 [%rd1+64], {%rs4120, %rs4121, 
%rs4122, %rs4123}; - st.local.v4.u16 [%rd1+72], {%rs4128, %rs4129, %rs4130, %rs4131}; - st.local.u16 [%rd1+80], %rs4136; - st.local.u8 [%rd1+82], %rs4137; - st.local.u8 [%rd1+83], %rs4142; - st.local.v2.u16 [%rd1+84], {%rs4138, %rs4139}; - st.local.u16 [%rd1+88], %rs4143; - st.local.u8 [%rd1+90], %rs4144; - st.local.u8 [%rd1+91], %rs4149; - st.local.u16 [%rd1+92], %rs4145; - st.local.u8 [%rd1+94], %rs4146; - st.local.u8 [%rd1+95], %rs4152; - cvt.u64.u16 %rd3948, %rs4143; - and.b64 %rd951, %rd3948, 255; - cvt.u32.u16 %r8093, %rs4143; - and.b32 %r8094, %r8093, 255; - mul.wide.u32 %rd952, %r8094, 8; - setp.lt.u16 %p357, %rs4147, 64; - @%p357 bra $L__BB1_489; - bra.uni $L__BB1_488; - -$L__BB1_489: - add.s64 %rd3949, %rd1, %rd951; - mov.u16 %rs4155, 128; - st.local.u8 [%rd3949+24], %rs4155; - add.s64 %rd953, %rd951, 1; - setp.eq.s64 %p358, %rd953, 64; - @%p358 bra $L__BB1_496; - - add.s64 %rd3950, %rd1, %rd953; - add.s64 %rd4281, %rd3950, 24; - mov.u16 %rs4156, 3; - sub.s16 %rs4157, %rs4156, %rs4143; - and.b16 %rs1214, %rs4157, 3; - setp.eq.s16 %p359, %rs1214, 0; - @%p359 bra $L__BB1_493; - - cvt.u64.u16 %rd3951, %rs1214; - neg.s64 %rd4277, %rd3951; - mov.u16 %rs4158, 0; - mov.u64 %rd4278, %rd4281; - -$L__BB1_492: - .pragma "nounroll"; - add.s64 %rd4281, %rd4278, 1; - st.local.u8 [%rd4278], %rs4158; - add.s64 %rd4277, %rd4277, 1; - setp.ne.s64 %p360, %rd4277, 0; - mov.u64 %rd4278, %rd4281; - @%p360 bra $L__BB1_492; - -$L__BB1_493: - mov.u64 %rd3952, 62; - sub.s64 %rd3953, %rd3952, %rd951; - setp.lt.u64 %p361, %rd3953, 3; - @%p361 bra $L__BB1_496; - - sub.s64 %rd3954, %rd1, %rd4281; - add.s64 %rd4280, %rd3954, 88; - mov.u16 %rs4159, 0; - -$L__BB1_495: - st.local.u8 [%rd4281], %rs4159; - st.local.u8 [%rd4281+1], %rs4159; - st.local.u8 [%rd4281+2], %rs4159; - st.local.u8 [%rd4281+3], %rs4159; - add.s64 %rd4280, %rd4280, -4; - setp.ne.s64 %p362, %rd4280, 0; - add.s64 %rd4281, %rd4281, 4; - @%p362 bra $L__BB1_495; - -$L__BB1_496: - or.b64 %rd3955, %rd951, 7; - setp.eq.s64 
%p363, %rd3955, 63; - @%p363 bra $L__BB1_518; - bra.uni $L__BB1_497; - -$L__BB1_518: - ld.local.u32 %rd3985, [%rd1+24]; - shl.b64 %rd3986, %rd3985, 8; - mov.b64 {%r8440, %r8441}, %rd3986; - mov.b32 {%rs1294, %rs4234}, %r8441; - mov.b32 {%rs1290, %rs1292}, %r8440; - shr.u16 %rs1293, %rs1292, 8; - shr.u16 %rs1291, %rs1290, 8; - mov.pred %p381, 0; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd3987, [%rd1+28]; - shl.b64 %rd3988, %rd3987, 8; - mov.b64 {%r8442, %r8443}, %rd3988; - mov.b32 {%rs1299, %rs4235}, %r8443; - mov.b32 {%rs1295, %rs1297}, %r8442; - shr.u16 %rs1298, %rs1297, 8; - shr.u16 %rs1296, %rs1295, 8; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd3989, [%rd1+32]; - shl.b64 %rd3990, %rd3989, 8; - mov.b64 {%r8444, %r8445}, %rd3990; - mov.b32 {%rs1304, %rs4236}, %r8445; - mov.b32 {%rs1300, %rs1302}, %r8444; - shr.u16 %rs1303, %rs1302, 8; - shr.u16 %rs1301, %rs1300, 8; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd3991, [%rd1+36]; - shl.b64 %rd3992, %rd3991, 8; - mov.b64 {%r8446, %r8447}, %rd3992; - mov.b32 {%rs1309, %rs4237}, %r8447; - mov.b32 {%rs1305, %rs1307}, %r8446; - shr.u16 %rs1308, %rs1307, 8; - shr.u16 %rs1306, %rs1305, 8; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd3993, [%rd1+40]; - shl.b64 %rd3994, %rd3993, 8; - mov.b64 {%r8448, %r8449}, %rd3994; - mov.b32 {%rs1314, %rs4238}, %r8449; - mov.b32 {%rs1310, %rs1312}, %r8448; - shr.u16 %rs1313, %rs1312, 8; - shr.u16 %rs1311, %rs1310, 8; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd3995, [%rd1+44]; - shl.b64 %rd3996, %rd3995, 8; - mov.b64 {%r8450, %r8451}, %rd3996; - mov.b32 {%rs1319, %rs4239}, %r8451; - mov.b32 {%rs1315, %rs1317}, %r8450; - shr.u16 %rs1318, %rs1317, 8; - shr.u16 %rs1316, %rs1315, 8; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd3997, [%rd1+48]; - shl.b64 %rd3998, %rd3997, 8; - mov.b64 {%r8452, %r8453}, %rd3998; - mov.b32 {%rs1324, %rs4240}, %r8453; - mov.b32 {%rs1320, %rs1322}, %r8452; - shr.u16 %rs1323, %rs1322, 8; - shr.u16 %rs1321, %rs1320, 8; - @%p381 bra $L__BB1_534; - - 
ld.local.u32 %rd3999, [%rd1+52]; - shl.b64 %rd4000, %rd3999, 8; - mov.b64 {%r8454, %r8455}, %rd4000; - mov.b32 {%rs1329, %rs4241}, %r8455; - mov.b32 {%rs1325, %rs1327}, %r8454; - shr.u16 %rs1328, %rs1327, 8; - shr.u16 %rs1326, %rs1325, 8; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd4001, [%rd1+56]; - shl.b64 %rd4002, %rd4001, 8; - mov.b64 {%r8456, %r8457}, %rd4002; - mov.b32 {%rs1334, %rs4242}, %r8457; - mov.b32 {%rs1330, %rs1332}, %r8456; - shr.u16 %rs1333, %rs1332, 8; - shr.u16 %rs1331, %rs1330, 8; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd4003, [%rd1+60]; - shl.b64 %rd4004, %rd4003, 8; - mov.b64 {%r8458, %r8459}, %rd4004; - mov.b32 {%rs1339, %rs4243}, %r8459; - mov.b32 {%rs1335, %rs1337}, %r8458; - shr.u16 %rs1338, %rs1337, 8; - shr.u16 %rs1336, %rs1335, 8; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd4005, [%rd1+64]; - shl.b64 %rd4006, %rd4005, 8; - mov.b64 {%r8460, %r8461}, %rd4006; - mov.b32 {%rs1344, %rs4244}, %r8461; - mov.b32 {%rs1340, %rs1342}, %r8460; - shr.u16 %rs1343, %rs1342, 8; - shr.u16 %rs1341, %rs1340, 8; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd4007, [%rd1+68]; - shl.b64 %rd4008, %rd4007, 8; - mov.b64 {%r8462, %r8463}, %rd4008; - mov.b32 {%rs1349, %rs4245}, %r8463; - mov.b32 {%rs1345, %rs1347}, %r8462; - shr.u16 %rs1348, %rs1347, 8; - shr.u16 %rs1346, %rs1345, 8; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd4009, [%rd1+72]; - shl.b64 %rd4010, %rd4009, 8; - mov.b64 {%r8464, %r8465}, %rd4010; - mov.b32 {%rs1354, %rs4246}, %r8465; - mov.b32 {%rs1350, %rs1352}, %r8464; - shr.u16 %rs1353, %rs1352, 8; - shr.u16 %rs1351, %rs1350, 8; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd4011, [%rd1+76]; - shl.b64 %rd4012, %rd4011, 8; - mov.b64 {%r8466, %r8467}, %rd4012; - mov.b32 {%rs1359, %rs4247}, %r8467; - mov.b32 {%rs1355, %rs1357}, %r8466; - shr.u16 %rs1358, %rs1357, 8; - shr.u16 %rs1356, %rs1355, 8; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd4013, [%rd1+80]; - shl.b64 %rd4014, %rd4013, 8; - mov.b64 {%r8468, %r8469}, %rd4014; - mov.b32 
{%rs1364, %rs4248}, %r8469; - mov.b32 {%rs1360, %rs1362}, %r8468; - shr.u16 %rs1363, %rs1362, 8; - shr.u16 %rs1361, %rs1360, 8; - @%p381 bra $L__BB1_534; - - ld.local.u32 %rd4015, [%rd1+84]; - shl.b64 %rd4016, %rd4015, 8; - mov.b64 {%r8470, %r8471}, %rd4016; - mov.b32 {%rs1369, %rs4249}, %r8471; - mov.b32 {%rs1365, %rs1367}, %r8470; - shr.u16 %rs1368, %rs1367, 8; - shr.u16 %rs1366, %rs1365, 8; - mov.pred %p396, -1; - @%p396 bra $L__BB1_535; - bra.uni $L__BB1_534; - -$L__BB1_535: - shl.b16 %rs4250, %rs1367, 8; - or.b16 %rs4251, %rs1366, %rs4250; - shl.b16 %rs4252, %rs1369, 8; - or.b16 %rs4253, %rs1368, %rs4252; - mov.b32 %r223, {%rs4251, %rs4253}; - shl.b16 %rs4254, %rs1362, 8; - or.b16 %rs4255, %rs1361, %rs4254; - shl.b16 %rs4256, %rs1364, 8; - or.b16 %rs4257, %rs1363, %rs4256; - mov.b32 %r224, {%rs4255, %rs4257}; - shl.b16 %rs4258, %rs1357, 8; - or.b16 %rs4259, %rs1356, %rs4258; - shl.b16 %rs4260, %rs1359, 8; - or.b16 %rs4261, %rs1358, %rs4260; - mov.b32 %r225, {%rs4259, %rs4261}; - shl.b16 %rs4262, %rs1352, 8; - or.b16 %rs4263, %rs1351, %rs4262; - shl.b16 %rs4264, %rs1354, 8; - or.b16 %rs4265, %rs1353, %rs4264; - mov.b32 %r226, {%rs4263, %rs4265}; - shl.b16 %rs4266, %rs1347, 8; - or.b16 %rs4267, %rs1346, %rs4266; - shl.b16 %rs4268, %rs1349, 8; - or.b16 %rs4269, %rs1348, %rs4268; - mov.b32 %r227, {%rs4267, %rs4269}; - shl.b16 %rs4270, %rs1342, 8; - or.b16 %rs4271, %rs1341, %rs4270; - shl.b16 %rs4272, %rs1344, 8; - or.b16 %rs4273, %rs1343, %rs4272; - mov.b32 %r228, {%rs4271, %rs4273}; - shl.b16 %rs4274, %rs1337, 8; - or.b16 %rs4275, %rs1336, %rs4274; - shl.b16 %rs4276, %rs1339, 8; - or.b16 %rs4277, %rs1338, %rs4276; - mov.b32 %r229, {%rs4275, %rs4277}; - shl.b16 %rs4278, %rs1332, 8; - or.b16 %rs4279, %rs1331, %rs4278; - shl.b16 %rs4280, %rs1334, 8; - or.b16 %rs4281, %rs1333, %rs4280; - mov.b32 %r230, {%rs4279, %rs4281}; - shl.b16 %rs4282, %rs1327, 8; - or.b16 %rs4283, %rs1326, %rs4282; - shl.b16 %rs4284, %rs1329, 8; - or.b16 %rs4285, %rs1328, %rs4284; - mov.b32 
%r231, {%rs4283, %rs4285}; - shl.b16 %rs4286, %rs1322, 8; - or.b16 %rs4287, %rs1321, %rs4286; - shl.b16 %rs4288, %rs1324, 8; - or.b16 %rs4289, %rs1323, %rs4288; - mov.b32 %r232, {%rs4287, %rs4289}; - shl.b16 %rs4290, %rs1317, 8; - or.b16 %rs4291, %rs1316, %rs4290; - shl.b16 %rs4292, %rs1319, 8; - or.b16 %rs4293, %rs1318, %rs4292; - mov.b32 %r233, {%rs4291, %rs4293}; - shl.b16 %rs4294, %rs1312, 8; - or.b16 %rs4295, %rs1311, %rs4294; - shl.b16 %rs4296, %rs1314, 8; - or.b16 %rs4297, %rs1313, %rs4296; - mov.b32 %r234, {%rs4295, %rs4297}; - shl.b16 %rs4298, %rs1307, 8; - or.b16 %rs4299, %rs1306, %rs4298; - shl.b16 %rs4300, %rs1309, 8; - or.b16 %rs4301, %rs1308, %rs4300; - mov.b32 %r235, {%rs4299, %rs4301}; - shl.b16 %rs4302, %rs1302, 8; - or.b16 %rs4303, %rs1301, %rs4302; - shl.b16 %rs4304, %rs1304, 8; - or.b16 %rs4305, %rs1303, %rs4304; - mov.b32 %r236, {%rs4303, %rs4305}; - shl.b16 %rs4306, %rs1297, 8; - or.b16 %rs4307, %rs1296, %rs4306; - shl.b16 %rs4308, %rs1299, 8; - or.b16 %rs4309, %rs1298, %rs4308; - mov.b32 %r237, {%rs4307, %rs4309}; - shl.b16 %rs4310, %rs1292, 8; - or.b16 %rs4311, %rs1291, %rs4310; - shl.b16 %rs4312, %rs1294, 8; - or.b16 %rs4313, %rs1293, %rs4312; - mov.b32 %r238, {%rs4311, %rs4313}; - mov.u32 %r9165, -1043882854; - mov.u32 %r9164, -271733879; - mov.u32 %r9163, -1732584194; - mov.u32 %r9161, 271733878; - mov.u32 %r9162, %r9161; - @%p381 bra $L__BB1_537; - - add.s32 %r8477, %r238, -1; - shf.l.wrap.b32 %r8478, %r8477, %r8477, 3; - not.b32 %r8479, %r8478; - and.b32 %r8480, %r8478, -271733879; - and.b32 %r8481, %r8479, -1732584194; - or.b32 %r8482, %r8481, %r8480; - add.s32 %r8483, %r8482, %r237; - add.s32 %r8484, %r8483, 271733878; - shf.l.wrap.b32 %r8485, %r8484, %r8484, 7; - not.b32 %r8486, %r8485; - and.b32 %r8487, %r8485, %r8478; - and.b32 %r8488, %r8486, -271733879; - or.b32 %r8489, %r8488, %r8487; - add.s32 %r8490, %r8489, %r236; - add.s32 %r8491, %r8490, -1732584194; - shf.l.wrap.b32 %r8492, %r8491, %r8491, 11; - and.b32 %r8493, %r8492, 
%r8485; - not.b32 %r8494, %r8492; - and.b32 %r8495, %r8478, %r8494; - or.b32 %r8496, %r8495, %r8493; - add.s32 %r8497, %r8496, %r235; - add.s32 %r8498, %r8497, -271733879; - shf.l.wrap.b32 %r8499, %r8498, %r8498, 19; - and.b32 %r8500, %r8492, %r8499; - not.b32 %r8501, %r8499; - and.b32 %r8502, %r8485, %r8501; - or.b32 %r8503, %r8502, %r8500; - add.s32 %r8504, %r8503, %r8478; - add.s32 %r8505, %r8504, %r234; - shf.l.wrap.b32 %r8506, %r8505, %r8505, 3; - and.b32 %r8507, %r8506, %r8499; - not.b32 %r8508, %r8506; - and.b32 %r8509, %r8492, %r8508; - or.b32 %r8510, %r8509, %r8507; - add.s32 %r8511, %r8510, %r8485; - add.s32 %r8512, %r8511, %r233; - shf.l.wrap.b32 %r8513, %r8512, %r8512, 7; - and.b32 %r8514, %r8513, %r8506; - not.b32 %r8515, %r8513; - and.b32 %r8516, %r8499, %r8515; - or.b32 %r8517, %r8516, %r8514; - add.s32 %r8518, %r8517, %r8492; - add.s32 %r8519, %r8518, %r232; - shf.l.wrap.b32 %r8520, %r8519, %r8519, 11; - and.b32 %r8521, %r8520, %r8513; - not.b32 %r8522, %r8520; - and.b32 %r8523, %r8506, %r8522; - or.b32 %r8524, %r8523, %r8521; - add.s32 %r8525, %r8524, %r8499; - add.s32 %r8526, %r8525, %r231; - shf.l.wrap.b32 %r8527, %r8526, %r8526, 19; - and.b32 %r8528, %r8520, %r8527; - not.b32 %r8529, %r8527; - and.b32 %r8530, %r8513, %r8529; - or.b32 %r8531, %r8530, %r8528; - add.s32 %r8532, %r8531, %r8506; - add.s32 %r8533, %r8532, %r230; - shf.l.wrap.b32 %r8534, %r8533, %r8533, 3; - and.b32 %r8535, %r8534, %r8527; - not.b32 %r8536, %r8534; - and.b32 %r8537, %r8520, %r8536; - or.b32 %r8538, %r8537, %r8535; - add.s32 %r8539, %r8538, %r8513; - add.s32 %r8540, %r8539, %r229; - shf.l.wrap.b32 %r8541, %r8540, %r8540, 7; - and.b32 %r8542, %r8541, %r8534; - not.b32 %r8543, %r8541; - and.b32 %r8544, %r8527, %r8543; - or.b32 %r8545, %r8544, %r8542; - add.s32 %r8546, %r8545, %r8520; - add.s32 %r8547, %r8546, %r228; - shf.l.wrap.b32 %r8548, %r8547, %r8547, 11; - and.b32 %r8549, %r8548, %r8541; - not.b32 %r8550, %r8548; - and.b32 %r8551, %r8534, %r8550; - or.b32 %r8552, 
%r8551, %r8549; - add.s32 %r8553, %r8552, %r8527; - add.s32 %r8554, %r8553, %r227; - shf.l.wrap.b32 %r8555, %r8554, %r8554, 19; - and.b32 %r8556, %r8548, %r8555; - not.b32 %r8557, %r8555; - and.b32 %r8558, %r8541, %r8557; - or.b32 %r8559, %r8558, %r8556; - add.s32 %r8560, %r8559, %r8534; - add.s32 %r8561, %r8560, %r226; - shf.l.wrap.b32 %r8562, %r8561, %r8561, 3; - and.b32 %r8563, %r8562, %r8555; - not.b32 %r8564, %r8562; - and.b32 %r8565, %r8548, %r8564; - or.b32 %r8566, %r8565, %r8563; - add.s32 %r8567, %r8566, %r8541; - add.s32 %r8568, %r8567, %r225; - shf.l.wrap.b32 %r9162, %r8568, %r8568, 7; - and.b32 %r8569, %r9162, %r8562; - not.b32 %r8570, %r9162; - and.b32 %r8571, %r8555, %r8570; - or.b32 %r8572, %r8571, %r8569; - add.s32 %r8573, %r8572, %r8548; - add.s32 %r8574, %r8573, %r224; - shf.l.wrap.b32 %r9163, %r8574, %r8574, 11; - and.b32 %r9161, %r9163, %r9162; - not.b32 %r8575, %r9163; - and.b32 %r8576, %r8562, %r8575; - or.b32 %r8577, %r8576, %r9161; - add.s32 %r8578, %r8577, %r8555; - add.s32 %r8579, %r8578, %r223; - shf.l.wrap.b32 %r9164, %r8579, %r8579, 19; - add.s32 %r9165, %r8562, 1518500249; - -$L__BB1_537: - or.b32 %r8580, %r9163, %r9162; - and.b32 %r8581, %r8580, %r9164; - or.b32 %r8582, %r8581, %r9161; - add.s32 %r8583, %r9165, %r8582; - add.s32 %r8584, %r8583, %r238; - shf.l.wrap.b32 %r8585, %r8584, %r8584, 3; - or.b32 %r8586, %r9164, %r9163; - and.b32 %r8587, %r8585, %r8586; - and.b32 %r8588, %r9164, %r9163; - or.b32 %r8589, %r8587, %r8588; - add.s32 %r8590, %r9162, %r234; - add.s32 %r8591, %r8590, %r8589; - add.s32 %r8592, %r8591, 1518500249; - shf.l.wrap.b32 %r8593, %r8592, %r8592, 5; - or.b32 %r8594, %r8585, %r9164; - and.b32 %r8595, %r8593, %r8594; - and.b32 %r8596, %r8585, %r9164; - or.b32 %r8597, %r8595, %r8596; - add.s32 %r8598, %r9163, %r230; - add.s32 %r8599, %r8598, %r8597; - add.s32 %r8600, %r8599, 1518500249; - shf.l.wrap.b32 %r8601, %r8600, %r8600, 9; - or.b32 %r8602, %r8593, %r8585; - and.b32 %r8603, %r8601, %r8602; - and.b32 %r8604, 
%r8593, %r8585; - or.b32 %r8605, %r8603, %r8604; - add.s32 %r8606, %r9164, %r226; - add.s32 %r8607, %r8606, %r8605; - add.s32 %r8608, %r8607, 1518500249; - shf.l.wrap.b32 %r8609, %r8608, %r8608, 13; - or.b32 %r8610, %r8601, %r8593; - and.b32 %r8611, %r8609, %r8610; - and.b32 %r8612, %r8601, %r8593; - or.b32 %r8613, %r8611, %r8612; - add.s32 %r8614, %r8585, %r237; - add.s32 %r8615, %r8614, %r8613; - add.s32 %r8616, %r8615, 1518500249; - shf.l.wrap.b32 %r8617, %r8616, %r8616, 3; - or.b32 %r8618, %r8609, %r8601; - and.b32 %r8619, %r8617, %r8618; - and.b32 %r8620, %r8609, %r8601; - or.b32 %r8621, %r8619, %r8620; - add.s32 %r8622, %r233, %r8593; - add.s32 %r8623, %r8622, %r8621; - add.s32 %r8624, %r8623, 1518500249; - shf.l.wrap.b32 %r8625, %r8624, %r8624, 5; - or.b32 %r8626, %r8617, %r8609; - and.b32 %r8627, %r8625, %r8626; - and.b32 %r8628, %r8617, %r8609; - or.b32 %r8629, %r8627, %r8628; - add.s32 %r8630, %r229, %r8601; - add.s32 %r8631, %r8630, %r8629; - add.s32 %r8632, %r8631, 1518500249; - shf.l.wrap.b32 %r8633, %r8632, %r8632, 9; - or.b32 %r8634, %r8625, %r8617; - and.b32 %r8635, %r8633, %r8634; - and.b32 %r8636, %r8625, %r8617; - or.b32 %r8637, %r8635, %r8636; - add.s32 %r8638, %r225, %r8609; - add.s32 %r8639, %r8638, %r8637; - add.s32 %r8640, %r8639, 1518500249; - shf.l.wrap.b32 %r8641, %r8640, %r8640, 13; - or.b32 %r8642, %r8633, %r8625; - and.b32 %r8643, %r8641, %r8642; - and.b32 %r8644, %r8633, %r8625; - or.b32 %r8645, %r8643, %r8644; - add.s32 %r8646, %r236, %r8617; - add.s32 %r8647, %r8646, %r8645; - add.s32 %r8648, %r8647, 1518500249; - shf.l.wrap.b32 %r8649, %r8648, %r8648, 3; - or.b32 %r8650, %r8641, %r8633; - and.b32 %r8651, %r8649, %r8650; - and.b32 %r8652, %r8641, %r8633; - or.b32 %r8653, %r8651, %r8652; - add.s32 %r8654, %r232, %r8625; - add.s32 %r8655, %r8654, %r8653; - add.s32 %r8656, %r8655, 1518500249; - shf.l.wrap.b32 %r8657, %r8656, %r8656, 5; - or.b32 %r8658, %r8649, %r8641; - and.b32 %r8659, %r8657, %r8658; - and.b32 %r8660, %r8649, %r8641; 
- or.b32 %r8661, %r8659, %r8660; - add.s32 %r8662, %r228, %r8633; - add.s32 %r8663, %r8662, %r8661; - add.s32 %r8664, %r8663, 1518500249; - shf.l.wrap.b32 %r8665, %r8664, %r8664, 9; - or.b32 %r8666, %r8657, %r8649; - and.b32 %r8667, %r8665, %r8666; - and.b32 %r8668, %r8657, %r8649; - or.b32 %r8669, %r8667, %r8668; - add.s32 %r8670, %r224, %r8641; - add.s32 %r8671, %r8670, %r8669; - add.s32 %r8672, %r8671, 1518500249; - shf.l.wrap.b32 %r8673, %r8672, %r8672, 13; - or.b32 %r8674, %r8665, %r8657; - and.b32 %r8675, %r8673, %r8674; - and.b32 %r8676, %r8665, %r8657; - or.b32 %r8677, %r8675, %r8676; - add.s32 %r8678, %r235, %r8649; - add.s32 %r8679, %r8678, %r8677; - add.s32 %r8680, %r8679, 1518500249; - shf.l.wrap.b32 %r9169, %r8680, %r8680, 3; - or.b32 %r8681, %r8673, %r8665; - and.b32 %r8682, %r9169, %r8681; - and.b32 %r8683, %r8673, %r8665; - or.b32 %r8684, %r8682, %r8683; - add.s32 %r8685, %r231, %r8657; - add.s32 %r8686, %r8685, %r8684; - add.s32 %r8687, %r8686, 1518500249; - shf.l.wrap.b32 %r9166, %r8687, %r8687, 5; - or.b32 %r8688, %r9169, %r8673; - and.b32 %r8689, %r9166, %r8688; - and.b32 %r8690, %r9169, %r8673; - or.b32 %r8691, %r8689, %r8690; - add.s32 %r8692, %r227, %r8665; - add.s32 %r8693, %r8692, %r8691; - add.s32 %r8694, %r8693, 1518500249; - shf.l.wrap.b32 %r9167, %r8694, %r8694, 9; - or.b32 %r8695, %r9166, %r9169; - and.b32 %r8696, %r9167, %r8695; - and.b32 %r8697, %r9166, %r9169; - or.b32 %r8698, %r8696, %r8697; - add.s32 %r8699, %r223, %r8673; - add.s32 %r8700, %r8699, %r8698; - add.s32 %r8701, %r8700, 1518500249; - shf.l.wrap.b32 %r9168, %r8701, %r8701, 13; - @%p381 bra $L__BB1_539; - - xor.b32 %r8702, %r9167, %r9168; - xor.b32 %r8703, %r8702, %r9166; - add.s32 %r8704, %r9169, %r8703; - add.s32 %r8705, %r8704, %r238; - add.s32 %r8706, %r8705, 1859775393; - shf.l.wrap.b32 %r8707, %r8706, %r8706, 3; - xor.b32 %r8708, %r8707, %r8702; - add.s32 %r8709, %r9166, %r8708; - add.s32 %r8710, %r8709, %r230; - add.s32 %r8711, %r8710, 1859775393; - shf.l.wrap.b32 
%r8712, %r8711, %r8711, 9; - xor.b32 %r8713, %r8707, %r9168; - xor.b32 %r8714, %r8713, %r8712; - add.s32 %r8715, %r9167, %r234; - add.s32 %r8716, %r8715, %r8714; - add.s32 %r8717, %r8716, 1859775393; - shf.l.wrap.b32 %r8718, %r8717, %r8717, 11; - xor.b32 %r8719, %r8712, %r8707; - xor.b32 %r8720, %r8719, %r8718; - add.s32 %r8721, %r9168, %r8720; - add.s32 %r8722, %r8721, %r226; - add.s32 %r8723, %r8722, 1859775393; - shf.l.wrap.b32 %r8724, %r8723, %r8723, 15; - xor.b32 %r8725, %r8718, %r8724; - xor.b32 %r8726, %r8725, %r8712; - add.s32 %r8727, %r8707, %r8726; - add.s32 %r8728, %r8727, %r236; - add.s32 %r8729, %r8728, 1859775393; - shf.l.wrap.b32 %r8730, %r8729, %r8729, 3; - xor.b32 %r8731, %r8730, %r8725; - add.s32 %r8732, %r8712, %r8731; - add.s32 %r8733, %r8732, %r228; - add.s32 %r8734, %r8733, 1859775393; - shf.l.wrap.b32 %r8735, %r8734, %r8734, 9; - xor.b32 %r8736, %r8730, %r8724; - xor.b32 %r8737, %r8736, %r8735; - add.s32 %r8738, %r8718, %r232; - add.s32 %r8739, %r8738, %r8737; - add.s32 %r8740, %r8739, 1859775393; - shf.l.wrap.b32 %r8741, %r8740, %r8740, 11; - xor.b32 %r8742, %r8735, %r8730; - xor.b32 %r8743, %r8742, %r8741; - add.s32 %r8744, %r8724, %r8743; - add.s32 %r8745, %r8744, %r224; - add.s32 %r8746, %r8745, 1859775393; - shf.l.wrap.b32 %r8747, %r8746, %r8746, 15; - xor.b32 %r8748, %r8741, %r8747; - xor.b32 %r8749, %r8748, %r8735; - add.s32 %r8750, %r8730, %r8749; - add.s32 %r8751, %r8750, %r237; - add.s32 %r8752, %r8751, 1859775393; - shf.l.wrap.b32 %r8753, %r8752, %r8752, 3; - xor.b32 %r8754, %r8753, %r8748; - add.s32 %r8755, %r8735, %r8754; - add.s32 %r8756, %r8755, %r229; - add.s32 %r8757, %r8756, 1859775393; - shf.l.wrap.b32 %r8758, %r8757, %r8757, 9; - xor.b32 %r8759, %r8753, %r8747; - xor.b32 %r8760, %r8759, %r8758; - add.s32 %r8761, %r8741, %r233; - add.s32 %r8762, %r8761, %r8760; - add.s32 %r8763, %r8762, 1859775393; - shf.l.wrap.b32 %r8764, %r8763, %r8763, 11; - xor.b32 %r8765, %r8758, %r8753; - xor.b32 %r8766, %r8765, %r8764; - add.s32 
%r8767, %r8747, %r8766; - add.s32 %r8768, %r8767, %r225; - add.s32 %r8769, %r8768, 1859775393; - shf.l.wrap.b32 %r8770, %r8769, %r8769, 15; - xor.b32 %r8771, %r8764, %r8770; - xor.b32 %r8772, %r8771, %r8758; - add.s32 %r8773, %r8753, %r8772; - add.s32 %r8774, %r8773, %r235; - add.s32 %r8775, %r8774, 1859775393; - shf.l.wrap.b32 %r9169, %r8775, %r8775, 3; - xor.b32 %r8776, %r9169, %r8771; - add.s32 %r8777, %r8758, %r8776; - add.s32 %r8778, %r8777, %r227; - add.s32 %r8779, %r8778, 1859775393; - shf.l.wrap.b32 %r9166, %r8779, %r8779, 9; - xor.b32 %r8780, %r9169, %r8770; - xor.b32 %r8781, %r8780, %r9166; - add.s32 %r8782, %r8764, %r231; - add.s32 %r8783, %r8782, %r8781; - add.s32 %r8784, %r8783, 1859775393; - shf.l.wrap.b32 %r9167, %r8784, %r8784, 11; - xor.b32 %r8785, %r9166, %r9169; - xor.b32 %r8786, %r8785, %r9167; - add.s32 %r8787, %r8770, %r8786; - add.s32 %r8788, %r8787, %r223; - add.s32 %r8789, %r8788, 1859775393; - shf.l.wrap.b32 %r9168, %r8789, %r8789, 15; - -$L__BB1_539: - add.s32 %r261, %r9169, 1732584193; - add.s32 %r262, %r9168, -271733879; - add.s32 %r263, %r9167, -1732584194; - add.s32 %r264, %r9166, 271733878; - mov.b64 {%r265, %r266}, %rd952; - cvt.u64.u32 %rd4017, %r265; - shl.b64 %rd4018, %rd4017, 8; - mov.b64 {%r8790, %r8791}, %rd4018; - mov.b32 {%rs1374, %rs4314}, %r8791; - mov.b32 {%rs1370, %rs1372}, %r8790; - shr.u16 %rs1373, %rs1372, 8; - shr.u16 %rs1371, %rs1370, 8; - @%p381 bra $L__BB1_541; - - cvt.u64.u32 %rd4019, %r266; - shl.b64 %rd4020, %rd4019, 8; - mov.b64 {%r8792, %r8793}, %rd4020; - mov.b32 {%rs1379, %rs4315}, %r8793; - mov.b32 {%rs1375, %rs1377}, %r8792; - shr.u16 %rs1378, %rs1377, 8; - shr.u16 %rs1376, %rs1375, 8; - @%p396 bra $L__BB1_542; - bra.uni $L__BB1_541; - -$L__BB1_542: - shl.b16 %rs4316, %rs1377, 8; - or.b16 %rs4317, %rs1376, %rs4316; - shl.b16 %rs4318, %rs1379, 8; - or.b16 %rs4319, %rs1378, %rs4318; - mov.b32 %r267, {%rs4317, %rs4319}; - shl.b16 %rs4320, %rs1372, 8; - or.b16 %rs4321, %rs1371, %rs4320; - shl.b16 %rs4322, 
%rs1374, 8; - or.b16 %rs4323, %rs1373, %rs4322; - mov.b32 %r268, {%rs4321, %rs4323}; - @%p381 bra $L__BB1_544; - bra.uni $L__BB1_543; - -$L__BB1_544: - and.b32 %r9170, %r264, %r263; - mov.u32 %r9171, %r264; - mov.u32 %r9172, %r263; - mov.u32 %r9173, %r262; - mov.u32 %r9174, %r261; - bra.uni $L__BB1_545; - -$L__BB1_497: - st.local.u64 [%rd1+80], %rd952; - ld.local.u32 %rd3956, [%rd1+24]; - shl.b64 %rd3957, %rd3956, 8; - mov.b64 {%r8095, %r8096}, %rd3957; - mov.b32 {%rs1219, %rs4160}, %r8096; - mov.b32 {%rs1215, %rs1217}, %r8095; - shr.u16 %rs1218, %rs1217, 8; - shr.u16 %rs1216, %rs1215, 8; - mov.pred %p364, 0; - @%p364 bra $L__BB1_512; - - ld.local.u32 %rd3958, [%rd1+28]; - shl.b64 %rd3959, %rd3958, 8; - mov.b64 {%r8097, %r8098}, %rd3959; - mov.b32 {%rs1224, %rs4161}, %r8098; - mov.b32 {%rs1220, %rs1222}, %r8097; - shr.u16 %rs1223, %rs1222, 8; - shr.u16 %rs1221, %rs1220, 8; - @%p364 bra $L__BB1_512; - - ld.local.u32 %rd3960, [%rd1+32]; - shl.b64 %rd3961, %rd3960, 8; - mov.b64 {%r8099, %r8100}, %rd3961; - mov.b32 {%rs1229, %rs4162}, %r8100; - mov.b32 {%rs1225, %rs1227}, %r8099; - shr.u16 %rs1228, %rs1227, 8; - shr.u16 %rs1226, %rs1225, 8; - @%p364 bra $L__BB1_512; - - ld.local.u32 %rd3962, [%rd1+36]; - shl.b64 %rd3963, %rd3962, 8; - mov.b64 {%r8101, %r8102}, %rd3963; - mov.b32 {%rs1234, %rs4163}, %r8102; - mov.b32 {%rs1230, %rs1232}, %r8101; - shr.u16 %rs1233, %rs1232, 8; - shr.u16 %rs1231, %rs1230, 8; - @%p364 bra $L__BB1_512; - - ld.local.u32 %rd3964, [%rd1+40]; - shl.b64 %rd3965, %rd3964, 8; - mov.b64 {%r8103, %r8104}, %rd3965; - mov.b32 {%rs1239, %rs4164}, %r8104; - mov.b32 {%rs1235, %rs1237}, %r8103; - shr.u16 %rs1238, %rs1237, 8; - shr.u16 %rs1236, %rs1235, 8; - @%p364 bra $L__BB1_512; - - ld.local.u32 %rd3966, [%rd1+44]; - shl.b64 %rd3967, %rd3966, 8; - mov.b64 {%r8105, %r8106}, %rd3967; - mov.b32 {%rs1244, %rs4165}, %r8106; - mov.b32 {%rs1240, %rs1242}, %r8105; - shr.u16 %rs1243, %rs1242, 8; - shr.u16 %rs1241, %rs1240, 8; - @%p364 bra $L__BB1_512; - - 
ld.local.u32 %rd3968, [%rd1+48]; - shl.b64 %rd3969, %rd3968, 8; - mov.b64 {%r8107, %r8108}, %rd3969; - mov.b32 {%rs1249, %rs4166}, %r8108; - mov.b32 {%rs1245, %rs1247}, %r8107; - shr.u16 %rs1248, %rs1247, 8; - shr.u16 %rs1246, %rs1245, 8; - @%p364 bra $L__BB1_512; - - ld.local.u32 %rd3970, [%rd1+52]; - shl.b64 %rd3971, %rd3970, 8; - mov.b64 {%r8109, %r8110}, %rd3971; - mov.b32 {%rs1254, %rs4167}, %r8110; - mov.b32 {%rs1250, %rs1252}, %r8109; - shr.u16 %rs1253, %rs1252, 8; - shr.u16 %rs1251, %rs1250, 8; - @%p364 bra $L__BB1_512; - - ld.local.u32 %rd3972, [%rd1+56]; - shl.b64 %rd3973, %rd3972, 8; - mov.b64 {%r8111, %r8112}, %rd3973; - mov.b32 {%rs1259, %rs4168}, %r8112; - mov.b32 {%rs1255, %rs1257}, %r8111; - shr.u16 %rs1258, %rs1257, 8; - shr.u16 %rs1256, %rs1255, 8; - @%p364 bra $L__BB1_512; - - ld.local.u32 %rd3974, [%rd1+60]; - shl.b64 %rd3975, %rd3974, 8; - mov.b64 {%r8113, %r8114}, %rd3975; - mov.b32 {%rs1264, %rs4169}, %r8114; - mov.b32 {%rs1260, %rs1262}, %r8113; - shr.u16 %rs1263, %rs1262, 8; - shr.u16 %rs1261, %rs1260, 8; - @%p364 bra $L__BB1_512; - - ld.local.u32 %rd3976, [%rd1+64]; - shl.b64 %rd3977, %rd3976, 8; - mov.b64 {%r8115, %r8116}, %rd3977; - mov.b32 {%rs1269, %rs4170}, %r8116; - mov.b32 {%rs1265, %rs1267}, %r8115; - shr.u16 %rs1268, %rs1267, 8; - shr.u16 %rs1266, %rs1265, 8; - @%p364 bra $L__BB1_512; - - ld.local.u32 %rd3978, [%rd1+68]; - shl.b64 %rd3979, %rd3978, 8; - mov.b64 {%r8117, %r8118}, %rd3979; - mov.b32 {%rs1274, %rs4171}, %r8118; - mov.b32 {%rs1270, %rs1272}, %r8117; - shr.u16 %rs1273, %rs1272, 8; - shr.u16 %rs1271, %rs1270, 8; - @%p364 bra $L__BB1_512; - - ld.local.u32 %rd3980, [%rd1+72]; - shl.b64 %rd3981, %rd3980, 8; - mov.b64 {%r8119, %r8120}, %rd3981; - mov.b32 {%rs1279, %rs4172}, %r8120; - mov.b32 {%rs1275, %rs1277}, %r8119; - shr.u16 %rs1278, %rs1277, 8; - shr.u16 %rs1276, %rs1275, 8; - @%p364 bra $L__BB1_512; - - ld.local.u32 %rd3982, [%rd1+76]; - shl.b64 %rd3983, %rd3982, 8; - mov.b64 {%r8121, %r8122}, %rd3983; - mov.b32 
{%rs1284, %rs4173}, %r8122; - mov.b32 {%rs1280, %rs1282}, %r8121; - shr.u16 %rs1283, %rs1282, 8; - shr.u16 %rs1281, %rs1280, 8; - @%p364 bra $L__BB1_512; - - shl.b64 %rd3984, %rd951, 11; - mov.b64 {%r8123, %r8124}, %rd3984; - mov.b32 {%rs1289, %rs4174}, %r8124; - mov.b32 {%rs1285, %rs1287}, %r8123; - shr.u16 %rs1286, %rs1285, 8; - mov.pred %p378, -1; - @%p378 bra $L__BB1_513; - bra.uni $L__BB1_512; - -$L__BB1_513: - shl.b16 %rs4175, %rs1287, 8; - or.b16 %rs4176, %rs1286, %rs4175; - shl.b16 %rs4177, %rs1289, 8; - mov.b32 %r182, {%rs4176, %rs4177}; - shl.b16 %rs4178, %rs1282, 8; - or.b16 %rs4179, %rs1281, %rs4178; - shl.b16 %rs4180, %rs1284, 8; - or.b16 %rs4181, %rs1283, %rs4180; - mov.b32 %r183, {%rs4179, %rs4181}; - shl.b16 %rs4182, %rs1277, 8; - or.b16 %rs4183, %rs1276, %rs4182; - shl.b16 %rs4184, %rs1279, 8; - or.b16 %rs4185, %rs1278, %rs4184; - mov.b32 %r184, {%rs4183, %rs4185}; - shl.b16 %rs4186, %rs1272, 8; - or.b16 %rs4187, %rs1271, %rs4186; - shl.b16 %rs4188, %rs1274, 8; - or.b16 %rs4189, %rs1273, %rs4188; - mov.b32 %r185, {%rs4187, %rs4189}; - shl.b16 %rs4190, %rs1267, 8; - or.b16 %rs4191, %rs1266, %rs4190; - shl.b16 %rs4192, %rs1269, 8; - or.b16 %rs4193, %rs1268, %rs4192; - mov.b32 %r186, {%rs4191, %rs4193}; - shl.b16 %rs4194, %rs1262, 8; - or.b16 %rs4195, %rs1261, %rs4194; - shl.b16 %rs4196, %rs1264, 8; - or.b16 %rs4197, %rs1263, %rs4196; - mov.b32 %r187, {%rs4195, %rs4197}; - shl.b16 %rs4198, %rs1257, 8; - or.b16 %rs4199, %rs1256, %rs4198; - shl.b16 %rs4200, %rs1259, 8; - or.b16 %rs4201, %rs1258, %rs4200; - mov.b32 %r188, {%rs4199, %rs4201}; - shl.b16 %rs4202, %rs1252, 8; - or.b16 %rs4203, %rs1251, %rs4202; - shl.b16 %rs4204, %rs1254, 8; - or.b16 %rs4205, %rs1253, %rs4204; - mov.b32 %r189, {%rs4203, %rs4205}; - shl.b16 %rs4206, %rs1247, 8; - or.b16 %rs4207, %rs1246, %rs4206; - shl.b16 %rs4208, %rs1249, 8; - or.b16 %rs4209, %rs1248, %rs4208; - mov.b32 %r190, {%rs4207, %rs4209}; - shl.b16 %rs4210, %rs1242, 8; - or.b16 %rs4211, %rs1241, %rs4210; - shl.b16 
%rs4212, %rs1244, 8; - or.b16 %rs4213, %rs1243, %rs4212; - mov.b32 %r191, {%rs4211, %rs4213}; - shl.b16 %rs4214, %rs1237, 8; - or.b16 %rs4215, %rs1236, %rs4214; - shl.b16 %rs4216, %rs1239, 8; - or.b16 %rs4217, %rs1238, %rs4216; - mov.b32 %r192, {%rs4215, %rs4217}; - shl.b16 %rs4218, %rs1232, 8; - or.b16 %rs4219, %rs1231, %rs4218; - shl.b16 %rs4220, %rs1234, 8; - or.b16 %rs4221, %rs1233, %rs4220; - mov.b32 %r193, {%rs4219, %rs4221}; - shl.b16 %rs4222, %rs1227, 8; - or.b16 %rs4223, %rs1226, %rs4222; - shl.b16 %rs4224, %rs1229, 8; - or.b16 %rs4225, %rs1228, %rs4224; - mov.b32 %r194, {%rs4223, %rs4225}; - shl.b16 %rs4226, %rs1222, 8; - or.b16 %rs4227, %rs1221, %rs4226; - shl.b16 %rs4228, %rs1224, 8; - or.b16 %rs4229, %rs1223, %rs4228; - mov.b32 %r195, {%rs4227, %rs4229}; - shl.b16 %rs4230, %rs1217, 8; - or.b16 %rs4231, %rs1216, %rs4230; - shl.b16 %rs4232, %rs1219, 8; - or.b16 %rs4233, %rs1218, %rs4232; - mov.b32 %r196, {%rs4231, %rs4233}; - mov.u32 %r9156, -1043882854; - mov.u32 %r9153, %r9152; - @%p364 bra $L__BB1_515; - - add.s32 %r8130, %r196, -1; - shf.l.wrap.b32 %r8131, %r8130, %r8130, 3; - not.b32 %r8132, %r8131; - and.b32 %r8133, %r8131, -271733879; - and.b32 %r8134, %r8132, -1732584194; - or.b32 %r8135, %r8134, %r8133; - add.s32 %r8136, %r8135, %r195; - add.s32 %r8137, %r8136, 271733878; - shf.l.wrap.b32 %r8138, %r8137, %r8137, 7; - not.b32 %r8139, %r8138; - and.b32 %r8140, %r8138, %r8131; - and.b32 %r8141, %r8139, -271733879; - or.b32 %r8142, %r8141, %r8140; - add.s32 %r8143, %r8142, %r194; - add.s32 %r8144, %r8143, -1732584194; - shf.l.wrap.b32 %r8145, %r8144, %r8144, 11; - and.b32 %r8146, %r8145, %r8138; - not.b32 %r8147, %r8145; - and.b32 %r8148, %r8131, %r8147; - or.b32 %r8149, %r8148, %r8146; - add.s32 %r8150, %r8149, %r193; - add.s32 %r8151, %r8150, -271733879; - shf.l.wrap.b32 %r8152, %r8151, %r8151, 19; - and.b32 %r8153, %r8145, %r8152; - not.b32 %r8154, %r8152; - and.b32 %r8155, %r8138, %r8154; - or.b32 %r8156, %r8155, %r8153; - add.s32 %r8157, 
%r8156, %r8131; - add.s32 %r8158, %r8157, %r192; - shf.l.wrap.b32 %r8159, %r8158, %r8158, 3; - and.b32 %r8160, %r8159, %r8152; - not.b32 %r8161, %r8159; - and.b32 %r8162, %r8145, %r8161; - or.b32 %r8163, %r8162, %r8160; - add.s32 %r8164, %r8163, %r8138; - add.s32 %r8165, %r8164, %r191; - shf.l.wrap.b32 %r8166, %r8165, %r8165, 7; - and.b32 %r8167, %r8166, %r8159; - not.b32 %r8168, %r8166; - and.b32 %r8169, %r8152, %r8168; - or.b32 %r8170, %r8169, %r8167; - add.s32 %r8171, %r8170, %r8145; - add.s32 %r8172, %r8171, %r190; - shf.l.wrap.b32 %r8173, %r8172, %r8172, 11; - and.b32 %r8174, %r8173, %r8166; - not.b32 %r8175, %r8173; - and.b32 %r8176, %r8159, %r8175; - or.b32 %r8177, %r8176, %r8174; - add.s32 %r8178, %r8177, %r8152; - add.s32 %r8179, %r8178, %r189; - shf.l.wrap.b32 %r8180, %r8179, %r8179, 19; - and.b32 %r8181, %r8173, %r8180; - not.b32 %r8182, %r8180; - and.b32 %r8183, %r8166, %r8182; - or.b32 %r8184, %r8183, %r8181; - add.s32 %r8185, %r8184, %r8159; - add.s32 %r8186, %r8185, %r188; - shf.l.wrap.b32 %r8187, %r8186, %r8186, 3; - and.b32 %r8188, %r8187, %r8180; - not.b32 %r8189, %r8187; - and.b32 %r8190, %r8173, %r8189; - or.b32 %r8191, %r8190, %r8188; - add.s32 %r8192, %r8191, %r8166; - add.s32 %r8193, %r8192, %r187; - shf.l.wrap.b32 %r8194, %r8193, %r8193, 7; - and.b32 %r8195, %r8194, %r8187; - not.b32 %r8196, %r8194; - and.b32 %r8197, %r8180, %r8196; - or.b32 %r8198, %r8197, %r8195; - add.s32 %r8199, %r8198, %r8173; - add.s32 %r8200, %r8199, %r186; - shf.l.wrap.b32 %r8201, %r8200, %r8200, 11; - and.b32 %r8202, %r8201, %r8194; - not.b32 %r8203, %r8201; - and.b32 %r8204, %r8187, %r8203; - or.b32 %r8205, %r8204, %r8202; - add.s32 %r8206, %r8205, %r8180; - add.s32 %r8207, %r8206, %r185; - shf.l.wrap.b32 %r8208, %r8207, %r8207, 19; - and.b32 %r8209, %r8201, %r8208; - not.b32 %r8210, %r8208; - and.b32 %r8211, %r8194, %r8210; - or.b32 %r8212, %r8211, %r8209; - add.s32 %r8213, %r8212, %r8187; - add.s32 %r8214, %r8213, %r184; - shf.l.wrap.b32 %r8215, %r8214, %r8214, 
3; - and.b32 %r8216, %r8215, %r8208; - not.b32 %r8217, %r8215; - and.b32 %r8218, %r8201, %r8217; - or.b32 %r8219, %r8218, %r8216; - add.s32 %r8220, %r8219, %r8194; - add.s32 %r8221, %r8220, %r183; - shf.l.wrap.b32 %r9153, %r8221, %r8221, 7; - and.b32 %r8222, %r9153, %r8215; - not.b32 %r8223, %r9153; - and.b32 %r8224, %r8208, %r8223; - or.b32 %r8225, %r8224, %r8222; - add.s32 %r8226, %r8225, %r8201; - add.s32 %r8227, %r8226, %r182; - shf.l.wrap.b32 %r9154, %r8227, %r8227, 11; - and.b32 %r9152, %r9154, %r9153; - not.b32 %r8228, %r9154; - and.b32 %r8229, %r8215, %r8228; - or.b32 %r8230, %r8229, %r9152; - add.s32 %r8231, %r8230, %r8208; - shf.l.wrap.b32 %r9155, %r8231, %r8231, 19; - add.s32 %r9156, %r8215, 1518500249; - -$L__BB1_515: - or.b32 %r8232, %r9154, %r9153; - and.b32 %r8233, %r8232, %r9155; - or.b32 %r8234, %r8233, %r9152; - add.s32 %r8235, %r9156, %r8234; - add.s32 %r8236, %r8235, %r196; - shf.l.wrap.b32 %r8237, %r8236, %r8236, 3; - or.b32 %r8238, %r9155, %r9154; - and.b32 %r8239, %r8237, %r8238; - and.b32 %r8240, %r9155, %r9154; - or.b32 %r8241, %r8239, %r8240; - add.s32 %r8242, %r9153, %r192; - add.s32 %r8243, %r8242, %r8241; - add.s32 %r8244, %r8243, 1518500249; - shf.l.wrap.b32 %r8245, %r8244, %r8244, 5; - or.b32 %r8246, %r8237, %r9155; - and.b32 %r8247, %r8245, %r8246; - and.b32 %r8248, %r8237, %r9155; - or.b32 %r8249, %r8247, %r8248; - add.s32 %r8250, %r9154, %r188; - add.s32 %r8251, %r8250, %r8249; - add.s32 %r8252, %r8251, 1518500249; - shf.l.wrap.b32 %r8253, %r8252, %r8252, 9; - or.b32 %r8254, %r8245, %r8237; - and.b32 %r8255, %r8253, %r8254; - and.b32 %r8256, %r8245, %r8237; - or.b32 %r8257, %r8255, %r8256; - add.s32 %r8258, %r9155, %r184; - add.s32 %r8259, %r8258, %r8257; - add.s32 %r8260, %r8259, 1518500249; - shf.l.wrap.b32 %r8261, %r8260, %r8260, 13; - or.b32 %r8262, %r8253, %r8245; - and.b32 %r8263, %r8261, %r8262; - and.b32 %r8264, %r8253, %r8245; - or.b32 %r8265, %r8263, %r8264; - add.s32 %r8266, %r8237, %r195; - add.s32 %r8267, %r8266, 
%r8265; - add.s32 %r8268, %r8267, 1518500249; - shf.l.wrap.b32 %r8269, %r8268, %r8268, 3; - or.b32 %r8270, %r8261, %r8253; - and.b32 %r8271, %r8269, %r8270; - and.b32 %r8272, %r8261, %r8253; - or.b32 %r8273, %r8271, %r8272; - add.s32 %r8274, %r191, %r8245; - add.s32 %r8275, %r8274, %r8273; - add.s32 %r8276, %r8275, 1518500249; - shf.l.wrap.b32 %r8277, %r8276, %r8276, 5; - or.b32 %r8278, %r8269, %r8261; - and.b32 %r8279, %r8277, %r8278; - and.b32 %r8280, %r8269, %r8261; - or.b32 %r8281, %r8279, %r8280; - add.s32 %r8282, %r187, %r8253; - add.s32 %r8283, %r8282, %r8281; - add.s32 %r8284, %r8283, 1518500249; - shf.l.wrap.b32 %r8285, %r8284, %r8284, 9; - or.b32 %r8286, %r8277, %r8269; - and.b32 %r8287, %r8285, %r8286; - and.b32 %r8288, %r8277, %r8269; - or.b32 %r8289, %r8287, %r8288; - add.s32 %r8290, %r183, %r8261; - add.s32 %r8291, %r8290, %r8289; - add.s32 %r8292, %r8291, 1518500249; - shf.l.wrap.b32 %r8293, %r8292, %r8292, 13; - or.b32 %r8294, %r8285, %r8277; - and.b32 %r8295, %r8293, %r8294; - and.b32 %r8296, %r8285, %r8277; - or.b32 %r8297, %r8295, %r8296; - add.s32 %r8298, %r194, %r8269; - add.s32 %r8299, %r8298, %r8297; - add.s32 %r8300, %r8299, 1518500249; - shf.l.wrap.b32 %r8301, %r8300, %r8300, 3; - or.b32 %r8302, %r8293, %r8285; - and.b32 %r8303, %r8301, %r8302; - and.b32 %r8304, %r8293, %r8285; - or.b32 %r8305, %r8303, %r8304; - add.s32 %r8306, %r190, %r8277; - add.s32 %r8307, %r8306, %r8305; - add.s32 %r8308, %r8307, 1518500249; - shf.l.wrap.b32 %r8309, %r8308, %r8308, 5; - or.b32 %r8310, %r8301, %r8293; - and.b32 %r8311, %r8309, %r8310; - and.b32 %r8312, %r8301, %r8293; - or.b32 %r8313, %r8311, %r8312; - add.s32 %r8314, %r186, %r8285; - add.s32 %r8315, %r8314, %r8313; - add.s32 %r8316, %r8315, 1518500249; - shf.l.wrap.b32 %r8317, %r8316, %r8316, 9; - or.b32 %r8318, %r8309, %r8301; - and.b32 %r8319, %r8317, %r8318; - and.b32 %r8320, %r8309, %r8301; - or.b32 %r8321, %r8319, %r8320; - add.s32 %r8322, %r182, %r8293; - add.s32 %r8323, %r8322, %r8321; - add.s32 
%r8324, %r8323, 1518500249; - shf.l.wrap.b32 %r8325, %r8324, %r8324, 13; - or.b32 %r8326, %r8317, %r8309; - and.b32 %r8327, %r8325, %r8326; - and.b32 %r8328, %r8317, %r8309; - or.b32 %r8329, %r8327, %r8328; - add.s32 %r8330, %r193, %r8301; - add.s32 %r8331, %r8330, %r8329; - add.s32 %r8332, %r8331, 1518500249; - shf.l.wrap.b32 %r9160, %r8332, %r8332, 3; - or.b32 %r8333, %r8325, %r8317; - and.b32 %r8334, %r9160, %r8333; - and.b32 %r8335, %r8325, %r8317; - or.b32 %r8336, %r8334, %r8335; - add.s32 %r8337, %r189, %r8309; - add.s32 %r8338, %r8337, %r8336; - add.s32 %r8339, %r8338, 1518500249; - shf.l.wrap.b32 %r9157, %r8339, %r8339, 5; - or.b32 %r8340, %r9160, %r8325; - and.b32 %r8341, %r9157, %r8340; - and.b32 %r8342, %r9160, %r8325; - or.b32 %r8343, %r8341, %r8342; - add.s32 %r8344, %r185, %r8317; - add.s32 %r8345, %r8344, %r8343; - add.s32 %r8346, %r8345, 1518500249; - shf.l.wrap.b32 %r9158, %r8346, %r8346, 9; - or.b32 %r8347, %r9157, %r9160; - and.b32 %r8348, %r9158, %r8347; - and.b32 %r8349, %r9157, %r9160; - or.b32 %r8350, %r8348, %r8349; - add.s32 %r8351, %r8325, %r8350; - add.s32 %r8352, %r8351, 1518500249; - shf.l.wrap.b32 %r9159, %r8352, %r8352, 13; - @%p364 bra $L__BB1_517; - - xor.b32 %r8353, %r9158, %r9159; - xor.b32 %r8354, %r8353, %r9157; - add.s32 %r8355, %r9160, %r8354; - add.s32 %r8356, %r8355, %r196; - add.s32 %r8357, %r8356, 1859775393; - shf.l.wrap.b32 %r8358, %r8357, %r8357, 3; - xor.b32 %r8359, %r8358, %r8353; - add.s32 %r8360, %r9157, %r8359; - add.s32 %r8361, %r8360, %r188; - add.s32 %r8362, %r8361, 1859775393; - shf.l.wrap.b32 %r8363, %r8362, %r8362, 9; - xor.b32 %r8364, %r8358, %r9159; - xor.b32 %r8365, %r8364, %r8363; - add.s32 %r8366, %r9158, %r192; - add.s32 %r8367, %r8366, %r8365; - add.s32 %r8368, %r8367, 1859775393; - shf.l.wrap.b32 %r8369, %r8368, %r8368, 11; - xor.b32 %r8370, %r8363, %r8358; - xor.b32 %r8371, %r8370, %r8369; - add.s32 %r8372, %r9159, %r8371; - add.s32 %r8373, %r8372, %r184; - add.s32 %r8374, %r8373, 1859775393; - 
shf.l.wrap.b32 %r8375, %r8374, %r8374, 15; - xor.b32 %r8376, %r8369, %r8375; - xor.b32 %r8377, %r8376, %r8363; - add.s32 %r8378, %r8358, %r8377; - add.s32 %r8379, %r8378, %r194; - add.s32 %r8380, %r8379, 1859775393; - shf.l.wrap.b32 %r8381, %r8380, %r8380, 3; - xor.b32 %r8382, %r8381, %r8376; - add.s32 %r8383, %r8363, %r8382; - add.s32 %r8384, %r8383, %r186; - add.s32 %r8385, %r8384, 1859775393; - shf.l.wrap.b32 %r8386, %r8385, %r8385, 9; - xor.b32 %r8387, %r8381, %r8375; - xor.b32 %r8388, %r8387, %r8386; - add.s32 %r8389, %r8369, %r190; - add.s32 %r8390, %r8389, %r8388; - add.s32 %r8391, %r8390, 1859775393; - shf.l.wrap.b32 %r8392, %r8391, %r8391, 11; - xor.b32 %r8393, %r8386, %r8381; - xor.b32 %r8394, %r8393, %r8392; - add.s32 %r8395, %r8375, %r8394; - add.s32 %r8396, %r8395, %r182; - add.s32 %r8397, %r8396, 1859775393; - shf.l.wrap.b32 %r8398, %r8397, %r8397, 15; - xor.b32 %r8399, %r8392, %r8398; - xor.b32 %r8400, %r8399, %r8386; - add.s32 %r8401, %r8381, %r8400; - add.s32 %r8402, %r8401, %r195; - add.s32 %r8403, %r8402, 1859775393; - shf.l.wrap.b32 %r8404, %r8403, %r8403, 3; - xor.b32 %r8405, %r8404, %r8399; - add.s32 %r8406, %r8386, %r8405; - add.s32 %r8407, %r8406, %r187; - add.s32 %r8408, %r8407, 1859775393; - shf.l.wrap.b32 %r8409, %r8408, %r8408, 9; - xor.b32 %r8410, %r8404, %r8398; - xor.b32 %r8411, %r8410, %r8409; - add.s32 %r8412, %r8392, %r191; - add.s32 %r8413, %r8412, %r8411; - add.s32 %r8414, %r8413, 1859775393; - shf.l.wrap.b32 %r8415, %r8414, %r8414, 11; - xor.b32 %r8416, %r8409, %r8404; - xor.b32 %r8417, %r8416, %r8415; - add.s32 %r8418, %r8398, %r8417; - add.s32 %r8419, %r8418, %r183; - add.s32 %r8420, %r8419, 1859775393; - shf.l.wrap.b32 %r8421, %r8420, %r8420, 15; - xor.b32 %r8422, %r8415, %r8421; - xor.b32 %r8423, %r8422, %r8409; - add.s32 %r8424, %r8404, %r8423; - add.s32 %r8425, %r8424, %r193; - add.s32 %r8426, %r8425, 1859775393; - shf.l.wrap.b32 %r9160, %r8426, %r8426, 3; - xor.b32 %r8427, %r9160, %r8422; - add.s32 %r8428, %r8409, %r8427; 
- add.s32 %r8429, %r8428, %r185; - add.s32 %r8430, %r8429, 1859775393; - shf.l.wrap.b32 %r9157, %r8430, %r8430, 9; - xor.b32 %r8431, %r9160, %r8421; - xor.b32 %r8432, %r8431, %r9157; - add.s32 %r8433, %r8415, %r189; - add.s32 %r8434, %r8433, %r8432; - add.s32 %r8435, %r8434, 1859775393; - shf.l.wrap.b32 %r9158, %r8435, %r8435, 11; - xor.b32 %r8436, %r9157, %r9160; - xor.b32 %r8437, %r8436, %r9158; - add.s32 %r8438, %r8421, %r8437; - add.s32 %r8439, %r8438, 1859775393; - shf.l.wrap.b32 %r9159, %r8439, %r8439, 15; - -$L__BB1_517: - add.s32 %r9182, %r9160, 1732584193; - add.s32 %r9181, %r9159, -271733879; - add.s32 %r9180, %r9158, -1732584194; - add.s32 %r9179, %r9157, 271733878; - bra.uni $L__BB1_548; - -$L__BB1_543: - and.b32 %r8794, %r263, %r262; - mov.u32 %r8795, 271733878; - sub.s32 %r8796, %r8795, %r9168; - and.b32 %r8797, %r264, %r8796; - or.b32 %r8798, %r8797, %r8794; - add.s32 %r8799, %r8798, %r261; - shf.l.wrap.b32 %r8800, %r8799, %r8799, 3; - and.b32 %r8801, %r8800, %r262; - not.b32 %r8802, %r8800; - and.b32 %r8803, %r263, %r8802; - or.b32 %r8804, %r8803, %r8801; - add.s32 %r8805, %r8804, %r264; - shf.l.wrap.b32 %r8806, %r8805, %r8805, 7; - and.b32 %r8807, %r8806, %r8800; - not.b32 %r8808, %r8806; - and.b32 %r8809, %r262, %r8808; - or.b32 %r8810, %r8809, %r8807; - add.s32 %r8811, %r8810, %r263; - shf.l.wrap.b32 %r8812, %r8811, %r8811, 11; - and.b32 %r8813, %r8812, %r8806; - not.b32 %r8814, %r8812; - and.b32 %r8815, %r8800, %r8814; - or.b32 %r8816, %r8815, %r8813; - add.s32 %r8817, %r8816, %r262; - shf.l.wrap.b32 %r8818, %r8817, %r8817, 19; - and.b32 %r8819, %r8812, %r8818; - not.b32 %r8820, %r8818; - and.b32 %r8821, %r8806, %r8820; - or.b32 %r8822, %r8821, %r8819; - add.s32 %r8823, %r8822, %r8800; - shf.l.wrap.b32 %r8824, %r8823, %r8823, 3; - and.b32 %r8825, %r8824, %r8818; - not.b32 %r8826, %r8824; - and.b32 %r8827, %r8812, %r8826; - or.b32 %r8828, %r8827, %r8825; - add.s32 %r8829, %r8828, %r8806; - shf.l.wrap.b32 %r8830, %r8829, %r8829, 7; - and.b32 
%r8831, %r8830, %r8824; - not.b32 %r8832, %r8830; - and.b32 %r8833, %r8818, %r8832; - or.b32 %r8834, %r8833, %r8831; - add.s32 %r8835, %r8834, %r8812; - shf.l.wrap.b32 %r8836, %r8835, %r8835, 11; - and.b32 %r8837, %r8836, %r8830; - not.b32 %r8838, %r8836; - and.b32 %r8839, %r8824, %r8838; - or.b32 %r8840, %r8839, %r8837; - add.s32 %r8841, %r8840, %r8818; - shf.l.wrap.b32 %r8842, %r8841, %r8841, 19; - and.b32 %r8843, %r8836, %r8842; - not.b32 %r8844, %r8842; - and.b32 %r8845, %r8830, %r8844; - or.b32 %r8846, %r8845, %r8843; - add.s32 %r8847, %r8846, %r8824; - shf.l.wrap.b32 %r8848, %r8847, %r8847, 3; - and.b32 %r8849, %r8848, %r8842; - not.b32 %r8850, %r8848; - and.b32 %r8851, %r8836, %r8850; - or.b32 %r8852, %r8851, %r8849; - add.s32 %r8853, %r8852, %r8830; - shf.l.wrap.b32 %r8854, %r8853, %r8853, 7; - and.b32 %r8855, %r8854, %r8848; - not.b32 %r8856, %r8854; - and.b32 %r8857, %r8842, %r8856; - or.b32 %r8858, %r8857, %r8855; - add.s32 %r8859, %r8858, %r8836; - shf.l.wrap.b32 %r8860, %r8859, %r8859, 11; - and.b32 %r8861, %r8860, %r8854; - not.b32 %r8862, %r8860; - and.b32 %r8863, %r8848, %r8862; - or.b32 %r8864, %r8863, %r8861; - add.s32 %r8865, %r8864, %r8842; - shf.l.wrap.b32 %r8866, %r8865, %r8865, 19; - and.b32 %r8867, %r8860, %r8866; - not.b32 %r8868, %r8866; - and.b32 %r8869, %r8854, %r8868; - or.b32 %r8870, %r8869, %r8867; - add.s32 %r8871, %r8870, %r8848; - shf.l.wrap.b32 %r9174, %r8871, %r8871, 3; - and.b32 %r8872, %r9174, %r8866; - not.b32 %r8873, %r9174; - and.b32 %r8874, %r8860, %r8873; - or.b32 %r8875, %r8874, %r8872; - add.s32 %r8876, %r8875, %r8854; - shf.l.wrap.b32 %r9171, %r8876, %r8876, 7; - and.b32 %r8877, %r9171, %r9174; - not.b32 %r8878, %r9171; - and.b32 %r8879, %r8866, %r8878; - or.b32 %r8880, %r8879, %r8877; - add.s32 %r8881, %r8880, %r8860; - add.s32 %r8882, %r8881, %r268; - shf.l.wrap.b32 %r9172, %r8882, %r8882, 11; - and.b32 %r9170, %r9172, %r9171; - not.b32 %r8883, %r9172; - and.b32 %r8884, %r9174, %r8883; - or.b32 %r8885, %r8884, %r9170; 
- add.s32 %r8886, %r8885, %r8866; - add.s32 %r8887, %r8886, %r267; - shf.l.wrap.b32 %r9173, %r8887, %r8887, 19; - -$L__BB1_545: - or.b32 %r8888, %r9172, %r9171; - and.b32 %r8889, %r8888, %r9173; - or.b32 %r8890, %r8889, %r9170; - add.s32 %r8891, %r9174, %r8890; - add.s32 %r8892, %r8891, 1518500249; - shf.l.wrap.b32 %r8893, %r8892, %r8892, 3; - or.b32 %r8894, %r9173, %r9172; - and.b32 %r8895, %r8893, %r8894; - and.b32 %r8896, %r9173, %r9172; - or.b32 %r8897, %r8895, %r8896; - add.s32 %r8898, %r9171, %r8897; - add.s32 %r8899, %r8898, 1518500249; - shf.l.wrap.b32 %r8900, %r8899, %r8899, 5; - or.b32 %r8901, %r8893, %r9173; - and.b32 %r8902, %r8900, %r8901; - and.b32 %r8903, %r8893, %r9173; - or.b32 %r8904, %r8902, %r8903; - add.s32 %r8905, %r9172, %r8904; - add.s32 %r8906, %r8905, 1518500249; - shf.l.wrap.b32 %r8907, %r8906, %r8906, 9; - or.b32 %r8908, %r8900, %r8893; - and.b32 %r8909, %r8907, %r8908; - and.b32 %r8910, %r8900, %r8893; - or.b32 %r8911, %r8909, %r8910; - add.s32 %r8912, %r9173, %r8911; - add.s32 %r8913, %r8912, 1518500249; - shf.l.wrap.b32 %r8914, %r8913, %r8913, 13; - or.b32 %r8915, %r8907, %r8900; - and.b32 %r8916, %r8914, %r8915; - and.b32 %r8917, %r8907, %r8900; - or.b32 %r8918, %r8916, %r8917; - add.s32 %r8919, %r8893, %r8918; - add.s32 %r8920, %r8919, 1518500249; - shf.l.wrap.b32 %r8921, %r8920, %r8920, 3; - or.b32 %r8922, %r8914, %r8907; - and.b32 %r8923, %r8921, %r8922; - and.b32 %r8924, %r8914, %r8907; - or.b32 %r8925, %r8923, %r8924; - add.s32 %r8926, %r8900, %r8925; - add.s32 %r8927, %r8926, 1518500249; - shf.l.wrap.b32 %r8928, %r8927, %r8927, 5; - or.b32 %r8929, %r8921, %r8914; - and.b32 %r8930, %r8928, %r8929; - and.b32 %r8931, %r8921, %r8914; - or.b32 %r8932, %r8930, %r8931; - add.s32 %r8933, %r8907, %r8932; - add.s32 %r8934, %r8933, 1518500249; - shf.l.wrap.b32 %r8935, %r8934, %r8934, 9; - or.b32 %r8936, %r8928, %r8921; - and.b32 %r8937, %r8935, %r8936; - and.b32 %r8938, %r8928, %r8921; - or.b32 %r8939, %r8937, %r8938; - add.s32 %r8940, 
%r8914, %r8939; - add.s32 %r8941, %r8940, 1518500249; - shf.l.wrap.b32 %r8942, %r8941, %r8941, 13; - or.b32 %r8943, %r8935, %r8928; - and.b32 %r8944, %r8942, %r8943; - and.b32 %r8945, %r8935, %r8928; - or.b32 %r8946, %r8944, %r8945; - add.s32 %r8947, %r8921, %r8946; - add.s32 %r8948, %r8947, 1518500249; - shf.l.wrap.b32 %r8949, %r8948, %r8948, 3; - or.b32 %r8950, %r8942, %r8935; - and.b32 %r8951, %r8949, %r8950; - and.b32 %r8952, %r8942, %r8935; - or.b32 %r8953, %r8951, %r8952; - add.s32 %r8954, %r8928, %r8953; - add.s32 %r8955, %r8954, 1518500249; - shf.l.wrap.b32 %r8956, %r8955, %r8955, 5; - or.b32 %r8957, %r8949, %r8942; - and.b32 %r8958, %r8956, %r8957; - and.b32 %r8959, %r8949, %r8942; - or.b32 %r8960, %r8958, %r8959; - add.s32 %r8961, %r8935, %r8960; - add.s32 %r8962, %r8961, 1518500249; - shf.l.wrap.b32 %r8963, %r8962, %r8962, 9; - or.b32 %r8964, %r8956, %r8949; - and.b32 %r8965, %r8963, %r8964; - and.b32 %r8966, %r8956, %r8949; - or.b32 %r8967, %r8965, %r8966; - add.s32 %r8968, %r268, %r8942; - add.s32 %r8969, %r8968, %r8967; - add.s32 %r8970, %r8969, 1518500249; - shf.l.wrap.b32 %r8971, %r8970, %r8970, 13; - or.b32 %r8972, %r8963, %r8956; - and.b32 %r8973, %r8971, %r8972; - and.b32 %r8974, %r8963, %r8956; - or.b32 %r8975, %r8973, %r8974; - add.s32 %r8976, %r8949, %r8975; - add.s32 %r8977, %r8976, 1518500249; - shf.l.wrap.b32 %r9178, %r8977, %r8977, 3; - or.b32 %r8978, %r8971, %r8963; - and.b32 %r8979, %r9178, %r8978; - and.b32 %r8980, %r8971, %r8963; - or.b32 %r8981, %r8979, %r8980; - add.s32 %r8982, %r8956, %r8981; - add.s32 %r8983, %r8982, 1518500249; - shf.l.wrap.b32 %r9175, %r8983, %r8983, 5; - or.b32 %r8984, %r9178, %r8971; - and.b32 %r8985, %r9175, %r8984; - and.b32 %r8986, %r9178, %r8971; - or.b32 %r8987, %r8985, %r8986; - add.s32 %r8988, %r8963, %r8987; - add.s32 %r8989, %r8988, 1518500249; - shf.l.wrap.b32 %r9176, %r8989, %r8989, 9; - or.b32 %r8990, %r9175, %r9178; - and.b32 %r8991, %r9176, %r8990; - and.b32 %r8992, %r9175, %r9178; - or.b32 
%r8993, %r8991, %r8992; - add.s32 %r8994, %r267, %r8971; - add.s32 %r8995, %r8994, %r8993; - add.s32 %r8996, %r8995, 1518500249; - shf.l.wrap.b32 %r9177, %r8996, %r8996, 13; - @%p381 bra $L__BB1_547; - - xor.b32 %r8997, %r9176, %r9177; - xor.b32 %r8998, %r8997, %r9175; - add.s32 %r8999, %r9178, %r8998; - add.s32 %r9000, %r8999, 1859775393; - shf.l.wrap.b32 %r9001, %r9000, %r9000, 3; - xor.b32 %r9002, %r9001, %r8997; - add.s32 %r9003, %r9175, %r9002; - add.s32 %r9004, %r9003, 1859775393; - shf.l.wrap.b32 %r9005, %r9004, %r9004, 9; - xor.b32 %r9006, %r9001, %r9177; - xor.b32 %r9007, %r9006, %r9005; - add.s32 %r9008, %r9176, %r9007; - add.s32 %r9009, %r9008, 1859775393; - shf.l.wrap.b32 %r9010, %r9009, %r9009, 11; - xor.b32 %r9011, %r9005, %r9001; - xor.b32 %r9012, %r9011, %r9010; - add.s32 %r9013, %r9177, %r9012; - add.s32 %r9014, %r9013, 1859775393; - shf.l.wrap.b32 %r9015, %r9014, %r9014, 15; - xor.b32 %r9016, %r9010, %r9015; - xor.b32 %r9017, %r9016, %r9005; - add.s32 %r9018, %r9001, %r9017; - add.s32 %r9019, %r9018, 1859775393; - shf.l.wrap.b32 %r9020, %r9019, %r9019, 3; - xor.b32 %r9021, %r9020, %r9016; - add.s32 %r9022, %r9005, %r9021; - add.s32 %r9023, %r9022, 1859775393; - shf.l.wrap.b32 %r9024, %r9023, %r9023, 9; - xor.b32 %r9025, %r9020, %r9015; - xor.b32 %r9026, %r9025, %r9024; - add.s32 %r9027, %r9010, %r9026; - add.s32 %r9028, %r9027, 1859775393; - shf.l.wrap.b32 %r9029, %r9028, %r9028, 11; - xor.b32 %r9030, %r9024, %r9020; - xor.b32 %r9031, %r9030, %r9029; - add.s32 %r9032, %r9015, %r9031; - add.s32 %r9033, %r9032, %r268; - add.s32 %r9034, %r9033, 1859775393; - shf.l.wrap.b32 %r9035, %r9034, %r9034, 15; - xor.b32 %r9036, %r9029, %r9035; - xor.b32 %r9037, %r9036, %r9024; - add.s32 %r9038, %r9020, %r9037; - add.s32 %r9039, %r9038, 1859775393; - shf.l.wrap.b32 %r9040, %r9039, %r9039, 3; - xor.b32 %r9041, %r9040, %r9036; - add.s32 %r9042, %r9024, %r9041; - add.s32 %r9043, %r9042, 1859775393; - shf.l.wrap.b32 %r9044, %r9043, %r9043, 9; - xor.b32 %r9045, 
%r9040, %r9035; - xor.b32 %r9046, %r9045, %r9044; - add.s32 %r9047, %r9029, %r9046; - add.s32 %r9048, %r9047, 1859775393; - shf.l.wrap.b32 %r9049, %r9048, %r9048, 11; - xor.b32 %r9050, %r9044, %r9040; - xor.b32 %r9051, %r9050, %r9049; - add.s32 %r9052, %r9035, %r9051; - add.s32 %r9053, %r9052, 1859775393; - shf.l.wrap.b32 %r9054, %r9053, %r9053, 15; - xor.b32 %r9055, %r9049, %r9054; - xor.b32 %r9056, %r9055, %r9044; - add.s32 %r9057, %r9040, %r9056; - add.s32 %r9058, %r9057, 1859775393; - shf.l.wrap.b32 %r9178, %r9058, %r9058, 3; - xor.b32 %r9059, %r9178, %r9055; - add.s32 %r9060, %r9044, %r9059; - add.s32 %r9061, %r9060, 1859775393; - shf.l.wrap.b32 %r9175, %r9061, %r9061, 9; - xor.b32 %r9062, %r9178, %r9054; - xor.b32 %r9063, %r9062, %r9175; - add.s32 %r9064, %r9049, %r9063; - add.s32 %r9065, %r9064, 1859775393; - shf.l.wrap.b32 %r9176, %r9065, %r9065, 11; - xor.b32 %r9066, %r9175, %r9178; - xor.b32 %r9067, %r9066, %r9176; - add.s32 %r9068, %r9054, %r9067; - add.s32 %r9069, %r9068, %r267; - add.s32 %r9070, %r9069, 1859775393; - shf.l.wrap.b32 %r9177, %r9070, %r9070, 15; - -$L__BB1_547: - add.s32 %r9182, %r261, %r9178; - add.s32 %r9181, %r262, %r9177; - add.s32 %r9180, %r263, %r9176; - add.s32 %r9179, %r264, %r9175; - -$L__BB1_548: - shr.u32 %r9071, %r9182, 8; - shr.u32 %r9072, %r9182, 16; - shr.u32 %r9073, %r9182, 24; - shr.u32 %r9074, %r9181, 8; - shr.u32 %r9075, %r9181, 16; - shr.u32 %r9076, %r9181, 24; - shr.u32 %r9077, %r9180, 8; - shr.u32 %r9078, %r9180, 16; - shr.u32 %r9079, %r9180, 24; - shr.u32 %r9080, %r9179, 8; - shr.u32 %r9081, %r9179, 16; - shr.u32 %r9082, %r9179, 24; - mov.u16 %rs4324, 16; - st.local.u16 [%rd12], %rs4324; - cvt.u16.u32 %rs4325, %r9182; - cvt.u16.u32 %rs4326, %r9071; - st.local.v2.u8 [%rd12+2], {%rs4325, %rs4326}; - cvt.u16.u32 %rs4327, %r9073; - cvt.u16.u32 %rs4328, %r9072; - st.local.v2.u8 [%rd12+4], {%rs4328, %rs4327}; - cvt.u16.u32 %rs4329, %r9181; - cvt.u16.u32 %rs4330, %r9074; - st.local.v2.u8 [%rd12+6], {%rs4329, %rs4330}; - 
cvt.u16.u32 %rs4331, %r9076; - cvt.u16.u32 %rs4332, %r9075; - st.local.v2.u8 [%rd12+8], {%rs4332, %rs4331}; - cvt.u16.u32 %rs4333, %r9180; - cvt.u16.u32 %rs4334, %r9077; - st.local.v2.u8 [%rd12+10], {%rs4333, %rs4334}; - cvt.u16.u32 %rs4335, %r9079; - cvt.u16.u32 %rs4336, %r9078; - st.local.v2.u8 [%rd12+12], {%rs4336, %rs4335}; - cvt.u16.u32 %rs4337, %r9179; - cvt.u16.u32 %rs4338, %r9080; - st.local.v2.u8 [%rd12+14], {%rs4337, %rs4338}; - cvt.u16.u32 %rs4339, %r9082; - cvt.u16.u32 %rs4340, %r9081; - st.local.v2.u8 [%rd12+16], {%rs4340, %rs4339}; - mov.u16 %rs4341, 0; - st.local.v2.u8 [%rd12+18], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+20], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+22], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+24], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+26], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+28], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+30], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+32], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+34], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+36], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+38], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+40], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+42], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+44], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+46], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+48], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+50], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+52], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+54], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+56], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+58], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+60], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+62], {%rs4341, %rs4341}; - st.local.v2.u8 [%rd12+64], {%rs4341, %rs4341}; - bra.uni $L__BB1_549; - -$L__BB1_463: - and.b32 %r7800, %r145, %r144; - mov.u32 %r7801, 271733878; - sub.s32 %r7802, %r7801, %r9137; - and.b32 %r7803, %r146, %r7802; - or.b32 %r7804, %r7803, %r7800; - add.s32 %r7805, %r7804, %r143; - shf.l.wrap.b32 
%r7806, %r7805, %r7805, 3; - and.b32 %r7807, %r7806, %r144; - not.b32 %r7808, %r7806; - and.b32 %r7809, %r145, %r7808; - or.b32 %r7810, %r7809, %r7807; - add.s32 %r7811, %r7810, %r146; - shf.l.wrap.b32 %r7812, %r7811, %r7811, 7; - and.b32 %r7813, %r7812, %r7806; - not.b32 %r7814, %r7812; - and.b32 %r7815, %r144, %r7814; - or.b32 %r7816, %r7815, %r7813; - add.s32 %r7817, %r7816, %r145; - shf.l.wrap.b32 %r7818, %r7817, %r7817, 11; - and.b32 %r7819, %r7818, %r7812; - not.b32 %r7820, %r7818; - and.b32 %r7821, %r7806, %r7820; - or.b32 %r7822, %r7821, %r7819; - add.s32 %r7823, %r7822, %r144; - shf.l.wrap.b32 %r7824, %r7823, %r7823, 19; - and.b32 %r7825, %r7818, %r7824; - not.b32 %r7826, %r7824; - and.b32 %r7827, %r7812, %r7826; - or.b32 %r7828, %r7827, %r7825; - add.s32 %r7829, %r7828, %r7806; - shf.l.wrap.b32 %r7830, %r7829, %r7829, 3; - and.b32 %r7831, %r7830, %r7824; - not.b32 %r7832, %r7830; - and.b32 %r7833, %r7818, %r7832; - or.b32 %r7834, %r7833, %r7831; - add.s32 %r7835, %r7834, %r7812; - shf.l.wrap.b32 %r7836, %r7835, %r7835, 7; - and.b32 %r7837, %r7836, %r7830; - not.b32 %r7838, %r7836; - and.b32 %r7839, %r7824, %r7838; - or.b32 %r7840, %r7839, %r7837; - add.s32 %r7841, %r7840, %r7818; - shf.l.wrap.b32 %r7842, %r7841, %r7841, 11; - and.b32 %r7843, %r7842, %r7836; - not.b32 %r7844, %r7842; - and.b32 %r7845, %r7830, %r7844; - or.b32 %r7846, %r7845, %r7843; - add.s32 %r7847, %r7846, %r7824; - shf.l.wrap.b32 %r7848, %r7847, %r7847, 19; - and.b32 %r7849, %r7842, %r7848; - not.b32 %r7850, %r7848; - and.b32 %r7851, %r7836, %r7850; - or.b32 %r7852, %r7851, %r7849; - add.s32 %r7853, %r7852, %r7830; - shf.l.wrap.b32 %r7854, %r7853, %r7853, 3; - and.b32 %r7855, %r7854, %r7848; - not.b32 %r7856, %r7854; - and.b32 %r7857, %r7842, %r7856; - or.b32 %r7858, %r7857, %r7855; - add.s32 %r7859, %r7858, %r7836; - shf.l.wrap.b32 %r7860, %r7859, %r7859, 7; - and.b32 %r7861, %r7860, %r7854; - not.b32 %r7862, %r7860; - and.b32 %r7863, %r7848, %r7862; - or.b32 %r7864, %r7863, %r7861; - 
add.s32 %r7865, %r7864, %r7842; - shf.l.wrap.b32 %r7866, %r7865, %r7865, 11; - and.b32 %r7867, %r7866, %r7860; - not.b32 %r7868, %r7866; - and.b32 %r7869, %r7854, %r7868; - or.b32 %r7870, %r7869, %r7867; - add.s32 %r7871, %r7870, %r7848; - shf.l.wrap.b32 %r7872, %r7871, %r7871, 19; - and.b32 %r7873, %r7866, %r7872; - not.b32 %r7874, %r7872; - and.b32 %r7875, %r7860, %r7874; - or.b32 %r7876, %r7875, %r7873; - add.s32 %r7877, %r7876, %r7854; - shf.l.wrap.b32 %r9143, %r7877, %r7877, 3; - and.b32 %r7878, %r9143, %r7872; - not.b32 %r7879, %r9143; - and.b32 %r7880, %r7866, %r7879; - or.b32 %r7881, %r7880, %r7878; - add.s32 %r7882, %r7881, %r7860; - shf.l.wrap.b32 %r9140, %r7882, %r7882, 7; - and.b32 %r7883, %r9140, %r9143; - not.b32 %r7884, %r9140; - and.b32 %r7885, %r7872, %r7884; - or.b32 %r7886, %r7885, %r7883; - add.s32 %r7887, %r7886, %r7866; - add.s32 %r7888, %r7887, %r150; - shf.l.wrap.b32 %r9141, %r7888, %r7888, 11; - and.b32 %r9139, %r9141, %r9140; - not.b32 %r7889, %r9141; - and.b32 %r7890, %r9143, %r7889; - or.b32 %r7891, %r7890, %r9139; - add.s32 %r7892, %r7891, %r7872; - add.s32 %r7893, %r7892, %r149; - shf.l.wrap.b32 %r9142, %r7893, %r7893, 19; - -$L__BB1_465: - or.b32 %r7894, %r9141, %r9140; - and.b32 %r7895, %r7894, %r9142; - or.b32 %r7896, %r7895, %r9139; - add.s32 %r7897, %r9143, %r7896; - add.s32 %r7898, %r7897, 1518500249; - shf.l.wrap.b32 %r7899, %r7898, %r7898, 3; - or.b32 %r7900, %r9142, %r9141; - and.b32 %r7901, %r7899, %r7900; - and.b32 %r7902, %r9142, %r9141; - or.b32 %r7903, %r7901, %r7902; - add.s32 %r7904, %r9140, %r7903; - add.s32 %r7905, %r7904, 1518500249; - shf.l.wrap.b32 %r7906, %r7905, %r7905, 5; - or.b32 %r7907, %r7899, %r9142; - and.b32 %r7908, %r7906, %r7907; - and.b32 %r7909, %r7899, %r9142; - or.b32 %r7910, %r7908, %r7909; - add.s32 %r7911, %r9141, %r7910; - add.s32 %r7912, %r7911, 1518500249; - shf.l.wrap.b32 %r7913, %r7912, %r7912, 9; - or.b32 %r7914, %r7906, %r7899; - and.b32 %r7915, %r7913, %r7914; - and.b32 %r7916, %r7906, 
%r7899; - or.b32 %r7917, %r7915, %r7916; - add.s32 %r7918, %r9142, %r7917; - add.s32 %r7919, %r7918, 1518500249; - shf.l.wrap.b32 %r7920, %r7919, %r7919, 13; - or.b32 %r7921, %r7913, %r7906; - and.b32 %r7922, %r7920, %r7921; - and.b32 %r7923, %r7913, %r7906; - or.b32 %r7924, %r7922, %r7923; - add.s32 %r7925, %r7899, %r7924; - add.s32 %r7926, %r7925, 1518500249; - shf.l.wrap.b32 %r7927, %r7926, %r7926, 3; - or.b32 %r7928, %r7920, %r7913; - and.b32 %r7929, %r7927, %r7928; - and.b32 %r7930, %r7920, %r7913; - or.b32 %r7931, %r7929, %r7930; - add.s32 %r7932, %r7906, %r7931; - add.s32 %r7933, %r7932, 1518500249; - shf.l.wrap.b32 %r7934, %r7933, %r7933, 5; - or.b32 %r7935, %r7927, %r7920; - and.b32 %r7936, %r7934, %r7935; - and.b32 %r7937, %r7927, %r7920; - or.b32 %r7938, %r7936, %r7937; - add.s32 %r7939, %r7913, %r7938; - add.s32 %r7940, %r7939, 1518500249; - shf.l.wrap.b32 %r7941, %r7940, %r7940, 9; - or.b32 %r7942, %r7934, %r7927; - and.b32 %r7943, %r7941, %r7942; - and.b32 %r7944, %r7934, %r7927; - or.b32 %r7945, %r7943, %r7944; - add.s32 %r7946, %r7920, %r7945; - add.s32 %r7947, %r7946, 1518500249; - shf.l.wrap.b32 %r7948, %r7947, %r7947, 13; - or.b32 %r7949, %r7941, %r7934; - and.b32 %r7950, %r7948, %r7949; - and.b32 %r7951, %r7941, %r7934; - or.b32 %r7952, %r7950, %r7951; - add.s32 %r7953, %r7927, %r7952; - add.s32 %r7954, %r7953, 1518500249; - shf.l.wrap.b32 %r7955, %r7954, %r7954, 3; - or.b32 %r7956, %r7948, %r7941; - and.b32 %r7957, %r7955, %r7956; - and.b32 %r7958, %r7948, %r7941; - or.b32 %r7959, %r7957, %r7958; - add.s32 %r7960, %r7934, %r7959; - add.s32 %r7961, %r7960, 1518500249; - shf.l.wrap.b32 %r7962, %r7961, %r7961, 5; - or.b32 %r7963, %r7955, %r7948; - and.b32 %r7964, %r7962, %r7963; - and.b32 %r7965, %r7955, %r7948; - or.b32 %r7966, %r7964, %r7965; - add.s32 %r7967, %r7941, %r7966; - add.s32 %r7968, %r7967, 1518500249; - shf.l.wrap.b32 %r7969, %r7968, %r7968, 9; - or.b32 %r7970, %r7962, %r7955; - and.b32 %r7971, %r7969, %r7970; - and.b32 %r7972, 
%r7962, %r7955; - or.b32 %r7973, %r7971, %r7972; - add.s32 %r7974, %r150, %r7948; - add.s32 %r7975, %r7974, %r7973; - add.s32 %r7976, %r7975, 1518500249; - shf.l.wrap.b32 %r7977, %r7976, %r7976, 13; - or.b32 %r7978, %r7969, %r7962; - and.b32 %r7979, %r7977, %r7978; - and.b32 %r7980, %r7969, %r7962; - or.b32 %r7981, %r7979, %r7980; - add.s32 %r7982, %r7955, %r7981; - add.s32 %r7983, %r7982, 1518500249; - shf.l.wrap.b32 %r9147, %r7983, %r7983, 3; - or.b32 %r7984, %r7977, %r7969; - and.b32 %r7985, %r9147, %r7984; - and.b32 %r7986, %r7977, %r7969; - or.b32 %r7987, %r7985, %r7986; - add.s32 %r7988, %r7962, %r7987; - add.s32 %r7989, %r7988, 1518500249; - shf.l.wrap.b32 %r9144, %r7989, %r7989, 5; - or.b32 %r7990, %r9147, %r7977; - and.b32 %r7991, %r9144, %r7990; - and.b32 %r7992, %r9147, %r7977; - or.b32 %r7993, %r7991, %r7992; - add.s32 %r7994, %r7969, %r7993; - add.s32 %r7995, %r7994, 1518500249; - shf.l.wrap.b32 %r9145, %r7995, %r7995, 9; - or.b32 %r7996, %r9144, %r9147; - and.b32 %r7997, %r9145, %r7996; - and.b32 %r7998, %r9144, %r9147; - or.b32 %r7999, %r7997, %r7998; - add.s32 %r8000, %r149, %r7977; - add.s32 %r8001, %r8000, %r7999; - add.s32 %r8002, %r8001, 1518500249; - shf.l.wrap.b32 %r9146, %r8002, %r8002, 13; - @%p321 bra $L__BB1_467; - - xor.b32 %r8003, %r9145, %r9146; - xor.b32 %r8004, %r8003, %r9144; - add.s32 %r8005, %r9147, %r8004; - add.s32 %r8006, %r8005, 1859775393; - shf.l.wrap.b32 %r8007, %r8006, %r8006, 3; - xor.b32 %r8008, %r8007, %r8003; - add.s32 %r8009, %r9144, %r8008; - add.s32 %r8010, %r8009, 1859775393; - shf.l.wrap.b32 %r8011, %r8010, %r8010, 9; - xor.b32 %r8012, %r8007, %r9146; - xor.b32 %r8013, %r8012, %r8011; - add.s32 %r8014, %r9145, %r8013; - add.s32 %r8015, %r8014, 1859775393; - shf.l.wrap.b32 %r8016, %r8015, %r8015, 11; - xor.b32 %r8017, %r8011, %r8007; - xor.b32 %r8018, %r8017, %r8016; - add.s32 %r8019, %r9146, %r8018; - add.s32 %r8020, %r8019, 1859775393; - shf.l.wrap.b32 %r8021, %r8020, %r8020, 15; - xor.b32 %r8022, %r8016, %r8021; 
- xor.b32 %r8023, %r8022, %r8011; - add.s32 %r8024, %r8007, %r8023; - add.s32 %r8025, %r8024, 1859775393; - shf.l.wrap.b32 %r8026, %r8025, %r8025, 3; - xor.b32 %r8027, %r8026, %r8022; - add.s32 %r8028, %r8011, %r8027; - add.s32 %r8029, %r8028, 1859775393; - shf.l.wrap.b32 %r8030, %r8029, %r8029, 9; - xor.b32 %r8031, %r8026, %r8021; - xor.b32 %r8032, %r8031, %r8030; - add.s32 %r8033, %r8016, %r8032; - add.s32 %r8034, %r8033, 1859775393; - shf.l.wrap.b32 %r8035, %r8034, %r8034, 11; - xor.b32 %r8036, %r8030, %r8026; - xor.b32 %r8037, %r8036, %r8035; - add.s32 %r8038, %r8021, %r8037; - add.s32 %r8039, %r8038, %r150; - add.s32 %r8040, %r8039, 1859775393; - shf.l.wrap.b32 %r8041, %r8040, %r8040, 15; - xor.b32 %r8042, %r8035, %r8041; - xor.b32 %r8043, %r8042, %r8030; - add.s32 %r8044, %r8026, %r8043; - add.s32 %r8045, %r8044, 1859775393; - shf.l.wrap.b32 %r8046, %r8045, %r8045, 3; - xor.b32 %r8047, %r8046, %r8042; - add.s32 %r8048, %r8030, %r8047; - add.s32 %r8049, %r8048, 1859775393; - shf.l.wrap.b32 %r8050, %r8049, %r8049, 9; - xor.b32 %r8051, %r8046, %r8041; - xor.b32 %r8052, %r8051, %r8050; - add.s32 %r8053, %r8035, %r8052; - add.s32 %r8054, %r8053, 1859775393; - shf.l.wrap.b32 %r8055, %r8054, %r8054, 11; - xor.b32 %r8056, %r8050, %r8046; - xor.b32 %r8057, %r8056, %r8055; - add.s32 %r8058, %r8041, %r8057; - add.s32 %r8059, %r8058, 1859775393; - shf.l.wrap.b32 %r8060, %r8059, %r8059, 15; - xor.b32 %r8061, %r8055, %r8060; - xor.b32 %r8062, %r8061, %r8050; - add.s32 %r8063, %r8046, %r8062; - add.s32 %r8064, %r8063, 1859775393; - shf.l.wrap.b32 %r9147, %r8064, %r8064, 3; - xor.b32 %r8065, %r9147, %r8061; - add.s32 %r8066, %r8050, %r8065; - add.s32 %r8067, %r8066, 1859775393; - shf.l.wrap.b32 %r9144, %r8067, %r8067, 9; - xor.b32 %r8068, %r9147, %r8060; - xor.b32 %r8069, %r8068, %r9144; - add.s32 %r8070, %r8055, %r8069; - add.s32 %r8071, %r8070, 1859775393; - shf.l.wrap.b32 %r9145, %r8071, %r8071, 11; - xor.b32 %r8072, %r9144, %r9147; - xor.b32 %r8073, %r8072, %r9145; - 
add.s32 %r8074, %r8060, %r8073; - add.s32 %r8075, %r8074, %r149; - add.s32 %r8076, %r8075, 1859775393; - shf.l.wrap.b32 %r9146, %r8076, %r8076, 15; - -$L__BB1_467: - add.s32 %r9151, %r143, %r9147; - add.s32 %r9150, %r144, %r9146; - add.s32 %r9149, %r145, %r9145; - add.s32 %r9148, %r146, %r9144; - -$L__BB1_468: - shr.u32 %r8077, %r9151, 8; - shr.u32 %r8078, %r9151, 16; - shr.u32 %r8079, %r9151, 24; - shr.u32 %r8080, %r9150, 8; - shr.u32 %r8081, %r9150, 16; - shr.u32 %r8082, %r9150, 24; - shr.u32 %r8083, %r9149, 8; - shr.u32 %r8084, %r9149, 16; - shr.u32 %r8085, %r9149, 24; - shr.u32 %r8086, %r9148, 8; - shr.u32 %r8087, %r9148, 16; - shr.u32 %r8088, %r9148, 24; - mov.u16 %rs4050, 16; - st.local.u16 [%rd12], %rs4050; - cvt.u16.u32 %rs4051, %r9151; - cvt.u16.u32 %rs4052, %r8077; - st.local.v2.u8 [%rd12+2], {%rs4051, %rs4052}; - cvt.u16.u32 %rs4053, %r8079; - cvt.u16.u32 %rs4054, %r8078; - st.local.v2.u8 [%rd12+4], {%rs4054, %rs4053}; - cvt.u16.u32 %rs4055, %r9150; - cvt.u16.u32 %rs4056, %r8080; - st.local.v2.u8 [%rd12+6], {%rs4055, %rs4056}; - cvt.u16.u32 %rs4057, %r8082; - cvt.u16.u32 %rs4058, %r8081; - st.local.v2.u8 [%rd12+8], {%rs4058, %rs4057}; - cvt.u16.u32 %rs4059, %r9149; - cvt.u16.u32 %rs4060, %r8083; - st.local.v2.u8 [%rd12+10], {%rs4059, %rs4060}; - cvt.u16.u32 %rs4061, %r8085; - cvt.u16.u32 %rs4062, %r8084; - st.local.v2.u8 [%rd12+12], {%rs4062, %rs4061}; - cvt.u16.u32 %rs4063, %r9148; - cvt.u16.u32 %rs4064, %r8086; - st.local.v2.u8 [%rd12+14], {%rs4063, %rs4064}; - cvt.u16.u32 %rs4065, %r8088; - cvt.u16.u32 %rs4066, %r8087; - st.local.v2.u8 [%rd12+16], {%rs4066, %rs4065}; - st.local.v2.u8 [%rd12+18], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+20], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+22], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+24], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+26], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+28], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+30], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+32], {%rs3804, %rs3804}; 
- st.local.v2.u8 [%rd12+34], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+36], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+38], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+40], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+42], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+44], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+46], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+48], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+50], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+52], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+54], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+56], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+58], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+60], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+62], {%rs3804, %rs3804}; - st.local.v2.u8 [%rd12+64], {%rs3804, %rs3804}; - -$L__BB1_549: - ret; - -$L__BB1_376: - { // callseq 37, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 37 - -$L__BB1_304: - { // callseq 33, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 33 - -$L__BB1_357: - { // callseq 36, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 36 - -$L__BB1_285: - { // callseq 32, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 32 - -$L__BB1_395: - { // callseq 38, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 38 - -$L__BB1_323: - { // callseq 34, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 34 - -$L__BB1_197: - { // callseq 19, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 19 - -$L__BB1_208: - setp.gt.u16 %p141, %rs1, 10; - @%p141 bra $L__BB1_210; - bra.uni 
$L__BB1_209; - -$L__BB1_210: - { // callseq 23, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 23 - -$L__BB1_21: - setp.gt.u16 %p140, %rs1, 10; - @%p140 bra $L__BB1_207; - bra.uni $L__BB1_22; - -$L__BB1_207: - { // callseq 22, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 22 - -$L__BB1_148: - { // callseq 16, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 16 - -$L__BB1_100: - { // callseq 13, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 13 - -$L__BB1_209: - trap; - -$L__BB1_22: - trap; - -$L__BB1_534: - { // callseq 45, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 45 - -$L__BB1_512: - { // callseq 44, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 44 - -$L__BB1_454: - { // callseq 41, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 41 - -$L__BB1_432: - { // callseq 40, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 40 - -$L__BB1_56: - { // callseq 10, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 10 - -$L__BB1_206: - { // callseq 21, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 21 - -$L__BB1_205: - { // callseq 20, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index26slice_start_index_len_fail17h31c4387487c2b57aE, - ( - ); - } // callseq 20 - -$L__BB1_203: - st.local.u8 [%rd1+344], %rs2264; - 
-$L__BB1_204: - trap; - -$L__BB1_550: - { // callseq 47, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 47 - -$L__BB1_488: - trap; - -$L__BB1_541: - { // callseq 46, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 46 - -$L__BB1_227: - { // callseq 27, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 27 - -$L__BB1_215: - trap; - -$L__BB1_398: - { // callseq 39, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 39 - -$L__BB1_331: - trap; - -$L__BB1_469: - { // callseq 43, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 43 - -$L__BB1_408: - trap; - -$L__BB1_461: - { // callseq 42, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 42 - -$L__BB1_249: - { // callseq 31, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 31 - -$L__BB1_237: - trap; - -$L__BB1_326: - { // callseq 35, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 35 - -$L__BB1_259: - trap; - -$L__BB1_65: - { // callseq 12, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 12 - -$L__BB1_64: - { // callseq 11, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index26slice_start_index_len_fail17h31c4387487c2b57aE, - ( - ); - } // callseq 11 - -$L__BB1_62: - st.local.u8 [%rd1+272], %rs1383; - -$L__BB1_63: - trap; - -$L__BB1_109: - { // callseq 15, 0 - .reg .b32 
temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 15 - -$L__BB1_108: - { // callseq 14, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index26slice_start_index_len_fail17h31c4387487c2b57aE, - ( - ); - } // callseq 14 - -$L__BB1_106: - st.local.u8 [%rd1+304], %rs1623; - -$L__BB1_107: - trap; - -$L__BB1_157: - { // callseq 18, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E, - ( - ); - } // callseq 18 - -$L__BB1_156: - { // callseq 17, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core5slice5index26slice_start_index_len_fail17h31c4387487c2b57aE, - ( - ); - } // callseq 17 - -$L__BB1_154: - st.local.u8 [%rd1+336], %rs1918; - -$L__BB1_155: - trap; - -$L__BB1_482: - trap; - -} -.func _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE( - .param .b64 _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE_param_0, - .param .b64 _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE_param_1, - .param .b64 _ZN4sha26sha25611compress25617h9eb7f017ff169f1fE_param_2 -) -{ - .reg .pred %p<20>; - .reg .b16 %rs<161>; - .reg .b32 %r<3457>; - .reg .b64 %rd<1429>; - - - ld.param.u64 %rd8, [_ZN4sha26sha25611compress25617h9eb7f017ff169f1fE_param_0]; - ld.param.u64 %rd9, [_ZN4sha26sha25611compress25617h9eb7f017ff169f1fE_param_1]; - ld.param.u64 %rd10, [_ZN4sha26sha25611compress25617h9eb7f017ff169f1fE_param_2]; - cvta.to.local.u64 %rd1, %rd8; - ld.local.u32 %r3448, [%rd1]; - ld.local.u32 %r3447, [%rd1+4]; - ld.local.u32 %r3446, [%rd1+8]; - ld.local.u32 %r3445, [%rd1+12]; - ld.local.u32 %r3444, [%rd1+16]; - ld.local.u32 %r3443, [%rd1+20]; - ld.local.u32 %r3442, [%rd1+24]; - ld.local.u32 %r3441, [%rd1+28]; - cvta.to.local.u64 %rd1428, %rd9; - shl.b64 %rd11, %rd10, 6; - add.s64 %rd3, %rd1428, %rd11; - setp.eq.s64 %p1, %rd1428, %rd3; - @%p1 bra $L__BB2_20; - - mov.pred %p2, 0; - -$L__BB2_2: - ld.local.u8 %rd12, [%rd1428]; - ld.local.u8 %rd13, [%rd1428+1]; - 
bfi.b64 %rd14, %rd13, %rd12, 8, 8; - ld.local.u8 %rd15, [%rd1428+2]; - ld.local.u8 %rd16, [%rd1428+3]; - bfi.b64 %rd17, %rd16, %rd15, 8, 56; - bfi.b64 %rd18, %rd17, %rd14, 16, 48; - shl.b64 %rd19, %rd18, 8; - mov.b64 {%r33, %r34}, %rd19; - mov.b32 {%rs5, %rs81}, %r34; - mov.b32 {%rs1, %rs3}, %r33; - shr.u16 %rs4, %rs3, 8; - shr.u16 %rs2, %rs1, 8; - @%p2 bra $L__BB2_18; - - ld.local.u8 %rd20, [%rd1428+4]; - ld.local.u8 %rd21, [%rd1428+5]; - bfi.b64 %rd22, %rd21, %rd20, 8, 8; - ld.local.u8 %rd23, [%rd1428+6]; - ld.local.u8 %rd24, [%rd1428+7]; - bfi.b64 %rd25, %rd24, %rd23, 8, 56; - bfi.b64 %rd26, %rd25, %rd22, 16, 48; - shl.b64 %rd27, %rd26, 8; - mov.b64 {%r35, %r36}, %rd27; - mov.b32 {%rs10, %rs82}, %r36; - mov.b32 {%rs6, %rs8}, %r35; - shr.u16 %rs9, %rs8, 8; - shr.u16 %rs7, %rs6, 8; - @%p2 bra $L__BB2_18; - - ld.local.u8 %rd28, [%rd1428+8]; - ld.local.u8 %rd29, [%rd1428+9]; - bfi.b64 %rd30, %rd29, %rd28, 8, 8; - ld.local.u8 %rd31, [%rd1428+10]; - ld.local.u8 %rd32, [%rd1428+11]; - bfi.b64 %rd33, %rd32, %rd31, 8, 56; - bfi.b64 %rd34, %rd33, %rd30, 16, 48; - shl.b64 %rd35, %rd34, 8; - mov.b64 {%r37, %r38}, %rd35; - mov.b32 {%rs15, %rs83}, %r38; - mov.b32 {%rs11, %rs13}, %r37; - shr.u16 %rs14, %rs13, 8; - shr.u16 %rs12, %rs11, 8; - @%p2 bra $L__BB2_18; - - ld.local.u8 %rd36, [%rd1428+12]; - ld.local.u8 %rd37, [%rd1428+13]; - bfi.b64 %rd38, %rd37, %rd36, 8, 8; - ld.local.u8 %rd39, [%rd1428+14]; - ld.local.u8 %rd40, [%rd1428+15]; - bfi.b64 %rd41, %rd40, %rd39, 8, 56; - bfi.b64 %rd42, %rd41, %rd38, 16, 48; - shl.b64 %rd43, %rd42, 8; - mov.b64 {%r39, %r40}, %rd43; - mov.b32 {%rs20, %rs84}, %r40; - mov.b32 {%rs16, %rs18}, %r39; - shr.u16 %rs19, %rs18, 8; - shr.u16 %rs17, %rs16, 8; - @%p2 bra $L__BB2_18; - - ld.local.u8 %rd44, [%rd1428+16]; - ld.local.u8 %rd45, [%rd1428+17]; - bfi.b64 %rd46, %rd45, %rd44, 8, 8; - ld.local.u8 %rd47, [%rd1428+18]; - ld.local.u8 %rd48, [%rd1428+19]; - bfi.b64 %rd49, %rd48, %rd47, 8, 56; - bfi.b64 %rd50, %rd49, %rd46, 16, 48; - shl.b64 %rd51, 
%rd50, 8; - mov.b64 {%r41, %r42}, %rd51; - mov.b32 {%rs25, %rs85}, %r42; - mov.b32 {%rs21, %rs23}, %r41; - shr.u16 %rs24, %rs23, 8; - shr.u16 %rs22, %rs21, 8; - @%p2 bra $L__BB2_18; - - ld.local.u8 %rd52, [%rd1428+20]; - ld.local.u8 %rd53, [%rd1428+21]; - bfi.b64 %rd54, %rd53, %rd52, 8, 8; - ld.local.u8 %rd55, [%rd1428+22]; - ld.local.u8 %rd56, [%rd1428+23]; - bfi.b64 %rd57, %rd56, %rd55, 8, 56; - bfi.b64 %rd58, %rd57, %rd54, 16, 48; - shl.b64 %rd59, %rd58, 8; - mov.b64 {%r43, %r44}, %rd59; - mov.b32 {%rs30, %rs86}, %r44; - mov.b32 {%rs26, %rs28}, %r43; - shr.u16 %rs29, %rs28, 8; - shr.u16 %rs27, %rs26, 8; - @%p2 bra $L__BB2_18; - - ld.local.u8 %rd60, [%rd1428+24]; - ld.local.u8 %rd61, [%rd1428+25]; - bfi.b64 %rd62, %rd61, %rd60, 8, 8; - ld.local.u8 %rd63, [%rd1428+26]; - ld.local.u8 %rd64, [%rd1428+27]; - bfi.b64 %rd65, %rd64, %rd63, 8, 56; - bfi.b64 %rd66, %rd65, %rd62, 16, 48; - shl.b64 %rd67, %rd66, 8; - mov.b64 {%r45, %r46}, %rd67; - mov.b32 {%rs35, %rs87}, %r46; - mov.b32 {%rs31, %rs33}, %r45; - shr.u16 %rs34, %rs33, 8; - shr.u16 %rs32, %rs31, 8; - @%p2 bra $L__BB2_18; - - ld.local.u8 %rd68, [%rd1428+28]; - ld.local.u8 %rd69, [%rd1428+29]; - bfi.b64 %rd70, %rd69, %rd68, 8, 8; - ld.local.u8 %rd71, [%rd1428+30]; - ld.local.u8 %rd72, [%rd1428+31]; - bfi.b64 %rd73, %rd72, %rd71, 8, 56; - bfi.b64 %rd74, %rd73, %rd70, 16, 48; - shl.b64 %rd75, %rd74, 8; - mov.b64 {%r47, %r48}, %rd75; - mov.b32 {%rs40, %rs88}, %r48; - mov.b32 {%rs36, %rs38}, %r47; - shr.u16 %rs39, %rs38, 8; - shr.u16 %rs37, %rs36, 8; - @%p2 bra $L__BB2_18; - - ld.local.u8 %rd76, [%rd1428+32]; - ld.local.u8 %rd77, [%rd1428+33]; - bfi.b64 %rd78, %rd77, %rd76, 8, 8; - ld.local.u8 %rd79, [%rd1428+34]; - ld.local.u8 %rd80, [%rd1428+35]; - bfi.b64 %rd81, %rd80, %rd79, 8, 56; - bfi.b64 %rd82, %rd81, %rd78, 16, 48; - shl.b64 %rd83, %rd82, 8; - mov.b64 {%r49, %r50}, %rd83; - mov.b32 {%rs45, %rs89}, %r50; - mov.b32 {%rs41, %rs43}, %r49; - shr.u16 %rs44, %rs43, 8; - shr.u16 %rs42, %rs41, 8; - @%p2 bra 
$L__BB2_18; - - ld.local.u8 %rd84, [%rd1428+36]; - ld.local.u8 %rd85, [%rd1428+37]; - bfi.b64 %rd86, %rd85, %rd84, 8, 8; - ld.local.u8 %rd87, [%rd1428+38]; - ld.local.u8 %rd88, [%rd1428+39]; - bfi.b64 %rd89, %rd88, %rd87, 8, 56; - bfi.b64 %rd90, %rd89, %rd86, 16, 48; - shl.b64 %rd91, %rd90, 8; - mov.b64 {%r51, %r52}, %rd91; - mov.b32 {%rs50, %rs90}, %r52; - mov.b32 {%rs46, %rs48}, %r51; - shr.u16 %rs49, %rs48, 8; - shr.u16 %rs47, %rs46, 8; - @%p2 bra $L__BB2_18; - - ld.local.u8 %rd92, [%rd1428+40]; - ld.local.u8 %rd93, [%rd1428+41]; - bfi.b64 %rd94, %rd93, %rd92, 8, 8; - ld.local.u8 %rd95, [%rd1428+42]; - ld.local.u8 %rd96, [%rd1428+43]; - bfi.b64 %rd97, %rd96, %rd95, 8, 56; - bfi.b64 %rd98, %rd97, %rd94, 16, 48; - shl.b64 %rd99, %rd98, 8; - mov.b64 {%r53, %r54}, %rd99; - mov.b32 {%rs55, %rs91}, %r54; - mov.b32 {%rs51, %rs53}, %r53; - shr.u16 %rs54, %rs53, 8; - shr.u16 %rs52, %rs51, 8; - @%p2 bra $L__BB2_18; - - ld.local.u8 %rd100, [%rd1428+44]; - ld.local.u8 %rd101, [%rd1428+45]; - bfi.b64 %rd102, %rd101, %rd100, 8, 8; - ld.local.u8 %rd103, [%rd1428+46]; - ld.local.u8 %rd104, [%rd1428+47]; - bfi.b64 %rd105, %rd104, %rd103, 8, 56; - bfi.b64 %rd106, %rd105, %rd102, 16, 48; - shl.b64 %rd107, %rd106, 8; - mov.b64 {%r55, %r56}, %rd107; - mov.b32 {%rs60, %rs92}, %r56; - mov.b32 {%rs56, %rs58}, %r55; - shr.u16 %rs59, %rs58, 8; - shr.u16 %rs57, %rs56, 8; - @%p2 bra $L__BB2_18; - - ld.local.u8 %rd108, [%rd1428+48]; - ld.local.u8 %rd109, [%rd1428+49]; - bfi.b64 %rd110, %rd109, %rd108, 8, 8; - ld.local.u8 %rd111, [%rd1428+50]; - ld.local.u8 %rd112, [%rd1428+51]; - bfi.b64 %rd113, %rd112, %rd111, 8, 56; - bfi.b64 %rd114, %rd113, %rd110, 16, 48; - shl.b64 %rd115, %rd114, 8; - mov.b64 {%r57, %r58}, %rd115; - mov.b32 {%rs65, %rs93}, %r58; - mov.b32 {%rs61, %rs63}, %r57; - shr.u16 %rs64, %rs63, 8; - shr.u16 %rs62, %rs61, 8; - @%p2 bra $L__BB2_18; - - ld.local.u8 %rd116, [%rd1428+52]; - ld.local.u8 %rd117, [%rd1428+53]; - bfi.b64 %rd118, %rd117, %rd116, 8, 8; - ld.local.u8 %rd119, 
[%rd1428+54]; - ld.local.u8 %rd120, [%rd1428+55]; - bfi.b64 %rd121, %rd120, %rd119, 8, 56; - bfi.b64 %rd122, %rd121, %rd118, 16, 48; - shl.b64 %rd123, %rd122, 8; - mov.b64 {%r59, %r60}, %rd123; - mov.b32 {%rs70, %rs94}, %r60; - mov.b32 {%rs66, %rs68}, %r59; - shr.u16 %rs69, %rs68, 8; - shr.u16 %rs67, %rs66, 8; - @%p2 bra $L__BB2_18; - - ld.local.u8 %rd124, [%rd1428+56]; - ld.local.u8 %rd125, [%rd1428+57]; - bfi.b64 %rd126, %rd125, %rd124, 8, 8; - ld.local.u8 %rd127, [%rd1428+58]; - ld.local.u8 %rd128, [%rd1428+59]; - bfi.b64 %rd129, %rd128, %rd127, 8, 56; - bfi.b64 %rd130, %rd129, %rd126, 16, 48; - shl.b64 %rd131, %rd130, 8; - mov.b64 {%r61, %r62}, %rd131; - mov.b32 {%rs75, %rs95}, %r62; - mov.b32 {%rs71, %rs73}, %r61; - shr.u16 %rs74, %rs73, 8; - shr.u16 %rs72, %rs71, 8; - @%p2 bra $L__BB2_18; - - mov.pred %p19, -1; - ld.local.u8 %rd132, [%rd1428+60]; - ld.local.u8 %rd133, [%rd1428+61]; - bfi.b64 %rd134, %rd133, %rd132, 8, 8; - ld.local.u8 %rd135, [%rd1428+62]; - ld.local.u8 %rd136, [%rd1428+63]; - bfi.b64 %rd137, %rd136, %rd135, 8, 56; - bfi.b64 %rd138, %rd137, %rd134, 16, 48; - shl.b64 %rd139, %rd138, 8; - mov.b64 {%r63, %r64}, %rd139; - mov.b32 {%rs80, %rs96}, %r64; - mov.b32 {%rs76, %rs78}, %r63; - shr.u16 %rs79, %rs78, 8; - shr.u16 %rs77, %rs76, 8; - @%p19 bra $L__BB2_19; - bra.uni $L__BB2_18; - -$L__BB2_19: - add.s64 %rd1428, %rd1428, 64; - shl.b16 %rs97, %rs73, 8; - or.b16 %rs98, %rs72, %rs97; - shl.b16 %rs99, %rs75, 8; - or.b16 %rs100, %rs74, %rs99; - mov.b32 %r65, {%rs98, %rs100}; - shr.u32 %r66, %r65, 24; - shr.u32 %r67, %r65, 8; - and.b32 %r68, %r67, 65280; - or.b32 %r69, %r68, %r66; - shl.b32 %r70, %r65, 24; - shl.b32 %r71, %r65, 8; - and.b32 %r72, %r71, 16711680; - or.b32 %r73, %r70, %r72; - or.b32 %r74, %r73, %r69; - shl.b16 %rs101, %rs78, 8; - or.b16 %rs102, %rs77, %rs101; - shl.b16 %rs103, %rs80, 8; - or.b16 %rs104, %rs79, %rs103; - mov.b32 %r75, {%rs102, %rs104}; - shr.u32 %r76, %r75, 24; - shr.u32 %r77, %r75, 8; - and.b32 %r78, %r77, 65280; - 
or.b32 %r79, %r78, %r76; - shl.b32 %r80, %r75, 24; - shl.b32 %r81, %r75, 8; - and.b32 %r82, %r81, 16711680; - or.b32 %r83, %r80, %r82; - or.b32 %r84, %r83, %r79; - shl.b16 %rs105, %rs3, 8; - or.b16 %rs106, %rs2, %rs105; - shl.b16 %rs107, %rs5, 8; - or.b16 %rs108, %rs4, %rs107; - mov.b32 %r85, {%rs106, %rs108}; - shr.u32 %r86, %r85, 24; - shr.u32 %r87, %r85, 8; - and.b32 %r88, %r87, 65280; - or.b32 %r89, %r88, %r86; - shl.b32 %r90, %r85, 24; - shl.b32 %r91, %r85, 8; - and.b32 %r92, %r91, 16711680; - or.b32 %r93, %r90, %r92; - or.b32 %r94, %r93, %r89; - cvt.u64.u32 %rd140, %r94; - shl.b16 %rs109, %rs8, 8; - or.b16 %rs110, %rs7, %rs109; - shl.b16 %rs111, %rs10, 8; - or.b16 %rs112, %rs9, %rs111; - mov.b32 %r95, {%rs110, %rs112}; - shr.u32 %r96, %r95, 24; - shr.u32 %r97, %r95, 8; - and.b32 %r98, %r97, 65280; - or.b32 %r99, %r98, %r96; - shl.b32 %r100, %r95, 24; - shl.b32 %r101, %r95, 8; - and.b32 %r102, %r101, 16711680; - or.b32 %r103, %r100, %r102; - or.b32 %r104, %r103, %r99; - shl.b16 %rs113, %rs13, 8; - or.b16 %rs114, %rs12, %rs113; - shl.b16 %rs115, %rs15, 8; - or.b16 %rs116, %rs14, %rs115; - mov.b32 %r105, {%rs114, %rs116}; - shr.u32 %r106, %r105, 24; - shr.u32 %r107, %r105, 8; - and.b32 %r108, %r107, 65280; - or.b32 %r109, %r108, %r106; - shl.b32 %r110, %r105, 24; - shl.b32 %r111, %r105, 8; - and.b32 %r112, %r111, 16711680; - or.b32 %r113, %r110, %r112; - or.b32 %r114, %r113, %r109; - cvt.u64.u32 %rd141, %r114; - shl.b16 %rs117, %rs18, 8; - or.b16 %rs118, %rs17, %rs117; - shl.b16 %rs119, %rs20, 8; - or.b16 %rs120, %rs19, %rs119; - mov.b32 %r115, {%rs118, %rs120}; - shr.u32 %r116, %r115, 24; - shr.u32 %r117, %r115, 8; - and.b32 %r118, %r117, 65280; - or.b32 %r119, %r118, %r116; - shl.b32 %r120, %r115, 24; - shl.b32 %r121, %r115, 8; - and.b32 %r122, %r121, 16711680; - or.b32 %r123, %r120, %r122; - or.b32 %r124, %r123, %r119; - cvt.u64.u32 %rd142, %r124; - cvt.u64.u32 %rd143, %r104; - bfi.b64 %rd144, %rd140, %rd143, 32, 32; - bfi.b64 %rd145, %rd141, %rd142, 32, 32; 
- mov.b64 {%r125, %r126}, %rd145; - mov.b64 {%r127, %r128}, %rd144; - add.s32 %r129, %r125, -373957723; - add.s32 %r130, %r126, -1245643825; - add.s32 %r131, %r127, 1899447441; - add.s32 %r132, %r128, 1116352408; - cvt.u64.u32 %rd146, %r132; - cvt.u64.u32 %rd147, %r130; - cvt.u64.u32 %rd148, %r131; - cvt.u64.u32 %rd149, %r129; - bfi.b64 %rd150, %rd147, %rd149, 32, 32; - bfi.b64 %rd151, %rd146, %rd148, 32, 32; - cvt.u64.u32 %rd152, %r3441; - cvt.u64.u32 %rd153, %r3442; - cvt.u64.u32 %rd154, %r3445; - cvt.u64.u32 %rd155, %r3446; - bfi.b64 %rd156, %rd152, %rd153, 32, 32; - bfi.b64 %rd157, %rd154, %rd155, 32, 32; - cvt.u64.u32 %rd158, %r3443; - cvt.u64.u32 %rd159, %r3444; - cvt.u64.u32 %rd160, %r3447; - cvt.u64.u32 %rd161, %r3448; - bfi.b64 %rd162, %rd158, %rd159, 32, 32; - bfi.b64 %rd163, %rd160, %rd161, 32, 32; - mov.b64 {%r133, %r134}, %rd157; - mov.b64 {%r135, %r136}, %rd156; - mov.b64 {%r137, %r138}, %rd163; - mov.b64 {%r139, %r140}, %rd162; - mov.b64 {%r141, %r142}, %rd151; - shf.r.wrap.b32 %r143, %r139, %r139, 6; - shf.r.wrap.b32 %r144, %r139, %r139, 11; - xor.b32 %r145, %r143, %r144; - shf.r.wrap.b32 %r146, %r139, %r139, 25; - xor.b32 %r147, %r145, %r146; - xor.b32 %r148, %r140, %r135; - and.b32 %r149, %r148, %r139; - xor.b32 %r150, %r149, %r135; - add.s32 %r151, %r147, %r136; - add.s32 %r152, %r151, %r150; - add.s32 %r153, %r152, %r142; - shf.r.wrap.b32 %r154, %r137, %r137, 2; - shf.r.wrap.b32 %r155, %r137, %r137, 13; - xor.b32 %r156, %r154, %r155; - shf.r.wrap.b32 %r157, %r137, %r137, 22; - xor.b32 %r158, %r156, %r157; - and.b32 %r159, %r138, %r137; - and.b32 %r160, %r3448, %r3446; - xor.b32 %r161, %r160, %r159; - and.b32 %r162, %r138, %r133; - xor.b32 %r163, %r161, %r162; - add.s32 %r164, %r163, %r158; - add.s32 %r165, %r164, %r153; - add.s32 %r166, %r153, %r134; - shf.r.wrap.b32 %r167, %r166, %r166, 6; - shf.r.wrap.b32 %r168, %r166, %r166, 11; - xor.b32 %r169, %r167, %r168; - shf.r.wrap.b32 %r170, %r166, %r166, 25; - xor.b32 %r171, %r169, %r170; - xor.b32 
%r172, %r140, %r139; - and.b32 %r173, %r166, %r172; - xor.b32 %r174, %r173, %r140; - add.s32 %r175, %r141, %r135; - add.s32 %r176, %r175, %r174; - add.s32 %r177, %r176, %r171; - shf.r.wrap.b32 %r178, %r165, %r165, 2; - shf.r.wrap.b32 %r179, %r165, %r165, 13; - xor.b32 %r180, %r178, %r179; - shf.r.wrap.b32 %r181, %r165, %r165, 22; - xor.b32 %r182, %r180, %r181; - xor.b32 %r183, %r138, %r137; - and.b32 %r184, %r165, %r183; - xor.b32 %r185, %r184, %r159; - add.s32 %r186, %r182, %r185; - add.s32 %r187, %r177, %r133; - cvt.u64.u32 %rd164, %r166; - cvt.u64.u32 %rd165, %r187; - cvt.u64.u32 %rd166, %r165; - bfi.b64 %rd167, %rd164, %rd165, 32, 32; - add.s32 %r188, %r186, %r177; - cvt.u64.u32 %rd168, %r188; - bfi.b64 %rd169, %rd166, %rd168, 32, 32; - mov.b64 {%r189, %r190}, %rd169; - mov.b64 {%r191, %r192}, %rd167; - mov.b64 {%r193, %r194}, %rd150; - cvt.u64.u32 %rd170, %r194; - bfi.b64 %rd171, %rd170, %rd149, 32, 32; - cvt.u64.u32 %rd172, %r192; - cvt.u64.u32 %rd173, %r190; - cvt.u64.u32 %rd174, %r191; - bfi.b64 %rd175, %rd172, %rd174, 32, 32; - bfi.b64 %rd176, %rd173, %rd168, 32, 32; - mov.b64 {%r195, %r196}, %rd176; - mov.b64 {%r197, %r198}, %rd175; - mov.b64 {%r199, %r200}, %rd171; - shf.r.wrap.b32 %r201, %r197, %r197, 6; - shf.r.wrap.b32 %r202, %r197, %r197, 11; - xor.b32 %r203, %r201, %r202; - shf.r.wrap.b32 %r204, %r197, %r197, 25; - xor.b32 %r205, %r203, %r204; - xor.b32 %r206, %r198, %r139; - and.b32 %r207, %r206, %r197; - xor.b32 %r208, %r207, %r139; - add.s32 %r209, %r200, %r140; - add.s32 %r210, %r209, %r205; - add.s32 %r211, %r210, %r208; - shf.r.wrap.b32 %r212, %r195, %r195, 2; - shf.r.wrap.b32 %r213, %r195, %r195, 13; - xor.b32 %r214, %r212, %r213; - shf.r.wrap.b32 %r215, %r195, %r195, 22; - xor.b32 %r216, %r214, %r215; - and.b32 %r217, %r196, %r195; - and.b32 %r218, %r188, %r3448; - xor.b32 %r219, %r217, %r218; - and.b32 %r220, %r196, %r137; - xor.b32 %r221, %r219, %r220; - add.s32 %r222, %r221, %r216; - add.s32 %r223, %r222, %r211; - add.s32 %r224, %r211, 
%r138; - shf.r.wrap.b32 %r225, %r224, %r224, 6; - shf.r.wrap.b32 %r226, %r224, %r224, 11; - xor.b32 %r227, %r225, %r226; - shf.r.wrap.b32 %r228, %r224, %r224, 25; - xor.b32 %r229, %r227, %r228; - xor.b32 %r230, %r198, %r197; - and.b32 %r231, %r224, %r230; - xor.b32 %r232, %r231, %r198; - add.s32 %r233, %r199, %r139; - add.s32 %r234, %r233, %r232; - add.s32 %r235, %r234, %r229; - shf.r.wrap.b32 %r236, %r223, %r223, 2; - shf.r.wrap.b32 %r237, %r223, %r223, 13; - xor.b32 %r238, %r236, %r237; - shf.r.wrap.b32 %r239, %r223, %r223, 22; - xor.b32 %r240, %r238, %r239; - xor.b32 %r241, %r196, %r195; - and.b32 %r242, %r223, %r241; - xor.b32 %r243, %r242, %r217; - add.s32 %r244, %r240, %r243; - add.s32 %r245, %r235, %r137; - cvt.u64.u32 %rd177, %r224; - cvt.u64.u32 %rd178, %r245; - cvt.u64.u32 %rd179, %r223; - add.s32 %r246, %r244, %r235; - cvt.u64.u32 %rd180, %r246; - bfi.b64 %rd181, %rd179, %rd180, 32, 32; - bfi.b64 %rd182, %rd177, %rd178, 32, 32; - mov.b64 {%r247, %r248}, %rd181; - mov.b64 {%r249, %r250}, %rd182; - shl.b16 %rs121, %rs23, 8; - or.b16 %rs122, %rs22, %rs121; - shl.b16 %rs123, %rs25, 8; - or.b16 %rs124, %rs24, %rs123; - mov.b32 %r251, {%rs122, %rs124}; - shr.u32 %r252, %r251, 24; - shr.u32 %r253, %r251, 8; - and.b32 %r254, %r253, 65280; - or.b32 %r255, %r254, %r252; - shl.b32 %r256, %r251, 24; - shl.b32 %r257, %r251, 8; - and.b32 %r258, %r257, 16711680; - or.b32 %r259, %r256, %r258; - or.b32 %r260, %r259, %r255; - cvt.u64.u32 %rd183, %r260; - shl.b16 %rs125, %rs28, 8; - or.b16 %rs126, %rs27, %rs125; - shl.b16 %rs127, %rs30, 8; - or.b16 %rs128, %rs29, %rs127; - mov.b32 %r261, {%rs126, %rs128}; - shr.u32 %r262, %r261, 24; - shr.u32 %r263, %r261, 8; - and.b32 %r264, %r263, 65280; - or.b32 %r265, %r264, %r262; - shl.b32 %r266, %r261, 24; - shl.b32 %r267, %r261, 8; - and.b32 %r268, %r267, 16711680; - or.b32 %r269, %r266, %r268; - or.b32 %r270, %r269, %r265; - shl.b16 %rs129, %rs33, 8; - or.b16 %rs130, %rs32, %rs129; - shl.b16 %rs131, %rs35, 8; - or.b16 %rs132, 
%rs34, %rs131; - mov.b32 %r271, {%rs130, %rs132}; - shr.u32 %r272, %r271, 24; - shr.u32 %r273, %r271, 8; - and.b32 %r274, %r273, 65280; - or.b32 %r275, %r274, %r272; - shl.b32 %r276, %r271, 24; - shl.b32 %r277, %r271, 8; - and.b32 %r278, %r277, 16711680; - or.b32 %r279, %r276, %r278; - or.b32 %r280, %r279, %r275; - cvt.u64.u32 %rd184, %r280; - shl.b16 %rs133, %rs38, 8; - or.b16 %rs134, %rs37, %rs133; - shl.b16 %rs135, %rs40, 8; - or.b16 %rs136, %rs39, %rs135; - mov.b32 %r281, {%rs134, %rs136}; - shr.u32 %r282, %r281, 24; - shr.u32 %r283, %r281, 8; - and.b32 %r284, %r283, 65280; - or.b32 %r285, %r284, %r282; - shl.b32 %r286, %r281, 24; - shl.b32 %r287, %r281, 8; - and.b32 %r288, %r287, 16711680; - or.b32 %r289, %r286, %r288; - or.b32 %r290, %r289, %r285; - cvt.u64.u32 %rd185, %r290; - cvt.u64.u32 %rd186, %r270; - bfi.b64 %rd187, %rd183, %rd186, 32, 32; - bfi.b64 %rd188, %rd184, %rd185, 32, 32; - mov.b64 {%r291, %r292}, %rd188; - mov.b64 {%r293, %r294}, %rd187; - add.s32 %r295, %r291, -1424204075; - add.s32 %r296, %r292, -1841331548; - add.s32 %r297, %r293, 1508970993; - add.s32 %r298, %r294, 961987163; - cvt.u64.u32 %rd189, %r298; - cvt.u64.u32 %rd190, %r296; - cvt.u64.u32 %rd191, %r297; - cvt.u64.u32 %rd192, %r295; - bfi.b64 %rd193, %rd190, %rd192, 32, 32; - bfi.b64 %rd194, %rd189, %rd191, 32, 32; - cvt.u64.u32 %rd195, %r250; - cvt.u64.u32 %rd196, %r248; - cvt.u64.u32 %rd197, %r249; - bfi.b64 %rd198, %rd196, %rd180, 32, 32; - bfi.b64 %rd199, %rd195, %rd197, 32, 32; - mov.b64 {%r299, %r300}, %rd198; - mov.b64 {%r301, %r302}, %rd199; - mov.b64 {%r303, %r304}, %rd194; - shf.r.wrap.b32 %r305, %r301, %r301, 6; - shf.r.wrap.b32 %r306, %r301, %r301, 11; - xor.b32 %r307, %r305, %r306; - shf.r.wrap.b32 %r308, %r301, %r301, 25; - xor.b32 %r309, %r307, %r308; - xor.b32 %r310, %r302, %r197; - and.b32 %r311, %r310, %r301; - xor.b32 %r312, %r311, %r197; - add.s32 %r313, %r198, %r304; - add.s32 %r314, %r313, %r309; - add.s32 %r315, %r314, %r312; - shf.r.wrap.b32 %r316, %r299, 
%r299, 2; - shf.r.wrap.b32 %r317, %r299, %r299, 13; - xor.b32 %r318, %r316, %r317; - shf.r.wrap.b32 %r319, %r299, %r299, 22; - xor.b32 %r320, %r318, %r319; - and.b32 %r321, %r300, %r299; - and.b32 %r322, %r246, %r188; - xor.b32 %r323, %r321, %r322; - and.b32 %r324, %r300, %r195; - xor.b32 %r325, %r323, %r324; - add.s32 %r326, %r325, %r320; - add.s32 %r327, %r326, %r315; - add.s32 %r328, %r315, %r196; - shf.r.wrap.b32 %r329, %r328, %r328, 6; - shf.r.wrap.b32 %r330, %r328, %r328, 11; - xor.b32 %r331, %r329, %r330; - shf.r.wrap.b32 %r332, %r328, %r328, 25; - xor.b32 %r333, %r331, %r332; - xor.b32 %r334, %r302, %r301; - and.b32 %r335, %r328, %r334; - xor.b32 %r336, %r335, %r302; - add.s32 %r337, %r197, %r303; - add.s32 %r338, %r337, %r336; - add.s32 %r339, %r338, %r333; - shf.r.wrap.b32 %r340, %r327, %r327, 2; - shf.r.wrap.b32 %r341, %r327, %r327, 13; - xor.b32 %r342, %r340, %r341; - shf.r.wrap.b32 %r343, %r327, %r327, 22; - xor.b32 %r344, %r342, %r343; - xor.b32 %r345, %r300, %r299; - and.b32 %r346, %r327, %r345; - xor.b32 %r347, %r346, %r321; - add.s32 %r348, %r344, %r347; - add.s32 %r349, %r339, %r195; - cvt.u64.u32 %rd200, %r328; - cvt.u64.u32 %rd201, %r349; - cvt.u64.u32 %rd202, %r327; - add.s32 %r350, %r348, %r339; - cvt.u64.u32 %rd203, %r350; - bfi.b64 %rd204, %rd202, %rd203, 32, 32; - bfi.b64 %rd205, %rd200, %rd201, 32, 32; - mov.b64 {%r351, %r352}, %rd204; - mov.b64 {%r353, %r354}, %rd205; - mov.b64 {%r355, %r356}, %rd193; - cvt.u64.u32 %rd206, %r356; - bfi.b64 %rd207, %rd206, %rd192, 32, 32; - cvt.u64.u32 %rd208, %r354; - cvt.u64.u32 %rd209, %r352; - cvt.u64.u32 %rd210, %r353; - bfi.b64 %rd211, %rd209, %rd203, 32, 32; - bfi.b64 %rd212, %rd208, %rd210, 32, 32; - mov.b64 {%r357, %r358}, %rd211; - mov.b64 {%r359, %r360}, %rd212; - mov.b64 {%r361, %r362}, %rd207; - shf.r.wrap.b32 %r363, %r359, %r359, 6; - shf.r.wrap.b32 %r364, %r359, %r359, 11; - xor.b32 %r365, %r363, %r364; - shf.r.wrap.b32 %r366, %r359, %r359, 25; - xor.b32 %r367, %r365, %r366; - xor.b32 %r368, 
%r360, %r301; - and.b32 %r369, %r368, %r359; - xor.b32 %r370, %r369, %r301; - add.s32 %r371, %r302, %r362; - add.s32 %r372, %r371, %r367; - add.s32 %r373, %r372, %r370; - shf.r.wrap.b32 %r374, %r357, %r357, 2; - shf.r.wrap.b32 %r375, %r357, %r357, 13; - xor.b32 %r376, %r374, %r375; - shf.r.wrap.b32 %r377, %r357, %r357, 22; - xor.b32 %r378, %r376, %r377; - and.b32 %r379, %r358, %r357; - and.b32 %r380, %r350, %r246; - xor.b32 %r381, %r379, %r380; - and.b32 %r382, %r358, %r299; - xor.b32 %r383, %r381, %r382; - add.s32 %r384, %r383, %r378; - add.s32 %r385, %r384, %r373; - add.s32 %r386, %r373, %r300; - shf.r.wrap.b32 %r387, %r386, %r386, 6; - shf.r.wrap.b32 %r388, %r386, %r386, 11; - xor.b32 %r389, %r387, %r388; - shf.r.wrap.b32 %r390, %r386, %r386, 25; - xor.b32 %r391, %r389, %r390; - xor.b32 %r392, %r360, %r359; - and.b32 %r393, %r386, %r392; - xor.b32 %r394, %r393, %r360; - add.s32 %r395, %r301, %r361; - add.s32 %r396, %r395, %r394; - add.s32 %r397, %r396, %r391; - shf.r.wrap.b32 %r398, %r385, %r385, 2; - shf.r.wrap.b32 %r399, %r385, %r385, 13; - xor.b32 %r400, %r398, %r399; - shf.r.wrap.b32 %r401, %r385, %r385, 22; - xor.b32 %r402, %r400, %r401; - xor.b32 %r403, %r358, %r357; - and.b32 %r404, %r385, %r403; - xor.b32 %r405, %r404, %r379; - add.s32 %r406, %r402, %r405; - add.s32 %r407, %r397, %r299; - cvt.u64.u32 %rd213, %r386; - cvt.u64.u32 %rd214, %r407; - cvt.u64.u32 %rd215, %r385; - add.s32 %r408, %r406, %r397; - cvt.u64.u32 %rd216, %r408; - bfi.b64 %rd217, %rd215, %rd216, 32, 32; - bfi.b64 %rd218, %rd213, %rd214, 32, 32; - mov.b64 {%r409, %r410}, %rd217; - mov.b64 {%r411, %r412}, %rd218; - shl.b16 %rs137, %rs43, 8; - or.b16 %rs138, %rs42, %rs137; - shl.b16 %rs139, %rs45, 8; - or.b16 %rs140, %rs44, %rs139; - mov.b32 %r413, {%rs138, %rs140}; - shr.u32 %r414, %r413, 24; - shr.u32 %r415, %r413, 8; - and.b32 %r416, %r415, 65280; - or.b32 %r417, %r416, %r414; - shl.b32 %r418, %r413, 24; - shl.b32 %r419, %r413, 8; - and.b32 %r420, %r419, 16711680; - or.b32 %r421, 
%r418, %r420; - or.b32 %r422, %r421, %r417; - cvt.u64.u32 %rd219, %r422; - shl.b16 %rs141, %rs48, 8; - or.b16 %rs142, %rs47, %rs141; - shl.b16 %rs143, %rs50, 8; - or.b16 %rs144, %rs49, %rs143; - mov.b32 %r423, {%rs142, %rs144}; - shr.u32 %r424, %r423, 24; - shr.u32 %r425, %r423, 8; - and.b32 %r426, %r425, 65280; - or.b32 %r427, %r426, %r424; - shl.b32 %r428, %r423, 24; - shl.b32 %r429, %r423, 8; - and.b32 %r430, %r429, 16711680; - or.b32 %r431, %r428, %r430; - or.b32 %r432, %r431, %r427; - shl.b16 %rs145, %rs53, 8; - or.b16 %rs146, %rs52, %rs145; - shl.b16 %rs147, %rs55, 8; - or.b16 %rs148, %rs54, %rs147; - mov.b32 %r433, {%rs146, %rs148}; - shr.u32 %r434, %r433, 24; - shr.u32 %r435, %r433, 8; - and.b32 %r436, %r435, 65280; - or.b32 %r437, %r436, %r434; - shl.b32 %r438, %r433, 24; - shl.b32 %r439, %r433, 8; - and.b32 %r440, %r439, 16711680; - or.b32 %r441, %r438, %r440; - or.b32 %r442, %r441, %r437; - cvt.u64.u32 %rd220, %r442; - shl.b16 %rs149, %rs58, 8; - or.b16 %rs150, %rs57, %rs149; - shl.b16 %rs151, %rs60, 8; - or.b16 %rs152, %rs59, %rs151; - mov.b32 %r443, {%rs150, %rs152}; - shr.u32 %r444, %r443, 24; - shr.u32 %r445, %r443, 8; - and.b32 %r446, %r445, 65280; - or.b32 %r447, %r446, %r444; - shl.b32 %r448, %r443, 24; - shl.b32 %r449, %r443, 8; - and.b32 %r450, %r449, 16711680; - or.b32 %r451, %r448, %r450; - or.b32 %r452, %r451, %r447; - cvt.u64.u32 %rd221, %r452; - cvt.u64.u32 %rd222, %r432; - bfi.b64 %rd223, %rd219, %rd222, 32, 32; - bfi.b64 %rd224, %rd220, %rd221, 32, 32; - mov.b64 {%r453, %r454}, %rd224; - mov.b64 {%r455, %r456}, %rd223; - add.s32 %r457, %r453, 1426881987; - add.s32 %r458, %r454, 607225278; - add.s32 %r459, %r455, 310598401; - add.s32 %r460, %r456, -670586216; - cvt.u64.u32 %rd225, %r460; - cvt.u64.u32 %rd226, %r458; - cvt.u64.u32 %rd227, %r459; - cvt.u64.u32 %rd228, %r457; - bfi.b64 %rd229, %rd226, %rd228, 32, 32; - bfi.b64 %rd230, %rd225, %rd227, 32, 32; - cvt.u64.u32 %rd231, %r412; - cvt.u64.u32 %rd232, %r410; - cvt.u64.u32 %rd233, 
%r411; - bfi.b64 %rd234, %rd232, %rd216, 32, 32; - bfi.b64 %rd235, %rd231, %rd233, 32, 32; - mov.b64 {%r461, %r462}, %rd234; - mov.b64 {%r463, %r464}, %rd235; - mov.b64 {%r465, %r466}, %rd230; - shf.r.wrap.b32 %r467, %r463, %r463, 6; - shf.r.wrap.b32 %r468, %r463, %r463, 11; - xor.b32 %r469, %r467, %r468; - shf.r.wrap.b32 %r470, %r463, %r463, 25; - xor.b32 %r471, %r469, %r470; - xor.b32 %r472, %r464, %r359; - and.b32 %r473, %r472, %r463; - xor.b32 %r474, %r473, %r359; - add.s32 %r475, %r360, %r466; - add.s32 %r476, %r475, %r471; - add.s32 %r477, %r476, %r474; - shf.r.wrap.b32 %r478, %r461, %r461, 2; - shf.r.wrap.b32 %r479, %r461, %r461, 13; - xor.b32 %r480, %r478, %r479; - shf.r.wrap.b32 %r481, %r461, %r461, 22; - xor.b32 %r482, %r480, %r481; - and.b32 %r483, %r462, %r461; - and.b32 %r484, %r408, %r350; - xor.b32 %r485, %r483, %r484; - and.b32 %r486, %r462, %r357; - xor.b32 %r487, %r485, %r486; - add.s32 %r488, %r487, %r482; - add.s32 %r489, %r488, %r477; - add.s32 %r490, %r477, %r358; - shf.r.wrap.b32 %r491, %r490, %r490, 6; - shf.r.wrap.b32 %r492, %r490, %r490, 11; - xor.b32 %r493, %r491, %r492; - shf.r.wrap.b32 %r494, %r490, %r490, 25; - xor.b32 %r495, %r493, %r494; - xor.b32 %r496, %r464, %r463; - and.b32 %r497, %r490, %r496; - xor.b32 %r498, %r497, %r464; - add.s32 %r499, %r359, %r465; - add.s32 %r500, %r499, %r498; - add.s32 %r501, %r500, %r495; - shf.r.wrap.b32 %r502, %r489, %r489, 2; - shf.r.wrap.b32 %r503, %r489, %r489, 13; - xor.b32 %r504, %r502, %r503; - shf.r.wrap.b32 %r505, %r489, %r489, 22; - xor.b32 %r506, %r504, %r505; - xor.b32 %r507, %r462, %r461; - and.b32 %r508, %r489, %r507; - xor.b32 %r509, %r508, %r483; - add.s32 %r510, %r506, %r509; - add.s32 %r511, %r501, %r357; - cvt.u64.u32 %rd236, %r490; - cvt.u64.u32 %rd237, %r511; - cvt.u64.u32 %rd238, %r489; - add.s32 %r512, %r510, %r501; - cvt.u64.u32 %rd239, %r512; - bfi.b64 %rd240, %rd238, %rd239, 32, 32; - bfi.b64 %rd241, %rd236, %rd237, 32, 32; - mov.b64 {%r513, %r514}, %rd240; - mov.b64 {%r515, 
%r516}, %rd241; - mov.b64 {%r517, %r518}, %rd229; - cvt.u64.u32 %rd242, %r518; - bfi.b64 %rd243, %rd242, %rd228, 32, 32; - cvt.u64.u32 %rd244, %r516; - cvt.u64.u32 %rd245, %r514; - cvt.u64.u32 %rd246, %r515; - bfi.b64 %rd247, %rd245, %rd239, 32, 32; - bfi.b64 %rd248, %rd244, %rd246, 32, 32; - mov.b64 {%r519, %r520}, %rd247; - mov.b64 {%r521, %r522}, %rd248; - mov.b64 {%r523, %r524}, %rd243; - shf.r.wrap.b32 %r525, %r521, %r521, 6; - shf.r.wrap.b32 %r526, %r521, %r521, 11; - xor.b32 %r527, %r525, %r526; - shf.r.wrap.b32 %r528, %r521, %r521, 25; - xor.b32 %r529, %r527, %r528; - xor.b32 %r530, %r522, %r463; - and.b32 %r531, %r530, %r521; - xor.b32 %r532, %r531, %r463; - add.s32 %r533, %r464, %r524; - add.s32 %r534, %r533, %r529; - add.s32 %r535, %r534, %r532; - shf.r.wrap.b32 %r536, %r519, %r519, 2; - shf.r.wrap.b32 %r537, %r519, %r519, 13; - xor.b32 %r538, %r536, %r537; - shf.r.wrap.b32 %r539, %r519, %r519, 22; - xor.b32 %r540, %r538, %r539; - and.b32 %r541, %r520, %r519; - and.b32 %r542, %r512, %r408; - xor.b32 %r543, %r541, %r542; - and.b32 %r544, %r520, %r461; - xor.b32 %r545, %r543, %r544; - add.s32 %r546, %r545, %r540; - add.s32 %r547, %r546, %r535; - add.s32 %r548, %r535, %r462; - shf.r.wrap.b32 %r549, %r548, %r548, 6; - shf.r.wrap.b32 %r550, %r548, %r548, 11; - xor.b32 %r551, %r549, %r550; - shf.r.wrap.b32 %r552, %r548, %r548, 25; - xor.b32 %r553, %r551, %r552; - xor.b32 %r554, %r522, %r521; - and.b32 %r555, %r548, %r554; - xor.b32 %r556, %r555, %r522; - add.s32 %r557, %r463, %r523; - add.s32 %r558, %r557, %r556; - add.s32 %r559, %r558, %r553; - shf.r.wrap.b32 %r560, %r547, %r547, 2; - shf.r.wrap.b32 %r561, %r547, %r547, 13; - xor.b32 %r562, %r560, %r561; - shf.r.wrap.b32 %r563, %r547, %r547, 22; - xor.b32 %r564, %r562, %r563; - xor.b32 %r565, %r520, %r519; - and.b32 %r566, %r547, %r565; - xor.b32 %r567, %r566, %r541; - add.s32 %r568, %r564, %r567; - add.s32 %r569, %r559, %r461; - cvt.u64.u32 %rd249, %r548; - cvt.u64.u32 %rd250, %r569; - cvt.u64.u32 %rd251, 
%r547; - add.s32 %r570, %r568, %r559; - cvt.u64.u32 %rd252, %r570; - bfi.b64 %rd253, %rd251, %rd252, 32, 32; - bfi.b64 %rd254, %rd249, %rd250, 32, 32; - mov.b64 {%r571, %r572}, %rd253; - mov.b64 {%r573, %r574}, %rd254; - shl.b16 %rs153, %rs63, 8; - or.b16 %rs154, %rs62, %rs153; - shl.b16 %rs155, %rs65, 8; - or.b16 %rs156, %rs64, %rs155; - mov.b32 %r575, {%rs154, %rs156}; - shr.u32 %r576, %r575, 24; - shr.u32 %r577, %r575, 8; - and.b32 %r578, %r577, 65280; - or.b32 %r579, %r578, %r576; - shl.b32 %r580, %r575, 24; - shl.b32 %r581, %r575, 8; - and.b32 %r582, %r581, 16711680; - or.b32 %r583, %r580, %r582; - or.b32 %r584, %r583, %r579; - cvt.u64.u32 %rd255, %r584; - shl.b16 %rs157, %rs68, 8; - or.b16 %rs158, %rs67, %rs157; - shl.b16 %rs159, %rs70, 8; - or.b16 %rs160, %rs69, %rs159; - mov.b32 %r585, {%rs158, %rs160}; - shr.u32 %r586, %r585, 24; - shr.u32 %r587, %r585, 8; - and.b32 %r588, %r587, 65280; - or.b32 %r589, %r588, %r586; - shl.b32 %r590, %r585, 24; - shl.b32 %r591, %r585, 8; - and.b32 %r592, %r591, 16711680; - or.b32 %r593, %r590, %r592; - or.b32 %r594, %r593, %r589; - cvt.u64.u32 %rd256, %r74; - cvt.u64.u32 %rd257, %r84; - cvt.u64.u32 %rd258, %r594; - bfi.b64 %rd259, %rd255, %rd258, 32, 32; - bfi.b64 %rd260, %rd256, %rd257, 32, 32; - mov.b64 {%r595, %r596}, %rd260; - mov.b64 {%r597, %r598}, %rd259; - add.s32 %r599, %r595, -1046744716; - add.s32 %r600, %r596, -1680079193; - add.s32 %r601, %r597, -2132889090; - add.s32 %r602, %r598, 1925078388; - cvt.u64.u32 %rd261, %r602; - cvt.u64.u32 %rd262, %r600; - cvt.u64.u32 %rd263, %r601; - cvt.u64.u32 %rd264, %r599; - bfi.b64 %rd265, %rd262, %rd264, 32, 32; - bfi.b64 %rd266, %rd261, %rd263, 32, 32; - cvt.u64.u32 %rd267, %r574; - cvt.u64.u32 %rd268, %r572; - cvt.u64.u32 %rd269, %r573; - bfi.b64 %rd270, %rd268, %rd252, 32, 32; - bfi.b64 %rd271, %rd267, %rd269, 32, 32; - mov.b64 {%r603, %r604}, %rd270; - mov.b64 {%r605, %r606}, %rd271; - mov.b64 {%r607, %r608}, %rd266; - shf.r.wrap.b32 %r609, %r605, %r605, 6; - 
shf.r.wrap.b32 %r610, %r605, %r605, 11; - xor.b32 %r611, %r609, %r610; - shf.r.wrap.b32 %r612, %r605, %r605, 25; - xor.b32 %r613, %r611, %r612; - xor.b32 %r614, %r606, %r521; - and.b32 %r615, %r614, %r605; - xor.b32 %r616, %r615, %r521; - add.s32 %r617, %r522, %r608; - add.s32 %r618, %r617, %r613; - add.s32 %r619, %r618, %r616; - shf.r.wrap.b32 %r620, %r603, %r603, 2; - shf.r.wrap.b32 %r621, %r603, %r603, 13; - xor.b32 %r622, %r620, %r621; - shf.r.wrap.b32 %r623, %r603, %r603, 22; - xor.b32 %r624, %r622, %r623; - and.b32 %r625, %r604, %r603; - and.b32 %r626, %r570, %r512; - xor.b32 %r627, %r625, %r626; - and.b32 %r628, %r604, %r519; - xor.b32 %r629, %r627, %r628; - add.s32 %r630, %r629, %r624; - add.s32 %r631, %r630, %r619; - add.s32 %r632, %r619, %r520; - shf.r.wrap.b32 %r633, %r632, %r632, 6; - shf.r.wrap.b32 %r634, %r632, %r632, 11; - xor.b32 %r635, %r633, %r634; - shf.r.wrap.b32 %r636, %r632, %r632, 25; - xor.b32 %r637, %r635, %r636; - xor.b32 %r638, %r606, %r605; - and.b32 %r639, %r632, %r638; - xor.b32 %r640, %r639, %r606; - add.s32 %r641, %r521, %r607; - add.s32 %r642, %r641, %r640; - add.s32 %r643, %r642, %r637; - shf.r.wrap.b32 %r644, %r631, %r631, 2; - shf.r.wrap.b32 %r645, %r631, %r631, 13; - xor.b32 %r646, %r644, %r645; - shf.r.wrap.b32 %r647, %r631, %r631, 22; - xor.b32 %r648, %r646, %r647; - xor.b32 %r649, %r604, %r603; - and.b32 %r650, %r631, %r649; - xor.b32 %r651, %r650, %r625; - add.s32 %r652, %r648, %r651; - add.s32 %r653, %r643, %r519; - cvt.u64.u32 %rd272, %r632; - cvt.u64.u32 %rd273, %r653; - cvt.u64.u32 %rd274, %r631; - add.s32 %r654, %r652, %r643; - cvt.u64.u32 %rd275, %r654; - bfi.b64 %rd276, %rd274, %rd275, 32, 32; - bfi.b64 %rd277, %rd272, %rd273, 32, 32; - mov.b64 {%r655, %r656}, %rd276; - mov.b64 {%r657, %r658}, %rd277; - mov.b64 {%r659, %r660}, %rd265; - cvt.u64.u32 %rd278, %r660; - bfi.b64 %rd279, %rd278, %rd264, 32, 32; - cvt.u64.u32 %rd280, %r658; - cvt.u64.u32 %rd281, %r656; - cvt.u64.u32 %rd282, %r657; - bfi.b64 %rd283, %rd281, 
%rd275, 32, 32; - bfi.b64 %rd284, %rd280, %rd282, 32, 32; - mov.b64 {%r661, %r662}, %rd283; - mov.b64 {%r663, %r664}, %rd284; - mov.b64 {%r665, %r666}, %rd279; - shf.r.wrap.b32 %r667, %r663, %r663, 6; - shf.r.wrap.b32 %r668, %r663, %r663, 11; - xor.b32 %r669, %r667, %r668; - shf.r.wrap.b32 %r670, %r663, %r663, 25; - xor.b32 %r671, %r669, %r670; - xor.b32 %r672, %r664, %r605; - and.b32 %r673, %r672, %r663; - xor.b32 %r674, %r673, %r605; - add.s32 %r675, %r606, %r666; - add.s32 %r676, %r675, %r671; - add.s32 %r677, %r676, %r674; - shf.r.wrap.b32 %r678, %r661, %r661, 2; - shf.r.wrap.b32 %r679, %r661, %r661, 13; - xor.b32 %r680, %r678, %r679; - shf.r.wrap.b32 %r681, %r661, %r661, 22; - xor.b32 %r682, %r680, %r681; - and.b32 %r683, %r662, %r661; - and.b32 %r684, %r654, %r570; - xor.b32 %r685, %r683, %r684; - and.b32 %r686, %r662, %r603; - xor.b32 %r687, %r685, %r686; - add.s32 %r688, %r687, %r682; - add.s32 %r689, %r688, %r677; - add.s32 %r690, %r677, %r604; - shf.r.wrap.b32 %r691, %r690, %r690, 6; - shf.r.wrap.b32 %r692, %r690, %r690, 11; - xor.b32 %r693, %r691, %r692; - shf.r.wrap.b32 %r694, %r690, %r690, 25; - xor.b32 %r695, %r693, %r694; - xor.b32 %r696, %r664, %r663; - and.b32 %r697, %r690, %r696; - xor.b32 %r698, %r697, %r664; - add.s32 %r699, %r605, %r665; - add.s32 %r700, %r699, %r698; - add.s32 %r701, %r700, %r695; - shf.r.wrap.b32 %r702, %r689, %r689, 2; - shf.r.wrap.b32 %r703, %r689, %r689, 13; - xor.b32 %r704, %r702, %r703; - shf.r.wrap.b32 %r705, %r689, %r689, 22; - xor.b32 %r706, %r704, %r705; - xor.b32 %r707, %r662, %r661; - and.b32 %r708, %r689, %r707; - xor.b32 %r709, %r708, %r683; - add.s32 %r710, %r706, %r709; - add.s32 %r711, %r701, %r603; - cvt.u64.u32 %rd285, %r690; - cvt.u64.u32 %rd286, %r711; - cvt.u64.u32 %rd287, %r689; - add.s32 %r712, %r710, %r701; - cvt.u64.u32 %rd288, %r712; - bfi.b64 %rd289, %rd287, %rd288, 32, 32; - bfi.b64 %rd290, %rd285, %rd286, 32, 32; - mov.b64 {%r713, %r714}, %rd289; - mov.b64 {%r715, %r716}, %rd290; - cvt.u64.u32 
%rd291, %r127; - cvt.u64.u32 %rd292, %r126; - cvt.u64.u32 %rd293, %r294; - bfi.b64 %rd294, %rd291, %rd292, 32, 32; - bfi.b64 %rd295, %rd142, %rd293, 32, 32; - mov.b64 {%r717, %r718}, %rd295; - mov.b64 {%r719, %r720}, %rd294; - shr.u32 %r721, %r718, 7; - shr.u32 %r722, %r719, 7; - shr.u32 %r723, %r720, 7; - cvt.u64.u32 %rd296, %r723; - cvt.u64.u32 %rd297, %r721; - shr.u32 %r724, %r717, 7; - cvt.u64.u32 %rd298, %r724; - cvt.u64.u32 %rd299, %r722; - bfi.b64 %rd300, %rd296, %rd299, 32, 32; - bfi.b64 %rd301, %rd297, %rd298, 32, 32; - shl.b32 %r725, %r718, 25; - shl.b32 %r726, %r719, 25; - cvt.u64.u32 %rd302, %r725; - shl.b32 %r727, %r717, 25; - cvt.u64.u32 %rd303, %r727; - cvt.u64.u32 %rd304, %r726; - cvt.u64.u32 %rd305, %r720; - bfi.b64 %rd306, %rd305, %rd304, 57, 7; - bfi.b64 %rd307, %rd302, %rd303, 32, 32; - mov.b64 {%r728, %r729}, %rd301; - mov.b64 {%r730, %r731}, %rd300; - mov.b64 {%r732, %r733}, %rd307; - mov.b64 {%r734, %r735}, %rd306; - or.b64 %rd308, %rd307, %rd301; - or.b32 %r736, %r733, %r729; - or.b32 %r737, %r734, %r730; - or.b32 %r738, %r735, %r731; - cvt.u64.u32 %rd309, %r738; - cvt.u64.u32 %rd310, %r736; - and.b64 %rd311, %rd308, 4294967295; - cvt.u64.u32 %rd312, %r737; - bfi.b64 %rd313, %rd309, %rd312, 32, 32; - bfi.b64 %rd314, %rd310, %rd311, 32, 32; - shr.u32 %r739, %r718, 18; - shr.u32 %r740, %r719, 18; - shr.u32 %r741, %r720, 18; - cvt.u64.u32 %rd315, %r741; - cvt.u64.u32 %rd316, %r739; - shr.u32 %r742, %r717, 18; - cvt.u64.u32 %rd317, %r742; - cvt.u64.u32 %rd318, %r740; - bfi.b64 %rd319, %rd315, %rd318, 32, 32; - bfi.b64 %rd320, %rd316, %rd317, 32, 32; - shl.b32 %r743, %r718, 14; - shl.b32 %r744, %r719, 14; - cvt.u64.u32 %rd321, %r743; - shl.b32 %r745, %r717, 14; - cvt.u64.u32 %rd322, %r745; - cvt.u64.u32 %rd323, %r744; - bfi.b64 %rd324, %rd305, %rd323, 46, 18; - bfi.b64 %rd325, %rd321, %rd322, 32, 32; - mov.b64 {%r746, %r747}, %rd320; - mov.b64 {%r748, %r749}, %rd319; - mov.b64 {%r750, %r751}, %rd325; - mov.b64 {%r752, %r753}, %rd324; - or.b64 
%rd326, %rd325, %rd320; - or.b32 %r754, %r751, %r747; - or.b32 %r755, %r752, %r748; - or.b32 %r756, %r753, %r749; - cvt.u64.u32 %rd327, %r756; - cvt.u64.u32 %rd328, %r754; - and.b64 %rd329, %rd326, 4294967295; - cvt.u64.u32 %rd330, %r755; - bfi.b64 %rd331, %rd327, %rd330, 32, 32; - bfi.b64 %rd332, %rd328, %rd329, 32, 32; - shr.u32 %r757, %r718, 3; - shr.u32 %r758, %r719, 3; - shr.u32 %r759, %r720, 3; - cvt.u64.u32 %rd333, %r759; - cvt.u64.u32 %rd334, %r757; - shr.u32 %r760, %r717, 3; - cvt.u64.u32 %rd335, %r760; - cvt.u64.u32 %rd336, %r758; - bfi.b64 %rd337, %rd333, %rd336, 32, 32; - bfi.b64 %rd338, %rd334, %rd335, 32, 32; - mov.b64 {%r761, %r762}, %rd314; - mov.b64 {%r763, %r764}, %rd313; - mov.b64 {%r765, %r766}, %rd332; - mov.b64 {%r767, %r768}, %rd331; - xor.b64 %rd339, %rd332, %rd314; - xor.b32 %r769, %r766, %r762; - xor.b32 %r770, %r767, %r763; - xor.b32 %r771, %r768, %r764; - cvt.u64.u32 %rd340, %r771; - cvt.u64.u32 %rd341, %r769; - and.b64 %rd342, %rd339, 4294967295; - cvt.u64.u32 %rd343, %r770; - bfi.b64 %rd344, %rd340, %rd343, 32, 32; - bfi.b64 %rd345, %rd341, %rd342, 32, 32; - mov.b64 {%r772, %r773}, %rd345; - mov.b64 {%r774, %r775}, %rd344; - mov.b64 {%r776, %r777}, %rd338; - mov.b64 {%r778, %r779}, %rd337; - shf.l.wrap.b32 %r780, %r717, %r717, 25; - shf.l.wrap.b32 %r781, %r717, %r717, 14; - xor.b32 %r782, %r781, %r780; - xor.b32 %r783, %r782, %r760; - xor.b32 %r784, %r773, %r777; - xor.b32 %r785, %r774, %r778; - xor.b32 %r786, %r775, %r779; - cvt.u64.u32 %rd346, %r455; - cvt.u64.u32 %rd347, %r454; - cvt.u64.u32 %rd348, %r598; - bfi.b64 %rd349, %rd346, %rd347, 32, 32; - bfi.b64 %rd350, %rd221, %rd348, 32, 32; - mov.b64 {%r787, %r788}, %rd350; - mov.b64 {%r789, %r790}, %rd349; - shf.r.wrap.b32 %r791, %r596, %r596, 17; - shf.r.wrap.b32 %r792, %r596, %r596, 19; - xor.b32 %r793, %r791, %r792; - shr.u32 %r794, %r596, 10; - xor.b32 %r795, %r793, %r794; - add.s32 %r796, %r795, %r128; - add.s32 %r797, %r796, %r790; - add.s32 %r798, %r797, %r786; - 
shf.r.wrap.b32 %r799, %r595, %r595, 17; - shf.r.wrap.b32 %r800, %r595, %r595, 19; - xor.b32 %r801, %r799, %r800; - shr.u32 %r802, %r595, 10; - xor.b32 %r803, %r801, %r802; - add.s32 %r804, %r803, %r127; - add.s32 %r805, %r804, %r789; - add.s32 %r806, %r805, %r785; - shf.r.wrap.b32 %r807, %r798, %r798, 17; - shf.r.wrap.b32 %r808, %r798, %r798, 19; - xor.b32 %r809, %r807, %r808; - shr.u32 %r810, %r798, 10; - xor.b32 %r811, %r809, %r810; - add.s32 %r812, %r788, %r126; - add.s32 %r813, %r812, %r784; - add.s32 %r814, %r813, %r811; - shf.r.wrap.b32 %r815, %r806, %r806, 17; - shf.r.wrap.b32 %r816, %r806, %r806, 19; - xor.b32 %r817, %r815, %r816; - shr.u32 %r818, %r806, 10; - xor.b32 %r819, %r817, %r818; - add.s32 %r820, %r787, %r125; - add.s32 %r821, %r820, %r783; - add.s32 %r822, %r821, %r819; - cvt.u64.u32 %rd351, %r798; - cvt.u64.u32 %rd352, %r806; - cvt.u64.u32 %rd353, %r814; - cvt.u64.u32 %rd354, %r822; - bfi.b64 %rd355, %rd353, %rd354, 32, 32; - bfi.b64 %rd356, %rd351, %rd352, 32, 32; - mov.b64 {%r823, %r824}, %rd355; - mov.b64 {%r825, %r826}, %rd356; - add.s32 %r827, %r823, 604807628; - add.s32 %r828, %r824, 264347078; - add.s32 %r829, %r825, -272742522; - add.s32 %r830, %r826, -459576895; - cvt.u64.u32 %rd357, %r830; - cvt.u64.u32 %rd358, %r828; - cvt.u64.u32 %rd359, %r829; - cvt.u64.u32 %rd360, %r827; - bfi.b64 %rd361, %rd358, %rd360, 32, 32; - bfi.b64 %rd362, %rd357, %rd359, 32, 32; - cvt.u64.u32 %rd363, %r716; - cvt.u64.u32 %rd364, %r714; - cvt.u64.u32 %rd365, %r715; - bfi.b64 %rd366, %rd364, %rd288, 32, 32; - bfi.b64 %rd367, %rd363, %rd365, 32, 32; - mov.b64 {%r831, %r832}, %rd366; - mov.b64 {%r833, %r834}, %rd367; - mov.b64 {%r835, %r836}, %rd362; - shf.r.wrap.b32 %r837, %r833, %r833, 6; - shf.r.wrap.b32 %r838, %r833, %r833, 11; - xor.b32 %r839, %r837, %r838; - shf.r.wrap.b32 %r840, %r833, %r833, 25; - xor.b32 %r841, %r839, %r840; - xor.b32 %r842, %r834, %r663; - and.b32 %r843, %r842, %r833; - xor.b32 %r844, %r843, %r663; - add.s32 %r845, %r664, %r836; - 
add.s32 %r846, %r845, %r841; - add.s32 %r847, %r846, %r844; - shf.r.wrap.b32 %r848, %r831, %r831, 2; - shf.r.wrap.b32 %r849, %r831, %r831, 13; - xor.b32 %r850, %r848, %r849; - shf.r.wrap.b32 %r851, %r831, %r831, 22; - xor.b32 %r852, %r850, %r851; - and.b32 %r853, %r832, %r831; - and.b32 %r854, %r712, %r654; - xor.b32 %r855, %r853, %r854; - and.b32 %r856, %r832, %r661; - xor.b32 %r857, %r855, %r856; - add.s32 %r858, %r857, %r852; - add.s32 %r859, %r858, %r847; - add.s32 %r860, %r847, %r662; - shf.r.wrap.b32 %r861, %r860, %r860, 6; - shf.r.wrap.b32 %r862, %r860, %r860, 11; - xor.b32 %r863, %r861, %r862; - shf.r.wrap.b32 %r864, %r860, %r860, 25; - xor.b32 %r865, %r863, %r864; - xor.b32 %r866, %r834, %r833; - and.b32 %r867, %r860, %r866; - xor.b32 %r868, %r867, %r834; - add.s32 %r869, %r663, %r835; - add.s32 %r870, %r869, %r868; - add.s32 %r871, %r870, %r865; - shf.r.wrap.b32 %r872, %r859, %r859, 2; - shf.r.wrap.b32 %r873, %r859, %r859, 13; - xor.b32 %r874, %r872, %r873; - shf.r.wrap.b32 %r875, %r859, %r859, 22; - xor.b32 %r876, %r874, %r875; - xor.b32 %r877, %r832, %r831; - and.b32 %r878, %r859, %r877; - xor.b32 %r879, %r878, %r853; - add.s32 %r880, %r876, %r879; - add.s32 %r881, %r871, %r661; - cvt.u64.u32 %rd368, %r860; - cvt.u64.u32 %rd369, %r881; - cvt.u64.u32 %rd370, %r859; - add.s32 %r882, %r880, %r871; - cvt.u64.u32 %rd371, %r882; - bfi.b64 %rd372, %rd370, %rd371, 32, 32; - bfi.b64 %rd373, %rd368, %rd369, 32, 32; - mov.b64 {%r883, %r884}, %rd372; - mov.b64 {%r885, %r886}, %rd373; - mov.b64 {%r887, %r888}, %rd361; - cvt.u64.u32 %rd374, %r888; - bfi.b64 %rd375, %rd374, %rd360, 32, 32; - cvt.u64.u32 %rd376, %r886; - cvt.u64.u32 %rd377, %r884; - cvt.u64.u32 %rd378, %r885; - bfi.b64 %rd379, %rd377, %rd371, 32, 32; - bfi.b64 %rd380, %rd376, %rd378, 32, 32; - mov.b64 {%r889, %r890}, %rd379; - mov.b64 {%r891, %r892}, %rd380; - mov.b64 {%r893, %r894}, %rd375; - shf.r.wrap.b32 %r895, %r891, %r891, 6; - shf.r.wrap.b32 %r896, %r891, %r891, 11; - xor.b32 %r897, %r895, 
%r896; - shf.r.wrap.b32 %r898, %r891, %r891, 25; - xor.b32 %r899, %r897, %r898; - xor.b32 %r900, %r892, %r833; - and.b32 %r901, %r900, %r891; - xor.b32 %r902, %r901, %r833; - add.s32 %r903, %r834, %r894; - add.s32 %r904, %r903, %r899; - add.s32 %r905, %r904, %r902; - shf.r.wrap.b32 %r906, %r889, %r889, 2; - shf.r.wrap.b32 %r907, %r889, %r889, 13; - xor.b32 %r908, %r906, %r907; - shf.r.wrap.b32 %r909, %r889, %r889, 22; - xor.b32 %r910, %r908, %r909; - and.b32 %r911, %r890, %r889; - and.b32 %r912, %r882, %r712; - xor.b32 %r913, %r911, %r912; - and.b32 %r914, %r890, %r831; - xor.b32 %r915, %r913, %r914; - add.s32 %r916, %r915, %r910; - add.s32 %r917, %r916, %r905; - add.s32 %r918, %r905, %r832; - shf.r.wrap.b32 %r919, %r918, %r918, 6; - shf.r.wrap.b32 %r920, %r918, %r918, 11; - xor.b32 %r921, %r919, %r920; - shf.r.wrap.b32 %r922, %r918, %r918, 25; - xor.b32 %r923, %r921, %r922; - xor.b32 %r924, %r892, %r891; - and.b32 %r925, %r918, %r924; - xor.b32 %r926, %r925, %r892; - add.s32 %r927, %r833, %r893; - add.s32 %r928, %r927, %r926; - add.s32 %r929, %r928, %r923; - shf.r.wrap.b32 %r930, %r917, %r917, 2; - shf.r.wrap.b32 %r931, %r917, %r917, 13; - xor.b32 %r932, %r930, %r931; - shf.r.wrap.b32 %r933, %r917, %r917, 22; - xor.b32 %r934, %r932, %r933; - xor.b32 %r935, %r890, %r889; - and.b32 %r936, %r917, %r935; - xor.b32 %r937, %r936, %r911; - add.s32 %r938, %r934, %r937; - add.s32 %r939, %r929, %r831; - cvt.u64.u32 %rd381, %r918; - cvt.u64.u32 %rd382, %r939; - cvt.u64.u32 %rd383, %r917; - add.s32 %r940, %r938, %r929; - cvt.u64.u32 %rd384, %r940; - bfi.b64 %rd385, %rd383, %rd384, 32, 32; - bfi.b64 %rd386, %rd381, %rd382, 32, 32; - mov.b64 {%r941, %r942}, %rd385; - mov.b64 {%r943, %r944}, %rd386; - cvt.u64.u32 %rd387, %r293; - cvt.u64.u32 %rd388, %r292; - cvt.u64.u32 %rd389, %r456; - bfi.b64 %rd390, %rd387, %rd388, 32, 32; - bfi.b64 %rd391, %rd185, %rd389, 32, 32; - mov.b64 {%r945, %r946}, %rd391; - mov.b64 {%r947, %r948}, %rd390; - shr.u32 %r949, %r946, 7; - shr.u32 %r950, 
%r947, 7; - shr.u32 %r951, %r948, 7; - cvt.u64.u32 %rd392, %r951; - cvt.u64.u32 %rd393, %r949; - shr.u32 %r952, %r945, 7; - cvt.u64.u32 %rd394, %r952; - cvt.u64.u32 %rd395, %r950; - bfi.b64 %rd396, %rd392, %rd395, 32, 32; - bfi.b64 %rd397, %rd393, %rd394, 32, 32; - shl.b32 %r953, %r946, 25; - shl.b32 %r954, %r947, 25; - cvt.u64.u32 %rd398, %r953; - shl.b32 %r955, %r945, 25; - cvt.u64.u32 %rd399, %r955; - cvt.u64.u32 %rd400, %r954; - cvt.u64.u32 %rd401, %r948; - bfi.b64 %rd402, %rd401, %rd400, 57, 7; - bfi.b64 %rd403, %rd398, %rd399, 32, 32; - mov.b64 {%r956, %r957}, %rd397; - mov.b64 {%r958, %r959}, %rd396; - mov.b64 {%r960, %r961}, %rd403; - mov.b64 {%r962, %r963}, %rd402; - or.b64 %rd404, %rd403, %rd397; - or.b32 %r964, %r961, %r957; - or.b32 %r965, %r962, %r958; - or.b32 %r966, %r963, %r959; - cvt.u64.u32 %rd405, %r966; - cvt.u64.u32 %rd406, %r964; - and.b64 %rd407, %rd404, 4294967295; - cvt.u64.u32 %rd408, %r965; - bfi.b64 %rd409, %rd405, %rd408, 32, 32; - bfi.b64 %rd410, %rd406, %rd407, 32, 32; - shr.u32 %r967, %r946, 18; - shr.u32 %r968, %r947, 18; - shr.u32 %r969, %r948, 18; - cvt.u64.u32 %rd411, %r969; - cvt.u64.u32 %rd412, %r967; - shr.u32 %r970, %r945, 18; - cvt.u64.u32 %rd413, %r970; - cvt.u64.u32 %rd414, %r968; - bfi.b64 %rd415, %rd411, %rd414, 32, 32; - bfi.b64 %rd416, %rd412, %rd413, 32, 32; - shl.b32 %r971, %r946, 14; - shl.b32 %r972, %r947, 14; - cvt.u64.u32 %rd417, %r971; - shl.b32 %r973, %r945, 14; - cvt.u64.u32 %rd418, %r973; - cvt.u64.u32 %rd419, %r972; - bfi.b64 %rd420, %rd401, %rd419, 46, 18; - bfi.b64 %rd421, %rd417, %rd418, 32, 32; - mov.b64 {%r974, %r975}, %rd416; - mov.b64 {%r976, %r977}, %rd415; - mov.b64 {%r978, %r979}, %rd421; - mov.b64 {%r980, %r981}, %rd420; - or.b64 %rd422, %rd421, %rd416; - or.b32 %r982, %r979, %r975; - or.b32 %r983, %r980, %r976; - or.b32 %r984, %r981, %r977; - cvt.u64.u32 %rd423, %r984; - cvt.u64.u32 %rd424, %r982; - and.b64 %rd425, %rd422, 4294967295; - cvt.u64.u32 %rd426, %r983; - bfi.b64 %rd427, %rd423, %rd426, 
32, 32; - bfi.b64 %rd428, %rd424, %rd425, 32, 32; - shr.u32 %r985, %r946, 3; - shr.u32 %r986, %r947, 3; - shr.u32 %r987, %r948, 3; - cvt.u64.u32 %rd429, %r987; - cvt.u64.u32 %rd430, %r985; - shr.u32 %r988, %r945, 3; - cvt.u64.u32 %rd431, %r988; - cvt.u64.u32 %rd432, %r986; - bfi.b64 %rd433, %rd429, %rd432, 32, 32; - bfi.b64 %rd434, %rd430, %rd431, 32, 32; - mov.b64 {%r989, %r990}, %rd410; - mov.b64 {%r991, %r992}, %rd409; - mov.b64 {%r993, %r994}, %rd428; - mov.b64 {%r995, %r996}, %rd427; - xor.b64 %rd435, %rd428, %rd410; - xor.b32 %r997, %r994, %r990; - xor.b32 %r998, %r995, %r991; - xor.b32 %r999, %r996, %r992; - cvt.u64.u32 %rd436, %r999; - cvt.u64.u32 %rd437, %r997; - and.b64 %rd438, %rd435, 4294967295; - cvt.u64.u32 %rd439, %r998; - bfi.b64 %rd440, %rd436, %rd439, 32, 32; - bfi.b64 %rd441, %rd437, %rd438, 32, 32; - mov.b64 {%r1000, %r1001}, %rd441; - mov.b64 {%r1002, %r1003}, %rd440; - mov.b64 {%r1004, %r1005}, %rd434; - mov.b64 {%r1006, %r1007}, %rd433; - shf.l.wrap.b32 %r1008, %r945, %r945, 25; - shf.l.wrap.b32 %r1009, %r945, %r945, 14; - xor.b32 %r1010, %r1009, %r1008; - xor.b32 %r1011, %r1010, %r988; - xor.b32 %r1012, %r1001, %r1005; - xor.b32 %r1013, %r1002, %r1006; - xor.b32 %r1014, %r1003, %r1007; - cvt.u64.u32 %rd442, %r597; - cvt.u64.u32 %rd443, %r596; - cvt.u64.u32 %rd444, %r826; - bfi.b64 %rd445, %rd257, %rd444, 32, 32; - bfi.b64 %rd446, %rd442, %rd443, 32, 32; - mov.b64 {%r1015, %r1016}, %rd445; - mov.b64 {%r1017, %r1018}, %rd446; - shf.r.wrap.b32 %r1019, %r824, %r824, 17; - shf.r.wrap.b32 %r1020, %r824, %r824, 19; - xor.b32 %r1021, %r1019, %r1020; - shr.u32 %r1022, %r824, 10; - xor.b32 %r1023, %r1021, %r1022; - add.s32 %r1024, %r1014, %r294; - add.s32 %r1025, %r1024, %r1023; - add.s32 %r1026, %r1025, %r1018; - shf.r.wrap.b32 %r1027, %r823, %r823, 17; - shf.r.wrap.b32 %r1028, %r823, %r823, 19; - xor.b32 %r1029, %r1027, %r1028; - shr.u32 %r1030, %r823, 10; - xor.b32 %r1031, %r1029, %r1030; - add.s32 %r1032, %r1013, %r293; - add.s32 %r1033, %r1032, 
%r1031; - add.s32 %r1034, %r1033, %r1017; - shf.r.wrap.b32 %r1035, %r1026, %r1026, 17; - shf.r.wrap.b32 %r1036, %r1026, %r1026, 19; - xor.b32 %r1037, %r1035, %r1036; - shr.u32 %r1038, %r1026, 10; - xor.b32 %r1039, %r1037, %r1038; - add.s32 %r1040, %r1012, %r292; - add.s32 %r1041, %r1040, %r1016; - add.s32 %r1042, %r1041, %r1039; - shf.r.wrap.b32 %r1043, %r1034, %r1034, 17; - shf.r.wrap.b32 %r1044, %r1034, %r1034, 19; - xor.b32 %r1045, %r1043, %r1044; - shr.u32 %r1046, %r1034, 10; - xor.b32 %r1047, %r1045, %r1046; - add.s32 %r1048, %r1011, %r291; - add.s32 %r1049, %r1048, %r1015; - add.s32 %r1050, %r1049, %r1047; - cvt.u64.u32 %rd447, %r1026; - cvt.u64.u32 %rd448, %r1034; - cvt.u64.u32 %rd449, %r1042; - cvt.u64.u32 %rd450, %r1050; - bfi.b64 %rd451, %rd449, %rd450, 32, 32; - bfi.b64 %rd452, %rd447, %rd448, 32, 32; - mov.b64 {%r1051, %r1052}, %rd451; - mov.b64 {%r1053, %r1054}, %rd452; - cvt.u64.u32 %rd453, %r1054; - cvt.u64.u32 %rd454, %r1052; - cvt.u64.u32 %rd455, %r1053; - bfi.b64 %rd456, %rd453, %rd455, 32, 32; - bfi.b64 %rd457, %rd454, %rd450, 32, 32; - mov.b64 {%r1055, %r1056}, %rd457; - mov.b64 {%r1057, %r1058}, %rd456; - add.s32 %r1059, %r1055, 1996064986; - add.s32 %r1060, %r1056, 1555081692; - add.s32 %r1061, %r1057, 1249150122; - add.s32 %r1062, %r1058, 770255983; - cvt.u64.u32 %rd458, %r1062; - cvt.u64.u32 %rd459, %r1060; - cvt.u64.u32 %rd460, %r1061; - cvt.u64.u32 %rd461, %r1059; - bfi.b64 %rd462, %rd459, %rd461, 32, 32; - bfi.b64 %rd463, %rd458, %rd460, 32, 32; - cvt.u64.u32 %rd464, %r944; - cvt.u64.u32 %rd465, %r942; - cvt.u64.u32 %rd466, %r943; - bfi.b64 %rd467, %rd465, %rd384, 32, 32; - bfi.b64 %rd468, %rd464, %rd466, 32, 32; - mov.b64 {%r1063, %r1064}, %rd467; - mov.b64 {%r1065, %r1066}, %rd468; - mov.b64 {%r1067, %r1068}, %rd463; - shf.r.wrap.b32 %r1069, %r1065, %r1065, 6; - shf.r.wrap.b32 %r1070, %r1065, %r1065, 11; - xor.b32 %r1071, %r1069, %r1070; - shf.r.wrap.b32 %r1072, %r1065, %r1065, 25; - xor.b32 %r1073, %r1071, %r1072; - xor.b32 %r1074, 
%r1066, %r891; - and.b32 %r1075, %r1074, %r1065; - xor.b32 %r1076, %r1075, %r891; - add.s32 %r1077, %r892, %r1068; - add.s32 %r1078, %r1077, %r1073; - add.s32 %r1079, %r1078, %r1076; - shf.r.wrap.b32 %r1080, %r1063, %r1063, 2; - shf.r.wrap.b32 %r1081, %r1063, %r1063, 13; - xor.b32 %r1082, %r1080, %r1081; - shf.r.wrap.b32 %r1083, %r1063, %r1063, 22; - xor.b32 %r1084, %r1082, %r1083; - and.b32 %r1085, %r1064, %r1063; - and.b32 %r1086, %r940, %r882; - xor.b32 %r1087, %r1085, %r1086; - and.b32 %r1088, %r1064, %r889; - xor.b32 %r1089, %r1087, %r1088; - add.s32 %r1090, %r1089, %r1084; - add.s32 %r1091, %r1090, %r1079; - add.s32 %r1092, %r1079, %r890; - shf.r.wrap.b32 %r1093, %r1092, %r1092, 6; - shf.r.wrap.b32 %r1094, %r1092, %r1092, 11; - xor.b32 %r1095, %r1093, %r1094; - shf.r.wrap.b32 %r1096, %r1092, %r1092, 25; - xor.b32 %r1097, %r1095, %r1096; - xor.b32 %r1098, %r1066, %r1065; - and.b32 %r1099, %r1092, %r1098; - xor.b32 %r1100, %r1099, %r1066; - add.s32 %r1101, %r891, %r1067; - add.s32 %r1102, %r1101, %r1100; - add.s32 %r1103, %r1102, %r1097; - shf.r.wrap.b32 %r1104, %r1091, %r1091, 2; - shf.r.wrap.b32 %r1105, %r1091, %r1091, 13; - xor.b32 %r1106, %r1104, %r1105; - shf.r.wrap.b32 %r1107, %r1091, %r1091, 22; - xor.b32 %r1108, %r1106, %r1107; - xor.b32 %r1109, %r1064, %r1063; - and.b32 %r1110, %r1091, %r1109; - xor.b32 %r1111, %r1110, %r1085; - add.s32 %r1112, %r1108, %r1111; - add.s32 %r1113, %r1103, %r889; - cvt.u64.u32 %rd469, %r1092; - cvt.u64.u32 %rd470, %r1113; - cvt.u64.u32 %rd471, %r1091; - add.s32 %r1114, %r1112, %r1103; - cvt.u64.u32 %rd472, %r1114; - bfi.b64 %rd473, %rd471, %rd472, 32, 32; - bfi.b64 %rd474, %rd469, %rd470, 32, 32; - mov.b64 {%r1115, %r1116}, %rd473; - mov.b64 {%r1117, %r1118}, %rd474; - mov.b64 {%r1119, %r1120}, %rd462; - cvt.u64.u32 %rd475, %r1120; - bfi.b64 %rd476, %rd475, %rd461, 32, 32; - cvt.u64.u32 %rd477, %r1118; - cvt.u64.u32 %rd478, %r1116; - cvt.u64.u32 %rd479, %r1117; - bfi.b64 %rd480, %rd478, %rd472, 32, 32; - bfi.b64 %rd481, 
%rd477, %rd479, 32, 32; - mov.b64 {%r1121, %r1122}, %rd480; - mov.b64 {%r1123, %r1124}, %rd481; - mov.b64 {%r1125, %r1126}, %rd476; - shf.r.wrap.b32 %r1127, %r1123, %r1123, 6; - shf.r.wrap.b32 %r1128, %r1123, %r1123, 11; - xor.b32 %r1129, %r1127, %r1128; - shf.r.wrap.b32 %r1130, %r1123, %r1123, 25; - xor.b32 %r1131, %r1129, %r1130; - xor.b32 %r1132, %r1124, %r1065; - and.b32 %r1133, %r1132, %r1123; - xor.b32 %r1134, %r1133, %r1065; - add.s32 %r1135, %r1066, %r1126; - add.s32 %r1136, %r1135, %r1131; - add.s32 %r1137, %r1136, %r1134; - shf.r.wrap.b32 %r1138, %r1121, %r1121, 2; - shf.r.wrap.b32 %r1139, %r1121, %r1121, 13; - xor.b32 %r1140, %r1138, %r1139; - shf.r.wrap.b32 %r1141, %r1121, %r1121, 22; - xor.b32 %r1142, %r1140, %r1141; - and.b32 %r1143, %r1122, %r1121; - and.b32 %r1144, %r1114, %r940; - xor.b32 %r1145, %r1143, %r1144; - and.b32 %r1146, %r1122, %r1063; - xor.b32 %r1147, %r1145, %r1146; - add.s32 %r1148, %r1147, %r1142; - add.s32 %r1149, %r1148, %r1137; - add.s32 %r1150, %r1137, %r1064; - shf.r.wrap.b32 %r1151, %r1150, %r1150, 6; - shf.r.wrap.b32 %r1152, %r1150, %r1150, 11; - xor.b32 %r1153, %r1151, %r1152; - shf.r.wrap.b32 %r1154, %r1150, %r1150, 25; - xor.b32 %r1155, %r1153, %r1154; - xor.b32 %r1156, %r1124, %r1123; - and.b32 %r1157, %r1150, %r1156; - xor.b32 %r1158, %r1157, %r1124; - add.s32 %r1159, %r1065, %r1125; - add.s32 %r1160, %r1159, %r1158; - add.s32 %r1161, %r1160, %r1155; - shf.r.wrap.b32 %r1162, %r1149, %r1149, 2; - shf.r.wrap.b32 %r1163, %r1149, %r1149, 13; - xor.b32 %r1164, %r1162, %r1163; - shf.r.wrap.b32 %r1165, %r1149, %r1149, 22; - xor.b32 %r1166, %r1164, %r1165; - xor.b32 %r1167, %r1122, %r1121; - and.b32 %r1168, %r1149, %r1167; - xor.b32 %r1169, %r1168, %r1143; - add.s32 %r1170, %r1166, %r1169; - add.s32 %r1171, %r1161, %r1063; - cvt.u64.u32 %rd482, %r1150; - cvt.u64.u32 %rd483, %r1171; - cvt.u64.u32 %rd484, %r1149; - add.s32 %r1172, %r1170, %r1161; - cvt.u64.u32 %rd485, %r1172; - bfi.b64 %rd486, %rd484, %rd485, 32, 32; - bfi.b64 
%rd487, %rd482, %rd483, 32, 32; - mov.b64 {%r1173, %r1174}, %rd486; - mov.b64 {%r1175, %r1176}, %rd487; - shr.u32 %r1177, %r788, 7; - shr.u32 %r1178, %r789, 7; - shr.u32 %r1179, %r790, 7; - cvt.u64.u32 %rd488, %r1179; - cvt.u64.u32 %rd489, %r1177; - shr.u32 %r1180, %r787, 7; - cvt.u64.u32 %rd490, %r1180; - cvt.u64.u32 %rd491, %r1178; - bfi.b64 %rd492, %rd488, %rd491, 32, 32; - bfi.b64 %rd493, %rd489, %rd490, 32, 32; - shl.b32 %r1181, %r788, 25; - shl.b32 %r1182, %r789, 25; - cvt.u64.u32 %rd494, %r1181; - shl.b32 %r1183, %r787, 25; - cvt.u64.u32 %rd495, %r1183; - cvt.u64.u32 %rd496, %r1182; - cvt.u64.u32 %rd497, %r790; - bfi.b64 %rd498, %rd497, %rd496, 57, 7; - bfi.b64 %rd499, %rd494, %rd495, 32, 32; - mov.b64 {%r1184, %r1185}, %rd493; - mov.b64 {%r1186, %r1187}, %rd492; - mov.b64 {%r1188, %r1189}, %rd499; - mov.b64 {%r1190, %r1191}, %rd498; - or.b64 %rd500, %rd499, %rd493; - or.b32 %r1192, %r1189, %r1185; - or.b32 %r1193, %r1190, %r1186; - or.b32 %r1194, %r1191, %r1187; - cvt.u64.u32 %rd501, %r1194; - cvt.u64.u32 %rd502, %r1192; - and.b64 %rd503, %rd500, 4294967295; - cvt.u64.u32 %rd504, %r1193; - bfi.b64 %rd505, %rd501, %rd504, 32, 32; - bfi.b64 %rd506, %rd502, %rd503, 32, 32; - shr.u32 %r1195, %r788, 18; - shr.u32 %r1196, %r789, 18; - shr.u32 %r1197, %r790, 18; - cvt.u64.u32 %rd507, %r1197; - cvt.u64.u32 %rd508, %r1195; - shr.u32 %r1198, %r787, 18; - cvt.u64.u32 %rd509, %r1198; - cvt.u64.u32 %rd510, %r1196; - bfi.b64 %rd511, %rd507, %rd510, 32, 32; - bfi.b64 %rd512, %rd508, %rd509, 32, 32; - shl.b32 %r1199, %r788, 14; - shl.b32 %r1200, %r789, 14; - cvt.u64.u32 %rd513, %r1199; - shl.b32 %r1201, %r787, 14; - cvt.u64.u32 %rd514, %r1201; - cvt.u64.u32 %rd515, %r1200; - bfi.b64 %rd516, %rd497, %rd515, 46, 18; - bfi.b64 %rd517, %rd513, %rd514, 32, 32; - mov.b64 {%r1202, %r1203}, %rd512; - mov.b64 {%r1204, %r1205}, %rd511; - mov.b64 {%r1206, %r1207}, %rd517; - mov.b64 {%r1208, %r1209}, %rd516; - or.b64 %rd518, %rd517, %rd512; - or.b32 %r1210, %r1207, %r1203; - or.b32 
%r1211, %r1208, %r1204; - or.b32 %r1212, %r1209, %r1205; - cvt.u64.u32 %rd519, %r1212; - cvt.u64.u32 %rd520, %r1210; - and.b64 %rd521, %rd518, 4294967295; - cvt.u64.u32 %rd522, %r1211; - bfi.b64 %rd523, %rd519, %rd522, 32, 32; - bfi.b64 %rd524, %rd520, %rd521, 32, 32; - shr.u32 %r1213, %r788, 3; - shr.u32 %r1214, %r789, 3; - shr.u32 %r1215, %r790, 3; - cvt.u64.u32 %rd525, %r1215; - cvt.u64.u32 %rd526, %r1213; - shr.u32 %r1216, %r787, 3; - cvt.u64.u32 %rd527, %r1216; - cvt.u64.u32 %rd528, %r1214; - bfi.b64 %rd529, %rd525, %rd528, 32, 32; - bfi.b64 %rd530, %rd526, %rd527, 32, 32; - mov.b64 {%r1217, %r1218}, %rd506; - mov.b64 {%r1219, %r1220}, %rd505; - mov.b64 {%r1221, %r1222}, %rd524; - mov.b64 {%r1223, %r1224}, %rd523; - xor.b64 %rd531, %rd524, %rd506; - xor.b32 %r1225, %r1222, %r1218; - xor.b32 %r1226, %r1223, %r1219; - xor.b32 %r1227, %r1224, %r1220; - cvt.u64.u32 %rd532, %r1227; - cvt.u64.u32 %rd533, %r1225; - and.b64 %rd534, %rd531, 4294967295; - cvt.u64.u32 %rd535, %r1226; - bfi.b64 %rd536, %rd532, %rd535, 32, 32; - bfi.b64 %rd537, %rd533, %rd534, 32, 32; - mov.b64 {%r1228, %r1229}, %rd537; - mov.b64 {%r1230, %r1231}, %rd536; - mov.b64 {%r1232, %r1233}, %rd530; - mov.b64 {%r1234, %r1235}, %rd529; - shf.l.wrap.b32 %r1236, %r787, %r787, 25; - shf.l.wrap.b32 %r1237, %r787, %r787, 14; - xor.b32 %r1238, %r1237, %r1236; - xor.b32 %r1239, %r1238, %r1216; - xor.b32 %r1240, %r1229, %r1233; - xor.b32 %r1241, %r1230, %r1234; - xor.b32 %r1242, %r1231, %r1235; - cvt.u64.u32 %rd538, %r825; - cvt.u64.u32 %rd539, %r824; - cvt.u64.u32 %rd540, %r1058; - bfi.b64 %rd541, %rd354, %rd540, 32, 32; - bfi.b64 %rd542, %rd538, %rd539, 32, 32; - mov.b64 {%r1243, %r1244}, %rd541; - mov.b64 {%r1245, %r1246}, %rd542; - shf.r.wrap.b32 %r1247, %r1056, %r1056, 17; - shf.r.wrap.b32 %r1248, %r1056, %r1056, 19; - xor.b32 %r1249, %r1247, %r1248; - shr.u32 %r1250, %r1056, 10; - xor.b32 %r1251, %r1249, %r1250; - add.s32 %r1252, %r1242, %r456; - add.s32 %r1253, %r1252, %r1251; - add.s32 %r1254, 
%r1253, %r1246; - shf.r.wrap.b32 %r1255, %r1055, %r1055, 17; - shf.r.wrap.b32 %r1256, %r1055, %r1055, 19; - xor.b32 %r1257, %r1255, %r1256; - shr.u32 %r1258, %r1055, 10; - xor.b32 %r1259, %r1257, %r1258; - add.s32 %r1260, %r1241, %r455; - add.s32 %r1261, %r1260, %r1259; - add.s32 %r1262, %r1261, %r1245; - shf.r.wrap.b32 %r1263, %r1254, %r1254, 17; - shf.r.wrap.b32 %r1264, %r1254, %r1254, 19; - xor.b32 %r1265, %r1263, %r1264; - shr.u32 %r1266, %r1254, 10; - xor.b32 %r1267, %r1265, %r1266; - add.s32 %r1268, %r1240, %r454; - add.s32 %r1269, %r1268, %r1244; - add.s32 %r1270, %r1269, %r1267; - shf.r.wrap.b32 %r1271, %r1262, %r1262, 17; - shf.r.wrap.b32 %r1272, %r1262, %r1262, 19; - xor.b32 %r1273, %r1271, %r1272; - shr.u32 %r1274, %r1262, 10; - xor.b32 %r1275, %r1273, %r1274; - add.s32 %r1276, %r1239, %r453; - add.s32 %r1277, %r1276, %r1243; - add.s32 %r1278, %r1277, %r1275; - cvt.u64.u32 %rd543, %r1254; - cvt.u64.u32 %rd544, %r1262; - cvt.u64.u32 %rd545, %r1270; - cvt.u64.u32 %rd546, %r1278; - bfi.b64 %rd547, %rd545, %rd546, 32, 32; - bfi.b64 %rd548, %rd543, %rd544, 32, 32; - mov.b64 {%r1279, %r1280}, %rd547; - mov.b64 {%r1281, %r1282}, %rd548; - cvt.u64.u32 %rd549, %r1282; - cvt.u64.u32 %rd550, %r1280; - cvt.u64.u32 %rd551, %r1281; - bfi.b64 %rd552, %rd549, %rd551, 32, 32; - bfi.b64 %rd553, %rd550, %rd546, 32, 32; - mov.b64 {%r1283, %r1284}, %rd553; - mov.b64 {%r1285, %r1286}, %rd552; - add.s32 %r1287, %r1283, -1084653625; - add.s32 %r1288, %r1284, -1341970488; - add.s32 %r1289, %r1285, -1473132947; - add.s32 %r1290, %r1286, -1740746414; - cvt.u64.u32 %rd554, %r1290; - cvt.u64.u32 %rd555, %r1288; - cvt.u64.u32 %rd556, %r1289; - cvt.u64.u32 %rd557, %r1287; - bfi.b64 %rd558, %rd555, %rd557, 32, 32; - bfi.b64 %rd559, %rd554, %rd556, 32, 32; - cvt.u64.u32 %rd560, %r1176; - cvt.u64.u32 %rd561, %r1174; - cvt.u64.u32 %rd562, %r1175; - bfi.b64 %rd563, %rd561, %rd485, 32, 32; - bfi.b64 %rd564, %rd560, %rd562, 32, 32; - mov.b64 {%r1291, %r1292}, %rd563; - mov.b64 {%r1293, 
%r1294}, %rd564; - mov.b64 {%r1295, %r1296}, %rd559; - shf.r.wrap.b32 %r1297, %r1293, %r1293, 6; - shf.r.wrap.b32 %r1298, %r1293, %r1293, 11; - xor.b32 %r1299, %r1297, %r1298; - shf.r.wrap.b32 %r1300, %r1293, %r1293, 25; - xor.b32 %r1301, %r1299, %r1300; - xor.b32 %r1302, %r1294, %r1123; - and.b32 %r1303, %r1302, %r1293; - xor.b32 %r1304, %r1303, %r1123; - add.s32 %r1305, %r1124, %r1296; - add.s32 %r1306, %r1305, %r1301; - add.s32 %r1307, %r1306, %r1304; - shf.r.wrap.b32 %r1308, %r1291, %r1291, 2; - shf.r.wrap.b32 %r1309, %r1291, %r1291, 13; - xor.b32 %r1310, %r1308, %r1309; - shf.r.wrap.b32 %r1311, %r1291, %r1291, 22; - xor.b32 %r1312, %r1310, %r1311; - and.b32 %r1313, %r1292, %r1291; - and.b32 %r1314, %r1172, %r1114; - xor.b32 %r1315, %r1313, %r1314; - and.b32 %r1316, %r1292, %r1121; - xor.b32 %r1317, %r1315, %r1316; - add.s32 %r1318, %r1317, %r1312; - add.s32 %r1319, %r1318, %r1307; - add.s32 %r1320, %r1307, %r1122; - shf.r.wrap.b32 %r1321, %r1320, %r1320, 6; - shf.r.wrap.b32 %r1322, %r1320, %r1320, 11; - xor.b32 %r1323, %r1321, %r1322; - shf.r.wrap.b32 %r1324, %r1320, %r1320, 25; - xor.b32 %r1325, %r1323, %r1324; - xor.b32 %r1326, %r1294, %r1293; - and.b32 %r1327, %r1320, %r1326; - xor.b32 %r1328, %r1327, %r1294; - add.s32 %r1329, %r1123, %r1295; - add.s32 %r1330, %r1329, %r1328; - add.s32 %r1331, %r1330, %r1325; - shf.r.wrap.b32 %r1332, %r1319, %r1319, 2; - shf.r.wrap.b32 %r1333, %r1319, %r1319, 13; - xor.b32 %r1334, %r1332, %r1333; - shf.r.wrap.b32 %r1335, %r1319, %r1319, 22; - xor.b32 %r1336, %r1334, %r1335; - xor.b32 %r1337, %r1292, %r1291; - and.b32 %r1338, %r1319, %r1337; - xor.b32 %r1339, %r1338, %r1313; - add.s32 %r1340, %r1336, %r1339; - add.s32 %r1341, %r1331, %r1121; - cvt.u64.u32 %rd565, %r1320; - cvt.u64.u32 %rd566, %r1341; - cvt.u64.u32 %rd567, %r1319; - add.s32 %r1342, %r1340, %r1331; - cvt.u64.u32 %rd568, %r1342; - bfi.b64 %rd569, %rd567, %rd568, 32, 32; - bfi.b64 %rd570, %rd565, %rd566, 32, 32; - mov.b64 {%r1343, %r1344}, %rd569; - mov.b64 
{%r1345, %r1346}, %rd570; - mov.b64 {%r1347, %r1348}, %rd558; - cvt.u64.u32 %rd571, %r1348; - bfi.b64 %rd572, %rd571, %rd557, 32, 32; - cvt.u64.u32 %rd573, %r1346; - cvt.u64.u32 %rd574, %r1344; - cvt.u64.u32 %rd575, %r1345; - bfi.b64 %rd576, %rd574, %rd568, 32, 32; - bfi.b64 %rd577, %rd573, %rd575, 32, 32; - mov.b64 {%r1349, %r1350}, %rd576; - mov.b64 {%r1351, %r1352}, %rd577; - mov.b64 {%r1353, %r1354}, %rd572; - shf.r.wrap.b32 %r1355, %r1351, %r1351, 6; - shf.r.wrap.b32 %r1356, %r1351, %r1351, 11; - xor.b32 %r1357, %r1355, %r1356; - shf.r.wrap.b32 %r1358, %r1351, %r1351, 25; - xor.b32 %r1359, %r1357, %r1358; - xor.b32 %r1360, %r1352, %r1293; - and.b32 %r1361, %r1360, %r1351; - xor.b32 %r1362, %r1361, %r1293; - add.s32 %r1363, %r1294, %r1354; - add.s32 %r1364, %r1363, %r1359; - add.s32 %r1365, %r1364, %r1362; - shf.r.wrap.b32 %r1366, %r1349, %r1349, 2; - shf.r.wrap.b32 %r1367, %r1349, %r1349, 13; - xor.b32 %r1368, %r1366, %r1367; - shf.r.wrap.b32 %r1369, %r1349, %r1349, 22; - xor.b32 %r1370, %r1368, %r1369; - and.b32 %r1371, %r1350, %r1349; - and.b32 %r1372, %r1342, %r1172; - xor.b32 %r1373, %r1371, %r1372; - and.b32 %r1374, %r1350, %r1291; - xor.b32 %r1375, %r1373, %r1374; - add.s32 %r1376, %r1375, %r1370; - add.s32 %r1377, %r1376, %r1365; - add.s32 %r1378, %r1365, %r1292; - shf.r.wrap.b32 %r1379, %r1378, %r1378, 6; - shf.r.wrap.b32 %r1380, %r1378, %r1378, 11; - xor.b32 %r1381, %r1379, %r1380; - shf.r.wrap.b32 %r1382, %r1378, %r1378, 25; - xor.b32 %r1383, %r1381, %r1382; - xor.b32 %r1384, %r1352, %r1351; - and.b32 %r1385, %r1378, %r1384; - xor.b32 %r1386, %r1385, %r1352; - add.s32 %r1387, %r1293, %r1353; - add.s32 %r1388, %r1387, %r1386; - add.s32 %r1389, %r1388, %r1383; - shf.r.wrap.b32 %r1390, %r1377, %r1377, 2; - shf.r.wrap.b32 %r1391, %r1377, %r1377, 13; - xor.b32 %r1392, %r1390, %r1391; - shf.r.wrap.b32 %r1393, %r1377, %r1377, 22; - xor.b32 %r1394, %r1392, %r1393; - xor.b32 %r1395, %r1350, %r1349; - and.b32 %r1396, %r1377, %r1395; - xor.b32 %r1397, %r1396, 
%r1371; - add.s32 %r1398, %r1394, %r1397; - add.s32 %r1399, %r1389, %r1291; - cvt.u64.u32 %rd578, %r1378; - cvt.u64.u32 %rd579, %r1399; - cvt.u64.u32 %rd580, %r1377; - add.s32 %r1400, %r1398, %r1389; - cvt.u64.u32 %rd581, %r1400; - bfi.b64 %rd582, %rd580, %rd581, 32, 32; - bfi.b64 %rd583, %rd578, %rd579, 32, 32; - mov.b64 {%r1401, %r1402}, %rd582; - mov.b64 {%r1403, %r1404}, %rd583; - shr.u32 %r1405, %r1016, 7; - shr.u32 %r1406, %r1017, 7; - shr.u32 %r1407, %r1018, 7; - cvt.u64.u32 %rd584, %r1407; - cvt.u64.u32 %rd585, %r1405; - shr.u32 %r1408, %r1015, 7; - cvt.u64.u32 %rd586, %r1408; - cvt.u64.u32 %rd587, %r1406; - bfi.b64 %rd588, %rd585, %rd586, 32, 32; - bfi.b64 %rd589, %rd584, %rd587, 32, 32; - shl.b32 %r1409, %r1016, 25; - shl.b32 %r1410, %r1017, 25; - cvt.u64.u32 %rd590, %r1409; - shl.b32 %r1411, %r1015, 25; - cvt.u64.u32 %rd591, %r1411; - cvt.u64.u32 %rd592, %r1410; - bfi.b64 %rd593, %rd590, %rd591, 32, 32; - cvt.u64.u32 %rd594, %r1018; - bfi.b64 %rd595, %rd594, %rd592, 57, 7; - mov.b64 {%r1412, %r1413}, %rd588; - mov.b64 {%r1414, %r1415}, %rd589; - mov.b64 {%r1416, %r1417}, %rd593; - mov.b64 {%r1418, %r1419}, %rd595; - or.b64 %rd596, %rd593, %rd588; - or.b32 %r1420, %r1417, %r1413; - or.b32 %r1421, %r1418, %r1414; - or.b32 %r1422, %r1419, %r1415; - cvt.u64.u32 %rd597, %r1422; - cvt.u64.u32 %rd598, %r1420; - and.b64 %rd599, %rd596, 4294967295; - cvt.u64.u32 %rd600, %r1421; - bfi.b64 %rd601, %rd598, %rd599, 32, 32; - bfi.b64 %rd602, %rd597, %rd600, 32, 32; - shr.u32 %r1423, %r1016, 18; - shr.u32 %r1424, %r1017, 18; - shr.u32 %r1425, %r1018, 18; - cvt.u64.u32 %rd603, %r1425; - cvt.u64.u32 %rd604, %r1423; - shr.u32 %r1426, %r1015, 18; - cvt.u64.u32 %rd605, %r1426; - cvt.u64.u32 %rd606, %r1424; - bfi.b64 %rd607, %rd604, %rd605, 32, 32; - bfi.b64 %rd608, %rd603, %rd606, 32, 32; - shl.b32 %r1427, %r1016, 14; - shl.b32 %r1428, %r1017, 14; - cvt.u64.u32 %rd609, %r1427; - shl.b32 %r1429, %r1015, 14; - cvt.u64.u32 %rd610, %r1429; - cvt.u64.u32 %rd611, %r1428; - 
bfi.b64 %rd612, %rd609, %rd610, 32, 32; - bfi.b64 %rd613, %rd594, %rd611, 46, 18; - mov.b64 {%r1430, %r1431}, %rd607; - mov.b64 {%r1432, %r1433}, %rd608; - mov.b64 {%r1434, %r1435}, %rd612; - mov.b64 {%r1436, %r1437}, %rd613; - or.b64 %rd614, %rd612, %rd607; - or.b32 %r1438, %r1435, %r1431; - or.b32 %r1439, %r1436, %r1432; - or.b32 %r1440, %r1437, %r1433; - cvt.u64.u32 %rd615, %r1440; - cvt.u64.u32 %rd616, %r1438; - and.b64 %rd617, %rd614, 4294967295; - cvt.u64.u32 %rd618, %r1439; - bfi.b64 %rd619, %rd616, %rd617, 32, 32; - bfi.b64 %rd620, %rd615, %rd618, 32, 32; - shr.u32 %r1441, %r1016, 3; - shr.u32 %r1442, %r1017, 3; - shr.u32 %r1443, %r1018, 3; - cvt.u64.u32 %rd621, %r1443; - cvt.u64.u32 %rd622, %r1441; - shr.u32 %r1444, %r1015, 3; - cvt.u64.u32 %rd623, %r1444; - cvt.u64.u32 %rd624, %r1442; - bfi.b64 %rd625, %rd622, %rd623, 32, 32; - bfi.b64 %rd626, %rd621, %rd624, 32, 32; - mov.b64 {%r1445, %r1446}, %rd601; - mov.b64 {%r1447, %r1448}, %rd602; - mov.b64 {%r1449, %r1450}, %rd619; - mov.b64 {%r1451, %r1452}, %rd620; - xor.b64 %rd627, %rd619, %rd601; - xor.b32 %r1453, %r1450, %r1446; - xor.b32 %r1454, %r1451, %r1447; - xor.b32 %r1455, %r1452, %r1448; - cvt.u64.u32 %rd628, %r1455; - cvt.u64.u32 %rd629, %r1453; - and.b64 %rd630, %rd627, 4294967295; - cvt.u64.u32 %rd631, %r1454; - bfi.b64 %rd632, %rd629, %rd630, 32, 32; - bfi.b64 %rd633, %rd628, %rd631, 32, 32; - mov.b64 {%r1456, %r1457}, %rd632; - mov.b64 {%r1458, %r1459}, %rd633; - mov.b64 {%r1460, %r1461}, %rd625; - mov.b64 {%r1462, %r1463}, %rd626; - shf.l.wrap.b32 %r1464, %r1015, %r1015, 25; - shf.l.wrap.b32 %r1465, %r1015, %r1015, 14; - xor.b32 %r1466, %r1465, %r1464; - xor.b32 %r1467, %r1466, %r1444; - xor.b32 %r1468, %r1457, %r1461; - xor.b32 %r1469, %r1458, %r1462; - xor.b32 %r1470, %r1459, %r1463; - cvt.u64.u32 %rd634, %r1057; - cvt.u64.u32 %rd635, %r1056; - cvt.u64.u32 %rd636, %r1286; - bfi.b64 %rd637, %rd450, %rd636, 32, 32; - bfi.b64 %rd638, %rd634, %rd635, 32, 32; - mov.b64 {%r1471, %r1472}, %rd637; - 
mov.b64 {%r1473, %r1474}, %rd638; - shf.r.wrap.b32 %r1475, %r1284, %r1284, 17; - shf.r.wrap.b32 %r1476, %r1284, %r1284, 19; - xor.b32 %r1477, %r1475, %r1476; - shr.u32 %r1478, %r1284, 10; - xor.b32 %r1479, %r1477, %r1478; - add.s32 %r1480, %r1470, %r598; - add.s32 %r1481, %r1480, %r1479; - add.s32 %r1482, %r1481, %r1474; - shf.r.wrap.b32 %r1483, %r1283, %r1283, 17; - shf.r.wrap.b32 %r1484, %r1283, %r1283, 19; - xor.b32 %r1485, %r1483, %r1484; - shr.u32 %r1486, %r1283, 10; - xor.b32 %r1487, %r1485, %r1486; - add.s32 %r1488, %r1469, %r597; - add.s32 %r1489, %r1488, %r1487; - add.s32 %r1490, %r1489, %r1473; - shf.r.wrap.b32 %r1491, %r1482, %r1482, 17; - shf.r.wrap.b32 %r1492, %r1482, %r1482, 19; - xor.b32 %r1493, %r1491, %r1492; - shr.u32 %r1494, %r1482, 10; - xor.b32 %r1495, %r1493, %r1494; - add.s32 %r1496, %r1468, %r596; - add.s32 %r1497, %r1496, %r1472; - add.s32 %r1498, %r1497, %r1495; - shf.r.wrap.b32 %r1499, %r1490, %r1490, 17; - shf.r.wrap.b32 %r1500, %r1490, %r1490, 19; - xor.b32 %r1501, %r1499, %r1500; - shr.u32 %r1502, %r1490, 10; - xor.b32 %r1503, %r1501, %r1502; - add.s32 %r1504, %r1467, %r595; - add.s32 %r1505, %r1504, %r1471; - add.s32 %r1506, %r1505, %r1503; - cvt.u64.u32 %rd639, %r1482; - cvt.u64.u32 %rd640, %r1490; - cvt.u64.u32 %rd641, %r1498; - cvt.u64.u32 %rd642, %r1506; - bfi.b64 %rd643, %rd641, %rd642, 32, 32; - bfi.b64 %rd644, %rd639, %rd640, 32, 32; - mov.b64 {%r1507, %r1508}, %rd643; - mov.b64 {%r1509, %r1510}, %rd644; - cvt.u64.u32 %rd645, %r1510; - cvt.u64.u32 %rd646, %r1508; - cvt.u64.u32 %rd647, %r1509; - bfi.b64 %rd648, %rd645, %rd647, 32, 32; - bfi.b64 %rd649, %rd646, %rd642, 32, 32; - mov.b64 {%r1511, %r1512}, %rd649; - mov.b64 {%r1513, %r1514}, %rd648; - add.s32 %r1515, %r1511, 338241895; - add.s32 %r1516, %r1512, 113926993; - add.s32 %r1517, %r1513, -710438585; - add.s32 %r1518, %r1514, -958395405; - cvt.u64.u32 %rd650, %r1518; - cvt.u64.u32 %rd651, %r1516; - cvt.u64.u32 %rd652, %r1517; - cvt.u64.u32 %rd653, %r1515; - bfi.b64 %rd654, 
%rd651, %rd653, 32, 32; - bfi.b64 %rd655, %rd650, %rd652, 32, 32; - cvt.u64.u32 %rd656, %r1404; - cvt.u64.u32 %rd657, %r1402; - cvt.u64.u32 %rd658, %r1403; - bfi.b64 %rd659, %rd657, %rd581, 32, 32; - bfi.b64 %rd660, %rd656, %rd658, 32, 32; - mov.b64 {%r1519, %r1520}, %rd659; - mov.b64 {%r1521, %r1522}, %rd660; - mov.b64 {%r1523, %r1524}, %rd655; - shf.r.wrap.b32 %r1525, %r1521, %r1521, 6; - shf.r.wrap.b32 %r1526, %r1521, %r1521, 11; - xor.b32 %r1527, %r1525, %r1526; - shf.r.wrap.b32 %r1528, %r1521, %r1521, 25; - xor.b32 %r1529, %r1527, %r1528; - xor.b32 %r1530, %r1522, %r1351; - and.b32 %r1531, %r1530, %r1521; - xor.b32 %r1532, %r1531, %r1351; - add.s32 %r1533, %r1352, %r1524; - add.s32 %r1534, %r1533, %r1529; - add.s32 %r1535, %r1534, %r1532; - shf.r.wrap.b32 %r1536, %r1519, %r1519, 2; - shf.r.wrap.b32 %r1537, %r1519, %r1519, 13; - xor.b32 %r1538, %r1536, %r1537; - shf.r.wrap.b32 %r1539, %r1519, %r1519, 22; - xor.b32 %r1540, %r1538, %r1539; - and.b32 %r1541, %r1520, %r1519; - and.b32 %r1542, %r1400, %r1342; - xor.b32 %r1543, %r1541, %r1542; - and.b32 %r1544, %r1520, %r1349; - xor.b32 %r1545, %r1543, %r1544; - add.s32 %r1546, %r1545, %r1540; - add.s32 %r1547, %r1546, %r1535; - add.s32 %r1548, %r1535, %r1350; - shf.r.wrap.b32 %r1549, %r1548, %r1548, 6; - shf.r.wrap.b32 %r1550, %r1548, %r1548, 11; - xor.b32 %r1551, %r1549, %r1550; - shf.r.wrap.b32 %r1552, %r1548, %r1548, 25; - xor.b32 %r1553, %r1551, %r1552; - xor.b32 %r1554, %r1522, %r1521; - and.b32 %r1555, %r1548, %r1554; - xor.b32 %r1556, %r1555, %r1522; - add.s32 %r1557, %r1351, %r1523; - add.s32 %r1558, %r1557, %r1556; - add.s32 %r1559, %r1558, %r1553; - shf.r.wrap.b32 %r1560, %r1547, %r1547, 2; - shf.r.wrap.b32 %r1561, %r1547, %r1547, 13; - xor.b32 %r1562, %r1560, %r1561; - shf.r.wrap.b32 %r1563, %r1547, %r1547, 22; - xor.b32 %r1564, %r1562, %r1563; - xor.b32 %r1565, %r1520, %r1519; - and.b32 %r1566, %r1547, %r1565; - xor.b32 %r1567, %r1566, %r1541; - add.s32 %r1568, %r1564, %r1567; - add.s32 %r1569, %r1559, 
%r1349; - cvt.u64.u32 %rd661, %r1548; - cvt.u64.u32 %rd662, %r1569; - cvt.u64.u32 %rd663, %r1547; - add.s32 %r1570, %r1568, %r1559; - cvt.u64.u32 %rd664, %r1570; - bfi.b64 %rd665, %rd663, %rd664, 32, 32; - bfi.b64 %rd666, %rd661, %rd662, 32, 32; - mov.b64 {%r1571, %r1572}, %rd665; - mov.b64 {%r1573, %r1574}, %rd666; - mov.b64 {%r1575, %r1576}, %rd654; - cvt.u64.u32 %rd667, %r1576; - bfi.b64 %rd668, %rd667, %rd653, 32, 32; - cvt.u64.u32 %rd669, %r1574; - cvt.u64.u32 %rd670, %r1572; - cvt.u64.u32 %rd671, %r1573; - bfi.b64 %rd672, %rd670, %rd664, 32, 32; - bfi.b64 %rd673, %rd669, %rd671, 32, 32; - mov.b64 {%r1577, %r1578}, %rd672; - mov.b64 {%r1579, %r1580}, %rd673; - mov.b64 {%r1581, %r1582}, %rd668; - shf.r.wrap.b32 %r1583, %r1579, %r1579, 6; - shf.r.wrap.b32 %r1584, %r1579, %r1579, 11; - xor.b32 %r1585, %r1583, %r1584; - shf.r.wrap.b32 %r1586, %r1579, %r1579, 25; - xor.b32 %r1587, %r1585, %r1586; - xor.b32 %r1588, %r1580, %r1521; - and.b32 %r1589, %r1588, %r1579; - xor.b32 %r1590, %r1589, %r1521; - add.s32 %r1591, %r1522, %r1582; - add.s32 %r1592, %r1591, %r1587; - add.s32 %r1593, %r1592, %r1590; - shf.r.wrap.b32 %r1594, %r1577, %r1577, 2; - shf.r.wrap.b32 %r1595, %r1577, %r1577, 13; - xor.b32 %r1596, %r1594, %r1595; - shf.r.wrap.b32 %r1597, %r1577, %r1577, 22; - xor.b32 %r1598, %r1596, %r1597; - and.b32 %r1599, %r1578, %r1577; - and.b32 %r1600, %r1570, %r1400; - xor.b32 %r1601, %r1599, %r1600; - and.b32 %r1602, %r1578, %r1519; - xor.b32 %r1603, %r1601, %r1602; - add.s32 %r1604, %r1603, %r1598; - add.s32 %r1605, %r1604, %r1593; - add.s32 %r1606, %r1593, %r1520; - shf.r.wrap.b32 %r1607, %r1606, %r1606, 6; - shf.r.wrap.b32 %r1608, %r1606, %r1606, 11; - xor.b32 %r1609, %r1607, %r1608; - shf.r.wrap.b32 %r1610, %r1606, %r1606, 25; - xor.b32 %r1611, %r1609, %r1610; - xor.b32 %r1612, %r1580, %r1579; - and.b32 %r1613, %r1606, %r1612; - xor.b32 %r1614, %r1613, %r1580; - add.s32 %r1615, %r1521, %r1581; - add.s32 %r1616, %r1615, %r1614; - add.s32 %r1617, %r1616, %r1611; - 
shf.r.wrap.b32 %r1618, %r1605, %r1605, 2; - shf.r.wrap.b32 %r1619, %r1605, %r1605, 13; - xor.b32 %r1620, %r1618, %r1619; - shf.r.wrap.b32 %r1621, %r1605, %r1605, 22; - xor.b32 %r1622, %r1620, %r1621; - xor.b32 %r1623, %r1578, %r1577; - and.b32 %r1624, %r1605, %r1623; - xor.b32 %r1625, %r1624, %r1599; - add.s32 %r1626, %r1622, %r1625; - add.s32 %r1627, %r1617, %r1519; - cvt.u64.u32 %rd674, %r1606; - cvt.u64.u32 %rd675, %r1627; - cvt.u64.u32 %rd676, %r1605; - add.s32 %r1628, %r1626, %r1617; - cvt.u64.u32 %rd677, %r1628; - bfi.b64 %rd678, %rd676, %rd677, 32, 32; - bfi.b64 %rd679, %rd674, %rd675, 32, 32; - mov.b64 {%r1629, %r1630}, %rd678; - mov.b64 {%r1631, %r1632}, %rd679; - shr.u32 %r1633, %r1244, 7; - shr.u32 %r1634, %r1245, 7; - shr.u32 %r1635, %r1246, 7; - cvt.u64.u32 %rd680, %r1635; - cvt.u64.u32 %rd681, %r1633; - shr.u32 %r1636, %r1243, 7; - cvt.u64.u32 %rd682, %r1636; - cvt.u64.u32 %rd683, %r1634; - bfi.b64 %rd684, %rd681, %rd682, 32, 32; - bfi.b64 %rd685, %rd680, %rd683, 32, 32; - shl.b32 %r1637, %r1244, 25; - shl.b32 %r1638, %r1245, 25; - cvt.u64.u32 %rd686, %r1637; - shl.b32 %r1639, %r1243, 25; - cvt.u64.u32 %rd687, %r1639; - cvt.u64.u32 %rd688, %r1638; - bfi.b64 %rd689, %rd686, %rd687, 32, 32; - cvt.u64.u32 %rd690, %r1246; - bfi.b64 %rd691, %rd690, %rd688, 57, 7; - mov.b64 {%r1640, %r1641}, %rd684; - mov.b64 {%r1642, %r1643}, %rd685; - mov.b64 {%r1644, %r1645}, %rd689; - mov.b64 {%r1646, %r1647}, %rd691; - or.b64 %rd692, %rd689, %rd684; - or.b32 %r1648, %r1645, %r1641; - or.b32 %r1649, %r1646, %r1642; - or.b32 %r1650, %r1647, %r1643; - cvt.u64.u32 %rd693, %r1650; - cvt.u64.u32 %rd694, %r1648; - and.b64 %rd695, %rd692, 4294967295; - cvt.u64.u32 %rd696, %r1649; - bfi.b64 %rd697, %rd694, %rd695, 32, 32; - bfi.b64 %rd698, %rd693, %rd696, 32, 32; - shr.u32 %r1651, %r1244, 18; - shr.u32 %r1652, %r1245, 18; - shr.u32 %r1653, %r1246, 18; - cvt.u64.u32 %rd699, %r1653; - cvt.u64.u32 %rd700, %r1651; - shr.u32 %r1654, %r1243, 18; - cvt.u64.u32 %rd701, %r1654; - 
cvt.u64.u32 %rd702, %r1652; - bfi.b64 %rd703, %rd700, %rd701, 32, 32; - bfi.b64 %rd704, %rd699, %rd702, 32, 32; - shl.b32 %r1655, %r1244, 14; - shl.b32 %r1656, %r1245, 14; - cvt.u64.u32 %rd705, %r1655; - shl.b32 %r1657, %r1243, 14; - cvt.u64.u32 %rd706, %r1657; - cvt.u64.u32 %rd707, %r1656; - bfi.b64 %rd708, %rd705, %rd706, 32, 32; - bfi.b64 %rd709, %rd690, %rd707, 46, 18; - mov.b64 {%r1658, %r1659}, %rd703; - mov.b64 {%r1660, %r1661}, %rd704; - mov.b64 {%r1662, %r1663}, %rd708; - mov.b64 {%r1664, %r1665}, %rd709; - or.b64 %rd710, %rd708, %rd703; - or.b32 %r1666, %r1663, %r1659; - or.b32 %r1667, %r1664, %r1660; - or.b32 %r1668, %r1665, %r1661; - cvt.u64.u32 %rd711, %r1668; - cvt.u64.u32 %rd712, %r1666; - and.b64 %rd713, %rd710, 4294967295; - cvt.u64.u32 %rd714, %r1667; - bfi.b64 %rd715, %rd712, %rd713, 32, 32; - bfi.b64 %rd716, %rd711, %rd714, 32, 32; - shr.u32 %r1669, %r1244, 3; - shr.u32 %r1670, %r1245, 3; - shr.u32 %r1671, %r1246, 3; - cvt.u64.u32 %rd717, %r1671; - cvt.u64.u32 %rd718, %r1669; - shr.u32 %r1672, %r1243, 3; - cvt.u64.u32 %rd719, %r1672; - cvt.u64.u32 %rd720, %r1670; - bfi.b64 %rd721, %rd718, %rd719, 32, 32; - bfi.b64 %rd722, %rd717, %rd720, 32, 32; - mov.b64 {%r1673, %r1674}, %rd697; - mov.b64 {%r1675, %r1676}, %rd698; - mov.b64 {%r1677, %r1678}, %rd715; - mov.b64 {%r1679, %r1680}, %rd716; - xor.b64 %rd723, %rd715, %rd697; - xor.b32 %r1681, %r1678, %r1674; - xor.b32 %r1682, %r1679, %r1675; - xor.b32 %r1683, %r1680, %r1676; - cvt.u64.u32 %rd724, %r1683; - cvt.u64.u32 %rd725, %r1681; - and.b64 %rd726, %rd723, 4294967295; - cvt.u64.u32 %rd727, %r1682; - bfi.b64 %rd728, %rd725, %rd726, 32, 32; - bfi.b64 %rd729, %rd724, %rd727, 32, 32; - mov.b64 {%r1684, %r1685}, %rd728; - mov.b64 {%r1686, %r1687}, %rd729; - mov.b64 {%r1688, %r1689}, %rd721; - mov.b64 {%r1690, %r1691}, %rd722; - shf.l.wrap.b32 %r1692, %r1243, %r1243, 25; - shf.l.wrap.b32 %r1693, %r1243, %r1243, 14; - xor.b32 %r1694, %r1693, %r1692; - xor.b32 %r1695, %r1694, %r1672; - xor.b32 %r1696, 
%r1685, %r1689; - xor.b32 %r1697, %r1686, %r1690; - xor.b32 %r1698, %r1687, %r1691; - cvt.u64.u32 %rd730, %r1285; - cvt.u64.u32 %rd731, %r1284; - cvt.u64.u32 %rd732, %r1514; - bfi.b64 %rd733, %rd546, %rd732, 32, 32; - bfi.b64 %rd734, %rd730, %rd731, 32, 32; - mov.b64 {%r1699, %r1700}, %rd733; - mov.b64 {%r1701, %r1702}, %rd734; - shf.r.wrap.b32 %r1703, %r1512, %r1512, 17; - shf.r.wrap.b32 %r1704, %r1512, %r1512, 19; - xor.b32 %r1705, %r1703, %r1704; - shr.u32 %r1706, %r1512, 10; - xor.b32 %r1707, %r1705, %r1706; - add.s32 %r1708, %r1698, %r826; - add.s32 %r1709, %r1708, %r1707; - add.s32 %r1710, %r1709, %r1702; - shf.r.wrap.b32 %r1711, %r1511, %r1511, 17; - shf.r.wrap.b32 %r1712, %r1511, %r1511, 19; - xor.b32 %r1713, %r1711, %r1712; - shr.u32 %r1714, %r1511, 10; - xor.b32 %r1715, %r1713, %r1714; - add.s32 %r1716, %r1697, %r825; - add.s32 %r1717, %r1716, %r1715; - add.s32 %r1718, %r1717, %r1701; - shf.r.wrap.b32 %r1719, %r1710, %r1710, 17; - shf.r.wrap.b32 %r1720, %r1710, %r1710, 19; - xor.b32 %r1721, %r1719, %r1720; - shr.u32 %r1722, %r1710, 10; - xor.b32 %r1723, %r1721, %r1722; - add.s32 %r1724, %r1696, %r824; - add.s32 %r1725, %r1724, %r1700; - add.s32 %r1726, %r1725, %r1723; - shf.r.wrap.b32 %r1727, %r1718, %r1718, 17; - shf.r.wrap.b32 %r1728, %r1718, %r1718, 19; - xor.b32 %r1729, %r1727, %r1728; - shr.u32 %r1730, %r1718, 10; - xor.b32 %r1731, %r1729, %r1730; - add.s32 %r1732, %r1695, %r823; - add.s32 %r1733, %r1732, %r1699; - add.s32 %r1734, %r1733, %r1731; - cvt.u64.u32 %rd735, %r1710; - cvt.u64.u32 %rd736, %r1718; - cvt.u64.u32 %rd737, %r1726; - cvt.u64.u32 %rd738, %r1734; - bfi.b64 %rd739, %rd737, %rd738, 32, 32; - bfi.b64 %rd740, %rd735, %rd736, 32, 32; - mov.b64 {%r1735, %r1736}, %rd739; - mov.b64 {%r1737, %r1738}, %rd740; - cvt.u64.u32 %rd741, %r1738; - cvt.u64.u32 %rd742, %r1736; - cvt.u64.u32 %rd743, %r1737; - bfi.b64 %rd744, %rd741, %rd743, 32, 32; - bfi.b64 %rd745, %rd742, %rd738, 32, 32; - mov.b64 {%r1739, %r1740}, %rd745; - mov.b64 {%r1741, %r1742}, 
%rd744; - add.s32 %r1743, %r1739, 1396182291; - add.s32 %r1744, %r1740, 1294757372; - add.s32 %r1745, %r1741, 773529912; - add.s32 %r1746, %r1742, 666307205; - cvt.u64.u32 %rd746, %r1746; - cvt.u64.u32 %rd747, %r1744; - cvt.u64.u32 %rd748, %r1745; - cvt.u64.u32 %rd749, %r1743; - bfi.b64 %rd750, %rd747, %rd749, 32, 32; - bfi.b64 %rd751, %rd746, %rd748, 32, 32; - cvt.u64.u32 %rd752, %r1632; - cvt.u64.u32 %rd753, %r1630; - cvt.u64.u32 %rd754, %r1631; - bfi.b64 %rd755, %rd753, %rd677, 32, 32; - bfi.b64 %rd756, %rd752, %rd754, 32, 32; - mov.b64 {%r1747, %r1748}, %rd755; - mov.b64 {%r1749, %r1750}, %rd756; - mov.b64 {%r1751, %r1752}, %rd751; - shf.r.wrap.b32 %r1753, %r1749, %r1749, 6; - shf.r.wrap.b32 %r1754, %r1749, %r1749, 11; - xor.b32 %r1755, %r1753, %r1754; - shf.r.wrap.b32 %r1756, %r1749, %r1749, 25; - xor.b32 %r1757, %r1755, %r1756; - xor.b32 %r1758, %r1750, %r1579; - and.b32 %r1759, %r1758, %r1749; - xor.b32 %r1760, %r1759, %r1579; - add.s32 %r1761, %r1580, %r1752; - add.s32 %r1762, %r1761, %r1757; - add.s32 %r1763, %r1762, %r1760; - shf.r.wrap.b32 %r1764, %r1747, %r1747, 2; - shf.r.wrap.b32 %r1765, %r1747, %r1747, 13; - xor.b32 %r1766, %r1764, %r1765; - shf.r.wrap.b32 %r1767, %r1747, %r1747, 22; - xor.b32 %r1768, %r1766, %r1767; - and.b32 %r1769, %r1748, %r1747; - and.b32 %r1770, %r1628, %r1570; - xor.b32 %r1771, %r1769, %r1770; - and.b32 %r1772, %r1748, %r1577; - xor.b32 %r1773, %r1771, %r1772; - add.s32 %r1774, %r1773, %r1768; - add.s32 %r1775, %r1774, %r1763; - add.s32 %r1776, %r1763, %r1578; - shf.r.wrap.b32 %r1777, %r1776, %r1776, 6; - shf.r.wrap.b32 %r1778, %r1776, %r1776, 11; - xor.b32 %r1779, %r1777, %r1778; - shf.r.wrap.b32 %r1780, %r1776, %r1776, 25; - xor.b32 %r1781, %r1779, %r1780; - xor.b32 %r1782, %r1750, %r1749; - and.b32 %r1783, %r1776, %r1782; - xor.b32 %r1784, %r1783, %r1750; - add.s32 %r1785, %r1579, %r1751; - add.s32 %r1786, %r1785, %r1784; - add.s32 %r1787, %r1786, %r1781; - shf.r.wrap.b32 %r1788, %r1775, %r1775, 2; - shf.r.wrap.b32 %r1789, 
%r1775, %r1775, 13; - xor.b32 %r1790, %r1788, %r1789; - shf.r.wrap.b32 %r1791, %r1775, %r1775, 22; - xor.b32 %r1792, %r1790, %r1791; - xor.b32 %r1793, %r1748, %r1747; - and.b32 %r1794, %r1775, %r1793; - xor.b32 %r1795, %r1794, %r1769; - add.s32 %r1796, %r1792, %r1795; - add.s32 %r1797, %r1787, %r1577; - cvt.u64.u32 %rd757, %r1776; - cvt.u64.u32 %rd758, %r1797; - cvt.u64.u32 %rd759, %r1775; - add.s32 %r1798, %r1796, %r1787; - cvt.u64.u32 %rd760, %r1798; - bfi.b64 %rd761, %rd759, %rd760, 32, 32; - bfi.b64 %rd762, %rd757, %rd758, 32, 32; - mov.b64 {%r1799, %r1800}, %rd761; - mov.b64 {%r1801, %r1802}, %rd762; - mov.b64 {%r1803, %r1804}, %rd750; - cvt.u64.u32 %rd763, %r1804; - bfi.b64 %rd764, %rd763, %rd749, 32, 32; - cvt.u64.u32 %rd765, %r1802; - cvt.u64.u32 %rd766, %r1800; - cvt.u64.u32 %rd767, %r1801; - bfi.b64 %rd768, %rd766, %rd760, 32, 32; - bfi.b64 %rd769, %rd765, %rd767, 32, 32; - mov.b64 {%r1805, %r1806}, %rd768; - mov.b64 {%r1807, %r1808}, %rd769; - mov.b64 {%r1809, %r1810}, %rd764; - shf.r.wrap.b32 %r1811, %r1807, %r1807, 6; - shf.r.wrap.b32 %r1812, %r1807, %r1807, 11; - xor.b32 %r1813, %r1811, %r1812; - shf.r.wrap.b32 %r1814, %r1807, %r1807, 25; - xor.b32 %r1815, %r1813, %r1814; - xor.b32 %r1816, %r1808, %r1749; - and.b32 %r1817, %r1816, %r1807; - xor.b32 %r1818, %r1817, %r1749; - add.s32 %r1819, %r1750, %r1810; - add.s32 %r1820, %r1819, %r1815; - add.s32 %r1821, %r1820, %r1818; - shf.r.wrap.b32 %r1822, %r1805, %r1805, 2; - shf.r.wrap.b32 %r1823, %r1805, %r1805, 13; - xor.b32 %r1824, %r1822, %r1823; - shf.r.wrap.b32 %r1825, %r1805, %r1805, 22; - xor.b32 %r1826, %r1824, %r1825; - and.b32 %r1827, %r1806, %r1805; - and.b32 %r1828, %r1798, %r1628; - xor.b32 %r1829, %r1827, %r1828; - and.b32 %r1830, %r1806, %r1747; - xor.b32 %r1831, %r1829, %r1830; - add.s32 %r1832, %r1831, %r1826; - add.s32 %r1833, %r1832, %r1821; - add.s32 %r1834, %r1821, %r1748; - shf.r.wrap.b32 %r1835, %r1834, %r1834, 6; - shf.r.wrap.b32 %r1836, %r1834, %r1834, 11; - xor.b32 %r1837, %r1835, 
%r1836; - shf.r.wrap.b32 %r1838, %r1834, %r1834, 25; - xor.b32 %r1839, %r1837, %r1838; - xor.b32 %r1840, %r1808, %r1807; - and.b32 %r1841, %r1834, %r1840; - xor.b32 %r1842, %r1841, %r1808; - add.s32 %r1843, %r1749, %r1809; - add.s32 %r1844, %r1843, %r1842; - add.s32 %r1845, %r1844, %r1839; - shf.r.wrap.b32 %r1846, %r1833, %r1833, 2; - shf.r.wrap.b32 %r1847, %r1833, %r1833, 13; - xor.b32 %r1848, %r1846, %r1847; - shf.r.wrap.b32 %r1849, %r1833, %r1833, 22; - xor.b32 %r1850, %r1848, %r1849; - xor.b32 %r1851, %r1806, %r1805; - and.b32 %r1852, %r1833, %r1851; - xor.b32 %r1853, %r1852, %r1827; - add.s32 %r1854, %r1850, %r1853; - add.s32 %r1855, %r1845, %r1747; - cvt.u64.u32 %rd770, %r1834; - cvt.u64.u32 %rd771, %r1855; - cvt.u64.u32 %rd772, %r1833; - add.s32 %r1856, %r1854, %r1845; - cvt.u64.u32 %rd773, %r1856; - bfi.b64 %rd774, %rd772, %rd773, 32, 32; - bfi.b64 %rd775, %rd770, %rd771, 32, 32; - mov.b64 {%r1857, %r1858}, %rd774; - mov.b64 {%r1859, %r1860}, %rd775; - shr.u32 %r1861, %r1472, 7; - shr.u32 %r1862, %r1473, 7; - shr.u32 %r1863, %r1474, 7; - cvt.u64.u32 %rd776, %r1863; - cvt.u64.u32 %rd777, %r1861; - shr.u32 %r1864, %r1471, 7; - cvt.u64.u32 %rd778, %r1864; - cvt.u64.u32 %rd779, %r1862; - bfi.b64 %rd780, %rd777, %rd778, 32, 32; - bfi.b64 %rd781, %rd776, %rd779, 32, 32; - shl.b32 %r1865, %r1472, 25; - shl.b32 %r1866, %r1473, 25; - cvt.u64.u32 %rd782, %r1865; - shl.b32 %r1867, %r1471, 25; - cvt.u64.u32 %rd783, %r1867; - cvt.u64.u32 %rd784, %r1866; - bfi.b64 %rd785, %rd782, %rd783, 32, 32; - cvt.u64.u32 %rd786, %r1474; - bfi.b64 %rd787, %rd786, %rd784, 57, 7; - mov.b64 {%r1868, %r1869}, %rd780; - mov.b64 {%r1870, %r1871}, %rd781; - mov.b64 {%r1872, %r1873}, %rd785; - mov.b64 {%r1874, %r1875}, %rd787; - or.b64 %rd788, %rd785, %rd780; - or.b32 %r1876, %r1873, %r1869; - or.b32 %r1877, %r1874, %r1870; - or.b32 %r1878, %r1875, %r1871; - cvt.u64.u32 %rd789, %r1878; - cvt.u64.u32 %rd790, %r1876; - and.b64 %rd791, %rd788, 4294967295; - cvt.u64.u32 %rd792, %r1877; - bfi.b64 
%rd793, %rd790, %rd791, 32, 32; - bfi.b64 %rd794, %rd789, %rd792, 32, 32; - shr.u32 %r1879, %r1472, 18; - shr.u32 %r1880, %r1473, 18; - shr.u32 %r1881, %r1474, 18; - cvt.u64.u32 %rd795, %r1881; - cvt.u64.u32 %rd796, %r1879; - shr.u32 %r1882, %r1471, 18; - cvt.u64.u32 %rd797, %r1882; - cvt.u64.u32 %rd798, %r1880; - bfi.b64 %rd799, %rd796, %rd797, 32, 32; - bfi.b64 %rd800, %rd795, %rd798, 32, 32; - shl.b32 %r1883, %r1472, 14; - shl.b32 %r1884, %r1473, 14; - cvt.u64.u32 %rd801, %r1883; - shl.b32 %r1885, %r1471, 14; - cvt.u64.u32 %rd802, %r1885; - cvt.u64.u32 %rd803, %r1884; - bfi.b64 %rd804, %rd801, %rd802, 32, 32; - bfi.b64 %rd805, %rd786, %rd803, 46, 18; - mov.b64 {%r1886, %r1887}, %rd799; - mov.b64 {%r1888, %r1889}, %rd800; - mov.b64 {%r1890, %r1891}, %rd804; - mov.b64 {%r1892, %r1893}, %rd805; - or.b64 %rd806, %rd804, %rd799; - or.b32 %r1894, %r1891, %r1887; - or.b32 %r1895, %r1892, %r1888; - or.b32 %r1896, %r1893, %r1889; - cvt.u64.u32 %rd807, %r1896; - cvt.u64.u32 %rd808, %r1894; - and.b64 %rd809, %rd806, 4294967295; - cvt.u64.u32 %rd810, %r1895; - bfi.b64 %rd811, %rd808, %rd809, 32, 32; - bfi.b64 %rd812, %rd807, %rd810, 32, 32; - shr.u32 %r1897, %r1472, 3; - shr.u32 %r1898, %r1473, 3; - shr.u32 %r1899, %r1474, 3; - cvt.u64.u32 %rd813, %r1899; - cvt.u64.u32 %rd814, %r1897; - shr.u32 %r1900, %r1471, 3; - cvt.u64.u32 %rd815, %r1900; - cvt.u64.u32 %rd816, %r1898; - bfi.b64 %rd817, %rd814, %rd815, 32, 32; - bfi.b64 %rd818, %rd813, %rd816, 32, 32; - mov.b64 {%r1901, %r1902}, %rd793; - mov.b64 {%r1903, %r1904}, %rd794; - mov.b64 {%r1905, %r1906}, %rd811; - mov.b64 {%r1907, %r1908}, %rd812; - xor.b64 %rd819, %rd811, %rd793; - xor.b32 %r1909, %r1906, %r1902; - xor.b32 %r1910, %r1907, %r1903; - xor.b32 %r1911, %r1908, %r1904; - cvt.u64.u32 %rd820, %r1911; - cvt.u64.u32 %rd821, %r1909; - and.b64 %rd822, %rd819, 4294967295; - cvt.u64.u32 %rd823, %r1910; - bfi.b64 %rd824, %rd821, %rd822, 32, 32; - bfi.b64 %rd825, %rd820, %rd823, 32, 32; - mov.b64 {%r1912, %r1913}, %rd824; - 
mov.b64 {%r1914, %r1915}, %rd825; - mov.b64 {%r1916, %r1917}, %rd817; - mov.b64 {%r1918, %r1919}, %rd818; - shf.l.wrap.b32 %r1920, %r1471, %r1471, 25; - shf.l.wrap.b32 %r1921, %r1471, %r1471, 14; - xor.b32 %r1922, %r1921, %r1920; - xor.b32 %r1923, %r1922, %r1900; - xor.b32 %r1924, %r1913, %r1917; - xor.b32 %r1925, %r1914, %r1918; - xor.b32 %r1926, %r1915, %r1919; - cvt.u64.u32 %rd826, %r1513; - cvt.u64.u32 %rd827, %r1512; - cvt.u64.u32 %rd828, %r1742; - bfi.b64 %rd829, %rd642, %rd828, 32, 32; - bfi.b64 %rd830, %rd826, %rd827, 32, 32; - mov.b64 {%r1927, %r1928}, %rd829; - mov.b64 {%r1929, %r1930}, %rd830; - shf.r.wrap.b32 %r1931, %r1740, %r1740, 17; - shf.r.wrap.b32 %r1932, %r1740, %r1740, 19; - xor.b32 %r1933, %r1931, %r1932; - shr.u32 %r1934, %r1740, 10; - xor.b32 %r1935, %r1933, %r1934; - add.s32 %r1936, %r1926, %r1058; - add.s32 %r1937, %r1936, %r1935; - add.s32 %r1938, %r1937, %r1930; - shf.r.wrap.b32 %r1939, %r1739, %r1739, 17; - shf.r.wrap.b32 %r1940, %r1739, %r1739, 19; - xor.b32 %r1941, %r1939, %r1940; - shr.u32 %r1942, %r1739, 10; - xor.b32 %r1943, %r1941, %r1942; - add.s32 %r1944, %r1925, %r1057; - add.s32 %r1945, %r1944, %r1943; - add.s32 %r1946, %r1945, %r1929; - shf.r.wrap.b32 %r1947, %r1938, %r1938, 17; - shf.r.wrap.b32 %r1948, %r1938, %r1938, 19; - xor.b32 %r1949, %r1947, %r1948; - shr.u32 %r1950, %r1938, 10; - xor.b32 %r1951, %r1949, %r1950; - add.s32 %r1952, %r1924, %r1056; - add.s32 %r1953, %r1952, %r1928; - add.s32 %r1954, %r1953, %r1951; - shf.r.wrap.b32 %r1955, %r1946, %r1946, 17; - shf.r.wrap.b32 %r1956, %r1946, %r1946, 19; - xor.b32 %r1957, %r1955, %r1956; - shr.u32 %r1958, %r1946, 10; - xor.b32 %r1959, %r1957, %r1958; - add.s32 %r1960, %r1923, %r1055; - add.s32 %r1961, %r1960, %r1927; - add.s32 %r1962, %r1961, %r1959; - cvt.u64.u32 %rd831, %r1938; - cvt.u64.u32 %rd832, %r1946; - cvt.u64.u32 %rd833, %r1954; - cvt.u64.u32 %rd834, %r1962; - bfi.b64 %rd835, %rd833, %rd834, 32, 32; - bfi.b64 %rd836, %rd831, %rd832, 32, 32; - mov.b64 {%r1963, 
%r1964}, %rd835; - mov.b64 {%r1965, %r1966}, %rd836; - add.s32 %r1967, %r1963, -1838011259; - add.s32 %r1968, %r1964, -2117940946; - add.s32 %r1969, %r1965, 1986661051; - add.s32 %r1970, %r1966, 1695183700; - cvt.u64.u32 %rd837, %r1970; - cvt.u64.u32 %rd838, %r1968; - cvt.u64.u32 %rd839, %r1969; - cvt.u64.u32 %rd840, %r1967; - bfi.b64 %rd841, %rd838, %rd840, 32, 32; - bfi.b64 %rd842, %rd837, %rd839, 32, 32; - cvt.u64.u32 %rd843, %r1860; - cvt.u64.u32 %rd844, %r1858; - cvt.u64.u32 %rd845, %r1859; - bfi.b64 %rd846, %rd844, %rd773, 32, 32; - bfi.b64 %rd847, %rd843, %rd845, 32, 32; - mov.b64 {%r1971, %r1972}, %rd846; - mov.b64 {%r1973, %r1974}, %rd847; - mov.b64 {%r1975, %r1976}, %rd842; - shf.r.wrap.b32 %r1977, %r1973, %r1973, 6; - shf.r.wrap.b32 %r1978, %r1973, %r1973, 11; - xor.b32 %r1979, %r1977, %r1978; - shf.r.wrap.b32 %r1980, %r1973, %r1973, 25; - xor.b32 %r1981, %r1979, %r1980; - xor.b32 %r1982, %r1974, %r1807; - and.b32 %r1983, %r1982, %r1973; - xor.b32 %r1984, %r1983, %r1807; - add.s32 %r1985, %r1808, %r1976; - add.s32 %r1986, %r1985, %r1981; - add.s32 %r1987, %r1986, %r1984; - shf.r.wrap.b32 %r1988, %r1971, %r1971, 2; - shf.r.wrap.b32 %r1989, %r1971, %r1971, 13; - xor.b32 %r1990, %r1988, %r1989; - shf.r.wrap.b32 %r1991, %r1971, %r1971, 22; - xor.b32 %r1992, %r1990, %r1991; - and.b32 %r1993, %r1972, %r1971; - and.b32 %r1994, %r1856, %r1798; - xor.b32 %r1995, %r1993, %r1994; - and.b32 %r1996, %r1972, %r1805; - xor.b32 %r1997, %r1995, %r1996; - add.s32 %r1998, %r1997, %r1992; - add.s32 %r1999, %r1998, %r1987; - add.s32 %r2000, %r1987, %r1806; - shf.r.wrap.b32 %r2001, %r2000, %r2000, 6; - shf.r.wrap.b32 %r2002, %r2000, %r2000, 11; - xor.b32 %r2003, %r2001, %r2002; - shf.r.wrap.b32 %r2004, %r2000, %r2000, 25; - xor.b32 %r2005, %r2003, %r2004; - xor.b32 %r2006, %r1974, %r1973; - and.b32 %r2007, %r2000, %r2006; - xor.b32 %r2008, %r2007, %r1974; - add.s32 %r2009, %r1807, %r1975; - add.s32 %r2010, %r2009, %r2008; - add.s32 %r2011, %r2010, %r2005; - shf.r.wrap.b32 
%r2012, %r1999, %r1999, 2; - shf.r.wrap.b32 %r2013, %r1999, %r1999, 13; - xor.b32 %r2014, %r2012, %r2013; - shf.r.wrap.b32 %r2015, %r1999, %r1999, 22; - xor.b32 %r2016, %r2014, %r2015; - xor.b32 %r2017, %r1972, %r1971; - and.b32 %r2018, %r1999, %r2017; - xor.b32 %r2019, %r2018, %r1993; - add.s32 %r2020, %r2016, %r2019; - add.s32 %r2021, %r2011, %r1805; - cvt.u64.u32 %rd848, %r2000; - cvt.u64.u32 %rd849, %r2021; - cvt.u64.u32 %rd850, %r1999; - add.s32 %r2022, %r2020, %r2011; - cvt.u64.u32 %rd851, %r2022; - bfi.b64 %rd852, %rd850, %rd851, 32, 32; - bfi.b64 %rd853, %rd848, %rd849, 32, 32; - mov.b64 {%r2023, %r2024}, %rd852; - mov.b64 {%r2025, %r2026}, %rd853; - mov.b64 {%r2027, %r2028}, %rd841; - cvt.u64.u32 %rd854, %r2028; - bfi.b64 %rd855, %rd854, %rd840, 32, 32; - cvt.u64.u32 %rd856, %r2026; - cvt.u64.u32 %rd857, %r2024; - cvt.u64.u32 %rd858, %r2025; - bfi.b64 %rd859, %rd857, %rd851, 32, 32; - bfi.b64 %rd860, %rd856, %rd858, 32, 32; - mov.b64 {%r2029, %r2030}, %rd859; - mov.b64 {%r2031, %r2032}, %rd860; - mov.b64 {%r2033, %r2034}, %rd855; - shf.r.wrap.b32 %r2035, %r2031, %r2031, 6; - shf.r.wrap.b32 %r2036, %r2031, %r2031, 11; - xor.b32 %r2037, %r2035, %r2036; - shf.r.wrap.b32 %r2038, %r2031, %r2031, 25; - xor.b32 %r2039, %r2037, %r2038; - xor.b32 %r2040, %r2032, %r1973; - and.b32 %r2041, %r2040, %r2031; - xor.b32 %r2042, %r2041, %r1973; - add.s32 %r2043, %r1974, %r2034; - add.s32 %r2044, %r2043, %r2039; - add.s32 %r2045, %r2044, %r2042; - shf.r.wrap.b32 %r2046, %r2029, %r2029, 2; - shf.r.wrap.b32 %r2047, %r2029, %r2029, 13; - xor.b32 %r2048, %r2046, %r2047; - shf.r.wrap.b32 %r2049, %r2029, %r2029, 22; - xor.b32 %r2050, %r2048, %r2049; - and.b32 %r2051, %r2030, %r2029; - and.b32 %r2052, %r2022, %r1856; - xor.b32 %r2053, %r2051, %r2052; - and.b32 %r2054, %r2030, %r1971; - xor.b32 %r2055, %r2053, %r2054; - add.s32 %r2056, %r2055, %r2050; - add.s32 %r2057, %r2056, %r2045; - add.s32 %r2058, %r2045, %r1972; - shf.r.wrap.b32 %r2059, %r2058, %r2058, 6; - shf.r.wrap.b32 
%r2060, %r2058, %r2058, 11; - xor.b32 %r2061, %r2059, %r2060; - shf.r.wrap.b32 %r2062, %r2058, %r2058, 25; - xor.b32 %r2063, %r2061, %r2062; - xor.b32 %r2064, %r2032, %r2031; - and.b32 %r2065, %r2058, %r2064; - xor.b32 %r2066, %r2065, %r2032; - add.s32 %r2067, %r1973, %r2033; - add.s32 %r2068, %r2067, %r2066; - add.s32 %r2069, %r2068, %r2063; - shf.r.wrap.b32 %r2070, %r2057, %r2057, 2; - shf.r.wrap.b32 %r2071, %r2057, %r2057, 13; - xor.b32 %r2072, %r2070, %r2071; - shf.r.wrap.b32 %r2073, %r2057, %r2057, 22; - xor.b32 %r2074, %r2072, %r2073; - xor.b32 %r2075, %r2030, %r2029; - and.b32 %r2076, %r2057, %r2075; - xor.b32 %r2077, %r2076, %r2051; - add.s32 %r2078, %r2074, %r2077; - add.s32 %r2079, %r2069, %r1971; - cvt.u64.u32 %rd861, %r2058; - cvt.u64.u32 %rd862, %r2079; - cvt.u64.u32 %rd863, %r2057; - add.s32 %r2080, %r2078, %r2069; - cvt.u64.u32 %rd864, %r2080; - bfi.b64 %rd865, %rd863, %rd864, 32, 32; - bfi.b64 %rd866, %rd861, %rd862, 32, 32; - mov.b64 {%r2081, %r2082}, %rd865; - mov.b64 {%r2083, %r2084}, %rd866; - shr.u32 %r2085, %r1700, 7; - shr.u32 %r2086, %r1701, 7; - shr.u32 %r2087, %r1702, 7; - cvt.u64.u32 %rd867, %r2087; - cvt.u64.u32 %rd868, %r2085; - shr.u32 %r2088, %r1699, 7; - cvt.u64.u32 %rd869, %r2088; - cvt.u64.u32 %rd870, %r2086; - bfi.b64 %rd871, %rd868, %rd869, 32, 32; - bfi.b64 %rd872, %rd867, %rd870, 32, 32; - shl.b32 %r2089, %r1700, 25; - shl.b32 %r2090, %r1701, 25; - cvt.u64.u32 %rd873, %r2089; - shl.b32 %r2091, %r1699, 25; - cvt.u64.u32 %rd874, %r2091; - cvt.u64.u32 %rd875, %r2090; - bfi.b64 %rd876, %rd873, %rd874, 32, 32; - cvt.u64.u32 %rd877, %r1702; - bfi.b64 %rd878, %rd877, %rd875, 57, 7; - mov.b64 {%r2092, %r2093}, %rd871; - mov.b64 {%r2094, %r2095}, %rd872; - mov.b64 {%r2096, %r2097}, %rd876; - mov.b64 {%r2098, %r2099}, %rd878; - or.b64 %rd879, %rd876, %rd871; - or.b32 %r2100, %r2097, %r2093; - or.b32 %r2101, %r2098, %r2094; - or.b32 %r2102, %r2099, %r2095; - cvt.u64.u32 %rd880, %r2102; - cvt.u64.u32 %rd881, %r2100; - and.b64 %rd882, 
%rd879, 4294967295; - cvt.u64.u32 %rd883, %r2101; - bfi.b64 %rd884, %rd881, %rd882, 32, 32; - bfi.b64 %rd885, %rd880, %rd883, 32, 32; - shr.u32 %r2103, %r1700, 18; - shr.u32 %r2104, %r1701, 18; - shr.u32 %r2105, %r1702, 18; - cvt.u64.u32 %rd886, %r2105; - cvt.u64.u32 %rd887, %r2103; - shr.u32 %r2106, %r1699, 18; - cvt.u64.u32 %rd888, %r2106; - cvt.u64.u32 %rd889, %r2104; - bfi.b64 %rd890, %rd887, %rd888, 32, 32; - bfi.b64 %rd891, %rd886, %rd889, 32, 32; - shl.b32 %r2107, %r1700, 14; - shl.b32 %r2108, %r1701, 14; - cvt.u64.u32 %rd892, %r2107; - shl.b32 %r2109, %r1699, 14; - cvt.u64.u32 %rd893, %r2109; - cvt.u64.u32 %rd894, %r2108; - bfi.b64 %rd895, %rd892, %rd893, 32, 32; - bfi.b64 %rd896, %rd877, %rd894, 46, 18; - mov.b64 {%r2110, %r2111}, %rd890; - mov.b64 {%r2112, %r2113}, %rd891; - mov.b64 {%r2114, %r2115}, %rd895; - mov.b64 {%r2116, %r2117}, %rd896; - or.b64 %rd897, %rd895, %rd890; - or.b32 %r2118, %r2115, %r2111; - or.b32 %r2119, %r2116, %r2112; - or.b32 %r2120, %r2117, %r2113; - cvt.u64.u32 %rd898, %r2120; - cvt.u64.u32 %rd899, %r2118; - and.b64 %rd900, %rd897, 4294967295; - cvt.u64.u32 %rd901, %r2119; - bfi.b64 %rd902, %rd899, %rd900, 32, 32; - bfi.b64 %rd903, %rd898, %rd901, 32, 32; - shr.u32 %r2121, %r1700, 3; - shr.u32 %r2122, %r1701, 3; - shr.u32 %r2123, %r1702, 3; - cvt.u64.u32 %rd904, %r2123; - cvt.u64.u32 %rd905, %r2121; - shr.u32 %r2124, %r1699, 3; - cvt.u64.u32 %rd906, %r2124; - cvt.u64.u32 %rd907, %r2122; - bfi.b64 %rd908, %rd905, %rd906, 32, 32; - bfi.b64 %rd909, %rd904, %rd907, 32, 32; - mov.b64 {%r2125, %r2126}, %rd884; - mov.b64 {%r2127, %r2128}, %rd885; - mov.b64 {%r2129, %r2130}, %rd902; - mov.b64 {%r2131, %r2132}, %rd903; - xor.b64 %rd910, %rd902, %rd884; - xor.b32 %r2133, %r2130, %r2126; - xor.b32 %r2134, %r2131, %r2127; - xor.b32 %r2135, %r2132, %r2128; - cvt.u64.u32 %rd911, %r2135; - cvt.u64.u32 %rd912, %r2133; - and.b64 %rd913, %rd910, 4294967295; - cvt.u64.u32 %rd914, %r2134; - bfi.b64 %rd915, %rd912, %rd913, 32, 32; - bfi.b64 %rd916, 
%rd911, %rd914, 32, 32; - mov.b64 {%r2136, %r2137}, %rd915; - mov.b64 {%r2138, %r2139}, %rd916; - mov.b64 {%r2140, %r2141}, %rd908; - mov.b64 {%r2142, %r2143}, %rd909; - shf.l.wrap.b32 %r2144, %r1699, %r1699, 25; - shf.l.wrap.b32 %r2145, %r1699, %r1699, 14; - xor.b32 %r2146, %r2145, %r2144; - xor.b32 %r2147, %r2146, %r2124; - xor.b32 %r2148, %r2137, %r2141; - xor.b32 %r2149, %r2138, %r2142; - xor.b32 %r2150, %r2139, %r2143; - cvt.u64.u32 %rd917, %r1741; - cvt.u64.u32 %rd918, %r1740; - cvt.u64.u32 %rd919, %r1966; - bfi.b64 %rd920, %rd738, %rd919, 32, 32; - bfi.b64 %rd921, %rd917, %rd918, 32, 32; - mov.b64 {%r2151, %r2152}, %rd920; - mov.b64 {%r2153, %r2154}, %rd921; - shf.r.wrap.b32 %r2155, %r1964, %r1964, 17; - shf.r.wrap.b32 %r2156, %r1964, %r1964, 19; - xor.b32 %r2157, %r2155, %r2156; - shr.u32 %r2158, %r1964, 10; - xor.b32 %r2159, %r2157, %r2158; - add.s32 %r2160, %r2150, %r1286; - add.s32 %r2161, %r2160, %r2159; - add.s32 %r2162, %r2161, %r2154; - shf.r.wrap.b32 %r2163, %r1963, %r1963, 17; - shf.r.wrap.b32 %r2164, %r1963, %r1963, 19; - xor.b32 %r2165, %r2163, %r2164; - shr.u32 %r2166, %r1963, 10; - xor.b32 %r2167, %r2165, %r2166; - add.s32 %r2168, %r2149, %r1285; - add.s32 %r2169, %r2168, %r2167; - add.s32 %r2170, %r2169, %r2153; - shf.r.wrap.b32 %r2171, %r2162, %r2162, 17; - shf.r.wrap.b32 %r2172, %r2162, %r2162, 19; - xor.b32 %r2173, %r2171, %r2172; - shr.u32 %r2174, %r2162, 10; - xor.b32 %r2175, %r2173, %r2174; - add.s32 %r2176, %r2148, %r1284; - add.s32 %r2177, %r2176, %r2152; - add.s32 %r2178, %r2177, %r2175; - shf.r.wrap.b32 %r2179, %r2170, %r2170, 17; - shf.r.wrap.b32 %r2180, %r2170, %r2170, 19; - xor.b32 %r2181, %r2179, %r2180; - shr.u32 %r2182, %r2170, 10; - xor.b32 %r2183, %r2181, %r2182; - add.s32 %r2184, %r2147, %r1283; - add.s32 %r2185, %r2184, %r2151; - add.s32 %r2186, %r2185, %r2183; - cvt.u64.u32 %rd922, %r2162; - cvt.u64.u32 %rd923, %r2170; - cvt.u64.u32 %rd924, %r2178; - cvt.u64.u32 %rd925, %r2186; - bfi.b64 %rd926, %rd924, %rd925, 32, 32; - 
bfi.b64 %rd927, %rd922, %rd923, 32, 32; - mov.b64 {%r2187, %r2188}, %rd926; - mov.b64 {%r2189, %r2190}, %rd927; - cvt.u64.u32 %rd928, %r2190; - cvt.u64.u32 %rd929, %r2188; - cvt.u64.u32 %rd930, %r2189; - bfi.b64 %rd931, %rd928, %rd930, 32, 32; - bfi.b64 %rd932, %rd929, %rd925, 32, 32; - mov.b64 {%r2191, %r2192}, %rd932; - mov.b64 {%r2193, %r2194}, %rd931; - add.s32 %r2195, %r2191, -949202525; - add.s32 %r2196, %r2192, -1035236496; - add.s32 %r2197, %r2193, -1474664885; - add.s32 %r2198, %r2194, -1564481375; - cvt.u64.u32 %rd933, %r2198; - cvt.u64.u32 %rd934, %r2196; - cvt.u64.u32 %rd935, %r2197; - cvt.u64.u32 %rd936, %r2195; - bfi.b64 %rd937, %rd934, %rd936, 32, 32; - bfi.b64 %rd938, %rd933, %rd935, 32, 32; - cvt.u64.u32 %rd939, %r2084; - cvt.u64.u32 %rd940, %r2082; - cvt.u64.u32 %rd941, %r2083; - bfi.b64 %rd942, %rd940, %rd864, 32, 32; - bfi.b64 %rd943, %rd939, %rd941, 32, 32; - mov.b64 {%r2199, %r2200}, %rd942; - mov.b64 {%r2201, %r2202}, %rd943; - mov.b64 {%r2203, %r2204}, %rd938; - shf.r.wrap.b32 %r2205, %r2201, %r2201, 6; - shf.r.wrap.b32 %r2206, %r2201, %r2201, 11; - xor.b32 %r2207, %r2205, %r2206; - shf.r.wrap.b32 %r2208, %r2201, %r2201, 25; - xor.b32 %r2209, %r2207, %r2208; - xor.b32 %r2210, %r2202, %r2031; - and.b32 %r2211, %r2210, %r2201; - xor.b32 %r2212, %r2211, %r2031; - add.s32 %r2213, %r2032, %r2204; - add.s32 %r2214, %r2213, %r2209; - add.s32 %r2215, %r2214, %r2212; - shf.r.wrap.b32 %r2216, %r2199, %r2199, 2; - shf.r.wrap.b32 %r2217, %r2199, %r2199, 13; - xor.b32 %r2218, %r2216, %r2217; - shf.r.wrap.b32 %r2219, %r2199, %r2199, 22; - xor.b32 %r2220, %r2218, %r2219; - and.b32 %r2221, %r2200, %r2199; - and.b32 %r2222, %r2080, %r2022; - xor.b32 %r2223, %r2221, %r2222; - and.b32 %r2224, %r2200, %r2029; - xor.b32 %r2225, %r2223, %r2224; - add.s32 %r2226, %r2225, %r2220; - add.s32 %r2227, %r2226, %r2215; - add.s32 %r2228, %r2215, %r2030; - shf.r.wrap.b32 %r2229, %r2228, %r2228, 6; - shf.r.wrap.b32 %r2230, %r2228, %r2228, 11; - xor.b32 %r2231, %r2229, 
%r2230; - shf.r.wrap.b32 %r2232, %r2228, %r2228, 25; - xor.b32 %r2233, %r2231, %r2232; - xor.b32 %r2234, %r2202, %r2201; - and.b32 %r2235, %r2228, %r2234; - xor.b32 %r2236, %r2235, %r2202; - add.s32 %r2237, %r2031, %r2203; - add.s32 %r2238, %r2237, %r2236; - add.s32 %r2239, %r2238, %r2233; - shf.r.wrap.b32 %r2240, %r2227, %r2227, 2; - shf.r.wrap.b32 %r2241, %r2227, %r2227, 13; - xor.b32 %r2242, %r2240, %r2241; - shf.r.wrap.b32 %r2243, %r2227, %r2227, 22; - xor.b32 %r2244, %r2242, %r2243; - xor.b32 %r2245, %r2200, %r2199; - and.b32 %r2246, %r2227, %r2245; - xor.b32 %r2247, %r2246, %r2221; - add.s32 %r2248, %r2244, %r2247; - add.s32 %r2249, %r2239, %r2029; - cvt.u64.u32 %rd944, %r2228; - cvt.u64.u32 %rd945, %r2249; - cvt.u64.u32 %rd946, %r2227; - add.s32 %r2250, %r2248, %r2239; - cvt.u64.u32 %rd947, %r2250; - bfi.b64 %rd948, %rd946, %rd947, 32, 32; - bfi.b64 %rd949, %rd944, %rd945, 32, 32; - mov.b64 {%r2251, %r2252}, %rd948; - mov.b64 {%r2253, %r2254}, %rd949; - mov.b64 {%r2255, %r2256}, %rd937; - cvt.u64.u32 %rd950, %r2256; - bfi.b64 %rd951, %rd950, %rd936, 32, 32; - cvt.u64.u32 %rd952, %r2254; - cvt.u64.u32 %rd953, %r2252; - cvt.u64.u32 %rd954, %r2253; - bfi.b64 %rd955, %rd953, %rd947, 32, 32; - bfi.b64 %rd956, %rd952, %rd954, 32, 32; - mov.b64 {%r2257, %r2258}, %rd955; - mov.b64 {%r2259, %r2260}, %rd956; - mov.b64 {%r2261, %r2262}, %rd951; - shf.r.wrap.b32 %r2263, %r2259, %r2259, 6; - shf.r.wrap.b32 %r2264, %r2259, %r2259, 11; - xor.b32 %r2265, %r2263, %r2264; - shf.r.wrap.b32 %r2266, %r2259, %r2259, 25; - xor.b32 %r2267, %r2265, %r2266; - xor.b32 %r2268, %r2260, %r2201; - and.b32 %r2269, %r2268, %r2259; - xor.b32 %r2270, %r2269, %r2201; - add.s32 %r2271, %r2202, %r2262; - add.s32 %r2272, %r2271, %r2267; - add.s32 %r2273, %r2272, %r2270; - shf.r.wrap.b32 %r2274, %r2257, %r2257, 2; - shf.r.wrap.b32 %r2275, %r2257, %r2257, 13; - xor.b32 %r2276, %r2274, %r2275; - shf.r.wrap.b32 %r2277, %r2257, %r2257, 22; - xor.b32 %r2278, %r2276, %r2277; - and.b32 %r2279, %r2258, 
%r2257; - and.b32 %r2280, %r2250, %r2080; - xor.b32 %r2281, %r2279, %r2280; - and.b32 %r2282, %r2258, %r2199; - xor.b32 %r2283, %r2281, %r2282; - add.s32 %r2284, %r2283, %r2278; - add.s32 %r2285, %r2284, %r2273; - add.s32 %r2286, %r2273, %r2200; - shf.r.wrap.b32 %r2287, %r2286, %r2286, 6; - shf.r.wrap.b32 %r2288, %r2286, %r2286, 11; - xor.b32 %r2289, %r2287, %r2288; - shf.r.wrap.b32 %r2290, %r2286, %r2286, 25; - xor.b32 %r2291, %r2289, %r2290; - xor.b32 %r2292, %r2260, %r2259; - and.b32 %r2293, %r2286, %r2292; - xor.b32 %r2294, %r2293, %r2260; - add.s32 %r2295, %r2201, %r2261; - add.s32 %r2296, %r2295, %r2294; - add.s32 %r2297, %r2296, %r2291; - shf.r.wrap.b32 %r2298, %r2285, %r2285, 2; - shf.r.wrap.b32 %r2299, %r2285, %r2285, 13; - xor.b32 %r2300, %r2298, %r2299; - shf.r.wrap.b32 %r2301, %r2285, %r2285, 22; - xor.b32 %r2302, %r2300, %r2301; - xor.b32 %r2303, %r2258, %r2257; - and.b32 %r2304, %r2285, %r2303; - xor.b32 %r2305, %r2304, %r2279; - add.s32 %r2306, %r2302, %r2305; - add.s32 %r2307, %r2297, %r2199; - cvt.u64.u32 %rd957, %r2286; - cvt.u64.u32 %rd958, %r2307; - cvt.u64.u32 %rd959, %r2285; - add.s32 %r2308, %r2306, %r2297; - cvt.u64.u32 %rd960, %r2308; - bfi.b64 %rd961, %rd959, %rd960, 32, 32; - bfi.b64 %rd962, %rd957, %rd958, 32, 32; - mov.b64 {%r2309, %r2310}, %rd961; - mov.b64 {%r2311, %r2312}, %rd962; - shr.u32 %r2313, %r1928, 7; - shr.u32 %r2314, %r1929, 7; - shr.u32 %r2315, %r1930, 7; - cvt.u64.u32 %rd963, %r2315; - cvt.u64.u32 %rd964, %r2313; - shr.u32 %r2316, %r1927, 7; - cvt.u64.u32 %rd965, %r2316; - cvt.u64.u32 %rd966, %r2314; - bfi.b64 %rd967, %rd964, %rd965, 32, 32; - bfi.b64 %rd968, %rd963, %rd966, 32, 32; - shl.b32 %r2317, %r1928, 25; - shl.b32 %r2318, %r1929, 25; - cvt.u64.u32 %rd969, %r2317; - shl.b32 %r2319, %r1927, 25; - cvt.u64.u32 %rd970, %r2319; - cvt.u64.u32 %rd971, %r2318; - bfi.b64 %rd972, %rd969, %rd970, 32, 32; - cvt.u64.u32 %rd973, %r1930; - bfi.b64 %rd974, %rd973, %rd971, 57, 7; - mov.b64 {%r2320, %r2321}, %rd967; - mov.b64 
{%r2322, %r2323}, %rd968; - mov.b64 {%r2324, %r2325}, %rd972; - mov.b64 {%r2326, %r2327}, %rd974; - or.b64 %rd975, %rd972, %rd967; - or.b32 %r2328, %r2325, %r2321; - or.b32 %r2329, %r2326, %r2322; - or.b32 %r2330, %r2327, %r2323; - cvt.u64.u32 %rd976, %r2330; - cvt.u64.u32 %rd977, %r2328; - and.b64 %rd978, %rd975, 4294967295; - cvt.u64.u32 %rd979, %r2329; - bfi.b64 %rd980, %rd977, %rd978, 32, 32; - bfi.b64 %rd981, %rd976, %rd979, 32, 32; - shr.u32 %r2331, %r1928, 18; - shr.u32 %r2332, %r1929, 18; - shr.u32 %r2333, %r1930, 18; - cvt.u64.u32 %rd982, %r2333; - cvt.u64.u32 %rd983, %r2331; - shr.u32 %r2334, %r1927, 18; - cvt.u64.u32 %rd984, %r2334; - cvt.u64.u32 %rd985, %r2332; - bfi.b64 %rd986, %rd983, %rd984, 32, 32; - bfi.b64 %rd987, %rd982, %rd985, 32, 32; - shl.b32 %r2335, %r1928, 14; - shl.b32 %r2336, %r1929, 14; - cvt.u64.u32 %rd988, %r2335; - shl.b32 %r2337, %r1927, 14; - cvt.u64.u32 %rd989, %r2337; - cvt.u64.u32 %rd990, %r2336; - bfi.b64 %rd991, %rd988, %rd989, 32, 32; - bfi.b64 %rd992, %rd973, %rd990, 46, 18; - mov.b64 {%r2338, %r2339}, %rd986; - mov.b64 {%r2340, %r2341}, %rd987; - mov.b64 {%r2342, %r2343}, %rd991; - mov.b64 {%r2344, %r2345}, %rd992; - or.b64 %rd993, %rd991, %rd986; - or.b32 %r2346, %r2343, %r2339; - or.b32 %r2347, %r2344, %r2340; - or.b32 %r2348, %r2345, %r2341; - cvt.u64.u32 %rd994, %r2348; - cvt.u64.u32 %rd995, %r2346; - and.b64 %rd996, %rd993, 4294967295; - cvt.u64.u32 %rd997, %r2347; - bfi.b64 %rd998, %rd995, %rd996, 32, 32; - bfi.b64 %rd999, %rd994, %rd997, 32, 32; - shr.u32 %r2349, %r1928, 3; - shr.u32 %r2350, %r1929, 3; - shr.u32 %r2351, %r1930, 3; - cvt.u64.u32 %rd1000, %r2351; - cvt.u64.u32 %rd1001, %r2349; - shr.u32 %r2352, %r1927, 3; - cvt.u64.u32 %rd1002, %r2352; - cvt.u64.u32 %rd1003, %r2350; - bfi.b64 %rd1004, %rd1001, %rd1002, 32, 32; - bfi.b64 %rd1005, %rd1000, %rd1003, 32, 32; - mov.b64 {%r2353, %r2354}, %rd980; - mov.b64 {%r2355, %r2356}, %rd981; - mov.b64 {%r2357, %r2358}, %rd998; - mov.b64 {%r2359, %r2360}, %rd999; - 
xor.b64 %rd1006, %rd998, %rd980; - xor.b32 %r2361, %r2358, %r2354; - xor.b32 %r2362, %r2359, %r2355; - xor.b32 %r2363, %r2360, %r2356; - cvt.u64.u32 %rd1007, %r2363; - cvt.u64.u32 %rd1008, %r2361; - and.b64 %rd1009, %rd1006, 4294967295; - cvt.u64.u32 %rd1010, %r2362; - bfi.b64 %rd1011, %rd1008, %rd1009, 32, 32; - bfi.b64 %rd1012, %rd1007, %rd1010, 32, 32; - mov.b64 {%r2364, %r2365}, %rd1011; - mov.b64 {%r2366, %r2367}, %rd1012; - mov.b64 {%r2368, %r2369}, %rd1004; - mov.b64 {%r2370, %r2371}, %rd1005; - shf.l.wrap.b32 %r2372, %r1927, %r1927, 25; - shf.l.wrap.b32 %r2373, %r1927, %r1927, 14; - xor.b32 %r2374, %r2373, %r2372; - xor.b32 %r2375, %r2374, %r2352; - xor.b32 %r2376, %r2365, %r2369; - xor.b32 %r2377, %r2366, %r2370; - xor.b32 %r2378, %r2367, %r2371; - cvt.u64.u32 %rd1013, %r1965; - cvt.u64.u32 %rd1014, %r1964; - cvt.u64.u32 %rd1015, %r2194; - bfi.b64 %rd1016, %rd834, %rd1015, 32, 32; - bfi.b64 %rd1017, %rd1013, %rd1014, 32, 32; - mov.b64 {%r2379, %r2380}, %rd1016; - mov.b64 {%r2381, %r2382}, %rd1017; - shf.r.wrap.b32 %r2383, %r2192, %r2192, 17; - shf.r.wrap.b32 %r2384, %r2192, %r2192, 19; - xor.b32 %r2385, %r2383, %r2384; - shr.u32 %r2386, %r2192, 10; - xor.b32 %r2387, %r2385, %r2386; - add.s32 %r2388, %r2378, %r1514; - add.s32 %r2389, %r2388, %r2387; - add.s32 %r2390, %r2389, %r2382; - shf.r.wrap.b32 %r2391, %r2191, %r2191, 17; - shf.r.wrap.b32 %r2392, %r2191, %r2191, 19; - xor.b32 %r2393, %r2391, %r2392; - shr.u32 %r2394, %r2191, 10; - xor.b32 %r2395, %r2393, %r2394; - add.s32 %r2396, %r2377, %r1513; - add.s32 %r2397, %r2396, %r2395; - add.s32 %r2398, %r2397, %r2381; - shf.r.wrap.b32 %r2399, %r2390, %r2390, 17; - shf.r.wrap.b32 %r2400, %r2390, %r2390, 19; - xor.b32 %r2401, %r2399, %r2400; - shr.u32 %r2402, %r2390, 10; - xor.b32 %r2403, %r2401, %r2402; - add.s32 %r2404, %r2376, %r1512; - add.s32 %r2405, %r2404, %r2380; - add.s32 %r2406, %r2405, %r2403; - shf.r.wrap.b32 %r2407, %r2398, %r2398, 17; - shf.r.wrap.b32 %r2408, %r2398, %r2398, 19; - xor.b32 %r2409, 
%r2407, %r2408; - shr.u32 %r2410, %r2398, 10; - xor.b32 %r2411, %r2409, %r2410; - add.s32 %r2412, %r2375, %r1511; - add.s32 %r2413, %r2412, %r2379; - add.s32 %r2414, %r2413, %r2411; - cvt.u64.u32 %rd1018, %r2390; - cvt.u64.u32 %rd1019, %r2398; - cvt.u64.u32 %rd1020, %r2406; - cvt.u64.u32 %rd1021, %r2414; - bfi.b64 %rd1022, %rd1020, %rd1021, 32, 32; - bfi.b64 %rd1023, %rd1018, %rd1019, 32, 32; - mov.b64 {%r2415, %r2416}, %rd1022; - mov.b64 {%r2417, %r2418}, %rd1023; - cvt.u64.u32 %rd1024, %r2418; - cvt.u64.u32 %rd1025, %r2416; - cvt.u64.u32 %rd1026, %r2417; - bfi.b64 %rd1027, %rd1024, %rd1026, 32, 32; - bfi.b64 %rd1028, %rd1025, %rd1021, 32, 32; - mov.b64 {%r2419, %r2420}, %rd1028; - mov.b64 {%r2421, %r2422}, %rd1027; - add.s32 %r2423, %r2419, 275423344; - add.s32 %r2424, %r2420, -200395387; - add.s32 %r2425, %r2421, -694614492; - add.s32 %r2426, %r2422, -778901479; - cvt.u64.u32 %rd1029, %r2426; - cvt.u64.u32 %rd1030, %r2424; - cvt.u64.u32 %rd1031, %r2425; - cvt.u64.u32 %rd1032, %r2423; - bfi.b64 %rd1033, %rd1030, %rd1032, 32, 32; - bfi.b64 %rd1034, %rd1029, %rd1031, 32, 32; - cvt.u64.u32 %rd1035, %r2312; - cvt.u64.u32 %rd1036, %r2310; - cvt.u64.u32 %rd1037, %r2311; - bfi.b64 %rd1038, %rd1036, %rd960, 32, 32; - bfi.b64 %rd1039, %rd1035, %rd1037, 32, 32; - mov.b64 {%r2427, %r2428}, %rd1038; - mov.b64 {%r2429, %r2430}, %rd1039; - mov.b64 {%r2431, %r2432}, %rd1034; - shf.r.wrap.b32 %r2433, %r2429, %r2429, 6; - shf.r.wrap.b32 %r2434, %r2429, %r2429, 11; - xor.b32 %r2435, %r2433, %r2434; - shf.r.wrap.b32 %r2436, %r2429, %r2429, 25; - xor.b32 %r2437, %r2435, %r2436; - xor.b32 %r2438, %r2430, %r2259; - and.b32 %r2439, %r2438, %r2429; - xor.b32 %r2440, %r2439, %r2259; - add.s32 %r2441, %r2260, %r2432; - add.s32 %r2442, %r2441, %r2437; - add.s32 %r2443, %r2442, %r2440; - shf.r.wrap.b32 %r2444, %r2427, %r2427, 2; - shf.r.wrap.b32 %r2445, %r2427, %r2427, 13; - xor.b32 %r2446, %r2444, %r2445; - shf.r.wrap.b32 %r2447, %r2427, %r2427, 22; - xor.b32 %r2448, %r2446, %r2447; - 
and.b32 %r2449, %r2428, %r2427; - and.b32 %r2450, %r2308, %r2250; - xor.b32 %r2451, %r2449, %r2450; - and.b32 %r2452, %r2428, %r2257; - xor.b32 %r2453, %r2451, %r2452; - add.s32 %r2454, %r2453, %r2448; - add.s32 %r2455, %r2454, %r2443; - add.s32 %r2456, %r2443, %r2258; - shf.r.wrap.b32 %r2457, %r2456, %r2456, 6; - shf.r.wrap.b32 %r2458, %r2456, %r2456, 11; - xor.b32 %r2459, %r2457, %r2458; - shf.r.wrap.b32 %r2460, %r2456, %r2456, 25; - xor.b32 %r2461, %r2459, %r2460; - xor.b32 %r2462, %r2430, %r2429; - and.b32 %r2463, %r2456, %r2462; - xor.b32 %r2464, %r2463, %r2430; - add.s32 %r2465, %r2259, %r2431; - add.s32 %r2466, %r2465, %r2464; - add.s32 %r2467, %r2466, %r2461; - shf.r.wrap.b32 %r2468, %r2455, %r2455, 2; - shf.r.wrap.b32 %r2469, %r2455, %r2455, 13; - xor.b32 %r2470, %r2468, %r2469; - shf.r.wrap.b32 %r2471, %r2455, %r2455, 22; - xor.b32 %r2472, %r2470, %r2471; - xor.b32 %r2473, %r2428, %r2427; - and.b32 %r2474, %r2455, %r2473; - xor.b32 %r2475, %r2474, %r2449; - add.s32 %r2476, %r2472, %r2475; - add.s32 %r2477, %r2467, %r2257; - cvt.u64.u32 %rd1040, %r2456; - cvt.u64.u32 %rd1041, %r2477; - cvt.u64.u32 %rd1042, %r2455; - add.s32 %r2478, %r2476, %r2467; - cvt.u64.u32 %rd1043, %r2478; - bfi.b64 %rd1044, %rd1042, %rd1043, 32, 32; - bfi.b64 %rd1045, %rd1040, %rd1041, 32, 32; - mov.b64 {%r2479, %r2480}, %rd1044; - mov.b64 {%r2481, %r2482}, %rd1045; - mov.b64 {%r2483, %r2484}, %rd1033; - cvt.u64.u32 %rd1046, %r2484; - bfi.b64 %rd1047, %rd1046, %rd1032, 32, 32; - cvt.u64.u32 %rd1048, %r2482; - cvt.u64.u32 %rd1049, %r2480; - cvt.u64.u32 %rd1050, %r2481; - bfi.b64 %rd1051, %rd1049, %rd1043, 32, 32; - bfi.b64 %rd1052, %rd1048, %rd1050, 32, 32; - mov.b64 {%r2485, %r2486}, %rd1051; - mov.b64 {%r2487, %r2488}, %rd1052; - mov.b64 {%r2489, %r2490}, %rd1047; - shf.r.wrap.b32 %r2491, %r2487, %r2487, 6; - shf.r.wrap.b32 %r2492, %r2487, %r2487, 11; - xor.b32 %r2493, %r2491, %r2492; - shf.r.wrap.b32 %r2494, %r2487, %r2487, 25; - xor.b32 %r2495, %r2493, %r2494; - xor.b32 %r2496, 
%r2488, %r2429; - and.b32 %r2497, %r2496, %r2487; - xor.b32 %r2498, %r2497, %r2429; - add.s32 %r2499, %r2430, %r2490; - add.s32 %r2500, %r2499, %r2495; - add.s32 %r2501, %r2500, %r2498; - shf.r.wrap.b32 %r2502, %r2485, %r2485, 2; - shf.r.wrap.b32 %r2503, %r2485, %r2485, 13; - xor.b32 %r2504, %r2502, %r2503; - shf.r.wrap.b32 %r2505, %r2485, %r2485, 22; - xor.b32 %r2506, %r2504, %r2505; - and.b32 %r2507, %r2486, %r2485; - and.b32 %r2508, %r2478, %r2308; - xor.b32 %r2509, %r2507, %r2508; - and.b32 %r2510, %r2486, %r2427; - xor.b32 %r2511, %r2509, %r2510; - add.s32 %r2512, %r2511, %r2506; - add.s32 %r2513, %r2512, %r2501; - add.s32 %r2514, %r2501, %r2428; - shf.r.wrap.b32 %r2515, %r2514, %r2514, 6; - shf.r.wrap.b32 %r2516, %r2514, %r2514, 11; - xor.b32 %r2517, %r2515, %r2516; - shf.r.wrap.b32 %r2518, %r2514, %r2514, 25; - xor.b32 %r2519, %r2517, %r2518; - xor.b32 %r2520, %r2488, %r2487; - and.b32 %r2521, %r2514, %r2520; - xor.b32 %r2522, %r2521, %r2488; - add.s32 %r2523, %r2429, %r2489; - add.s32 %r2524, %r2523, %r2522; - add.s32 %r2525, %r2524, %r2519; - shf.r.wrap.b32 %r2526, %r2513, %r2513, 2; - shf.r.wrap.b32 %r2527, %r2513, %r2513, 13; - xor.b32 %r2528, %r2526, %r2527; - shf.r.wrap.b32 %r2529, %r2513, %r2513, 22; - xor.b32 %r2530, %r2528, %r2529; - xor.b32 %r2531, %r2486, %r2485; - and.b32 %r2532, %r2513, %r2531; - xor.b32 %r2533, %r2532, %r2507; - add.s32 %r2534, %r2530, %r2533; - add.s32 %r2535, %r2525, %r2427; - cvt.u64.u32 %rd1053, %r2514; - cvt.u64.u32 %rd1054, %r2535; - cvt.u64.u32 %rd1055, %r2513; - add.s32 %r2536, %r2534, %r2525; - cvt.u64.u32 %rd1056, %r2536; - bfi.b64 %rd1057, %rd1055, %rd1056, 32, 32; - bfi.b64 %rd1058, %rd1053, %rd1054, 32, 32; - mov.b64 {%r2537, %r2538}, %rd1057; - mov.b64 {%r2539, %r2540}, %rd1058; - shr.u32 %r2541, %r2152, 7; - shr.u32 %r2542, %r2153, 7; - shr.u32 %r2543, %r2154, 7; - cvt.u64.u32 %rd1059, %r2543; - cvt.u64.u32 %rd1060, %r2541; - shr.u32 %r2544, %r2151, 7; - cvt.u64.u32 %rd1061, %r2544; - cvt.u64.u32 %rd1062, %r2542; 
- bfi.b64 %rd1063, %rd1060, %rd1061, 32, 32; - bfi.b64 %rd1064, %rd1059, %rd1062, 32, 32; - shl.b32 %r2545, %r2152, 25; - shl.b32 %r2546, %r2153, 25; - cvt.u64.u32 %rd1065, %r2545; - shl.b32 %r2547, %r2151, 25; - cvt.u64.u32 %rd1066, %r2547; - cvt.u64.u32 %rd1067, %r2546; - bfi.b64 %rd1068, %rd1065, %rd1066, 32, 32; - cvt.u64.u32 %rd1069, %r2154; - bfi.b64 %rd1070, %rd1069, %rd1067, 57, 7; - mov.b64 {%r2548, %r2549}, %rd1063; - mov.b64 {%r2550, %r2551}, %rd1064; - mov.b64 {%r2552, %r2553}, %rd1068; - mov.b64 {%r2554, %r2555}, %rd1070; - or.b64 %rd1071, %rd1068, %rd1063; - or.b32 %r2556, %r2553, %r2549; - or.b32 %r2557, %r2554, %r2550; - or.b32 %r2558, %r2555, %r2551; - cvt.u64.u32 %rd1072, %r2558; - cvt.u64.u32 %rd1073, %r2556; - and.b64 %rd1074, %rd1071, 4294967295; - cvt.u64.u32 %rd1075, %r2557; - bfi.b64 %rd1076, %rd1073, %rd1074, 32, 32; - bfi.b64 %rd1077, %rd1072, %rd1075, 32, 32; - shr.u32 %r2559, %r2152, 18; - shr.u32 %r2560, %r2153, 18; - shr.u32 %r2561, %r2154, 18; - cvt.u64.u32 %rd1078, %r2561; - cvt.u64.u32 %rd1079, %r2559; - shr.u32 %r2562, %r2151, 18; - cvt.u64.u32 %rd1080, %r2562; - cvt.u64.u32 %rd1081, %r2560; - bfi.b64 %rd1082, %rd1079, %rd1080, 32, 32; - bfi.b64 %rd1083, %rd1078, %rd1081, 32, 32; - shl.b32 %r2563, %r2152, 14; - shl.b32 %r2564, %r2153, 14; - cvt.u64.u32 %rd1084, %r2563; - shl.b32 %r2565, %r2151, 14; - cvt.u64.u32 %rd1085, %r2565; - cvt.u64.u32 %rd1086, %r2564; - bfi.b64 %rd1087, %rd1084, %rd1085, 32, 32; - bfi.b64 %rd1088, %rd1069, %rd1086, 46, 18; - mov.b64 {%r2566, %r2567}, %rd1082; - mov.b64 {%r2568, %r2569}, %rd1083; - mov.b64 {%r2570, %r2571}, %rd1087; - mov.b64 {%r2572, %r2573}, %rd1088; - or.b64 %rd1089, %rd1087, %rd1082; - or.b32 %r2574, %r2571, %r2567; - or.b32 %r2575, %r2572, %r2568; - or.b32 %r2576, %r2573, %r2569; - cvt.u64.u32 %rd1090, %r2576; - cvt.u64.u32 %rd1091, %r2574; - and.b64 %rd1092, %rd1089, 4294967295; - cvt.u64.u32 %rd1093, %r2575; - bfi.b64 %rd1094, %rd1091, %rd1092, 32, 32; - bfi.b64 %rd1095, %rd1090, 
%rd1093, 32, 32; - shr.u32 %r2577, %r2152, 3; - shr.u32 %r2578, %r2153, 3; - shr.u32 %r2579, %r2154, 3; - cvt.u64.u32 %rd1096, %r2579; - cvt.u64.u32 %rd1097, %r2577; - shr.u32 %r2580, %r2151, 3; - cvt.u64.u32 %rd1098, %r2580; - cvt.u64.u32 %rd1099, %r2578; - bfi.b64 %rd1100, %rd1097, %rd1098, 32, 32; - bfi.b64 %rd1101, %rd1096, %rd1099, 32, 32; - mov.b64 {%r2581, %r2582}, %rd1076; - mov.b64 {%r2583, %r2584}, %rd1077; - mov.b64 {%r2585, %r2586}, %rd1094; - mov.b64 {%r2587, %r2588}, %rd1095; - xor.b64 %rd1102, %rd1094, %rd1076; - xor.b32 %r2589, %r2586, %r2582; - xor.b32 %r2590, %r2587, %r2583; - xor.b32 %r2591, %r2588, %r2584; - cvt.u64.u32 %rd1103, %r2591; - cvt.u64.u32 %rd1104, %r2589; - and.b64 %rd1105, %rd1102, 4294967295; - cvt.u64.u32 %rd1106, %r2590; - bfi.b64 %rd1107, %rd1104, %rd1105, 32, 32; - bfi.b64 %rd1108, %rd1103, %rd1106, 32, 32; - mov.b64 {%r2592, %r2593}, %rd1107; - mov.b64 {%r2594, %r2595}, %rd1108; - mov.b64 {%r2596, %r2597}, %rd1100; - mov.b64 {%r2598, %r2599}, %rd1101; - shf.l.wrap.b32 %r2600, %r2151, %r2151, 25; - shf.l.wrap.b32 %r2601, %r2151, %r2151, 14; - xor.b32 %r2602, %r2601, %r2600; - xor.b32 %r2603, %r2602, %r2580; - xor.b32 %r2604, %r2593, %r2597; - xor.b32 %r2605, %r2594, %r2598; - xor.b32 %r2606, %r2595, %r2599; - cvt.u64.u32 %rd1109, %r2193; - cvt.u64.u32 %rd1110, %r2192; - cvt.u64.u32 %rd1111, %r2422; - bfi.b64 %rd1112, %rd925, %rd1111, 32, 32; - bfi.b64 %rd1113, %rd1109, %rd1110, 32, 32; - mov.b64 {%r2607, %r2608}, %rd1112; - mov.b64 {%r2609, %r2610}, %rd1113; - shf.r.wrap.b32 %r2611, %r2420, %r2420, 17; - shf.r.wrap.b32 %r2612, %r2420, %r2420, 19; - xor.b32 %r2613, %r2611, %r2612; - shr.u32 %r2614, %r2420, 10; - xor.b32 %r2615, %r2613, %r2614; - add.s32 %r2616, %r2606, %r1742; - add.s32 %r2617, %r2616, %r2615; - add.s32 %r2618, %r2617, %r2610; - shf.r.wrap.b32 %r2619, %r2419, %r2419, 17; - shf.r.wrap.b32 %r2620, %r2419, %r2419, 19; - xor.b32 %r2621, %r2619, %r2620; - shr.u32 %r2622, %r2419, 10; - xor.b32 %r2623, %r2621, %r2622; 
- add.s32 %r2624, %r2605, %r1741; - add.s32 %r2625, %r2624, %r2623; - add.s32 %r2626, %r2625, %r2609; - shf.r.wrap.b32 %r2627, %r2618, %r2618, 17; - shf.r.wrap.b32 %r2628, %r2618, %r2618, 19; - xor.b32 %r2629, %r2627, %r2628; - shr.u32 %r2630, %r2618, 10; - xor.b32 %r2631, %r2629, %r2630; - add.s32 %r2632, %r2604, %r1740; - add.s32 %r2633, %r2632, %r2608; - add.s32 %r2634, %r2633, %r2631; - shf.r.wrap.b32 %r2635, %r2626, %r2626, 17; - shf.r.wrap.b32 %r2636, %r2626, %r2626, 19; - xor.b32 %r2637, %r2635, %r2636; - shr.u32 %r2638, %r2626, 10; - xor.b32 %r2639, %r2637, %r2638; - add.s32 %r2640, %r2603, %r1739; - add.s32 %r2641, %r2640, %r2607; - add.s32 %r2642, %r2641, %r2639; - cvt.u64.u32 %rd1114, %r2618; - cvt.u64.u32 %rd1115, %r2626; - cvt.u64.u32 %rd1116, %r2634; - cvt.u64.u32 %rd1117, %r2642; - bfi.b64 %rd1118, %rd1116, %rd1117, 32, 32; - bfi.b64 %rd1119, %rd1114, %rd1115, 32, 32; - mov.b64 {%r2643, %r2644}, %rd1118; - mov.b64 {%r2645, %r2646}, %rd1119; - cvt.u64.u32 %rd1120, %r2646; - cvt.u64.u32 %rd1121, %r2644; - cvt.u64.u32 %rd1122, %r2645; - bfi.b64 %rd1123, %rd1120, %rd1122, 32, 32; - bfi.b64 %rd1124, %rd1121, %rd1117, 32, 32; - mov.b64 {%r2647, %r2648}, %rd1124; - mov.b64 {%r2649, %r2650}, %rd1123; - add.s32 %r2651, %r2647, 883997877; - add.s32 %r2652, %r2648, 659060556; - add.s32 %r2653, %r2649, 506948616; - add.s32 %r2654, %r2650, 430227734; - cvt.u64.u32 %rd1125, %r2654; - cvt.u64.u32 %rd1126, %r2652; - cvt.u64.u32 %rd1127, %r2653; - cvt.u64.u32 %rd1128, %r2651; - bfi.b64 %rd1129, %rd1126, %rd1128, 32, 32; - bfi.b64 %rd1130, %rd1125, %rd1127, 32, 32; - cvt.u64.u32 %rd1131, %r2540; - cvt.u64.u32 %rd1132, %r2538; - cvt.u64.u32 %rd1133, %r2539; - bfi.b64 %rd1134, %rd1132, %rd1056, 32, 32; - bfi.b64 %rd1135, %rd1131, %rd1133, 32, 32; - mov.b64 {%r2655, %r2656}, %rd1134; - mov.b64 {%r2657, %r2658}, %rd1135; - mov.b64 {%r2659, %r2660}, %rd1130; - shf.r.wrap.b32 %r2661, %r2657, %r2657, 6; - shf.r.wrap.b32 %r2662, %r2657, %r2657, 11; - xor.b32 %r2663, %r2661, 
%r2662; - shf.r.wrap.b32 %r2664, %r2657, %r2657, 25; - xor.b32 %r2665, %r2663, %r2664; - xor.b32 %r2666, %r2658, %r2487; - and.b32 %r2667, %r2666, %r2657; - xor.b32 %r2668, %r2667, %r2487; - add.s32 %r2669, %r2488, %r2660; - add.s32 %r2670, %r2669, %r2665; - add.s32 %r2671, %r2670, %r2668; - shf.r.wrap.b32 %r2672, %r2655, %r2655, 2; - shf.r.wrap.b32 %r2673, %r2655, %r2655, 13; - xor.b32 %r2674, %r2672, %r2673; - shf.r.wrap.b32 %r2675, %r2655, %r2655, 22; - xor.b32 %r2676, %r2674, %r2675; - and.b32 %r2677, %r2656, %r2655; - and.b32 %r2678, %r2536, %r2478; - xor.b32 %r2679, %r2677, %r2678; - and.b32 %r2680, %r2656, %r2485; - xor.b32 %r2681, %r2679, %r2680; - add.s32 %r2682, %r2681, %r2676; - add.s32 %r2683, %r2682, %r2671; - add.s32 %r2684, %r2671, %r2486; - shf.r.wrap.b32 %r2685, %r2684, %r2684, 6; - shf.r.wrap.b32 %r2686, %r2684, %r2684, 11; - xor.b32 %r2687, %r2685, %r2686; - shf.r.wrap.b32 %r2688, %r2684, %r2684, 25; - xor.b32 %r2689, %r2687, %r2688; - xor.b32 %r2690, %r2658, %r2657; - and.b32 %r2691, %r2684, %r2690; - xor.b32 %r2692, %r2691, %r2658; - add.s32 %r2693, %r2487, %r2659; - add.s32 %r2694, %r2693, %r2692; - add.s32 %r2695, %r2694, %r2689; - shf.r.wrap.b32 %r2696, %r2683, %r2683, 2; - shf.r.wrap.b32 %r2697, %r2683, %r2683, 13; - xor.b32 %r2698, %r2696, %r2697; - shf.r.wrap.b32 %r2699, %r2683, %r2683, 22; - xor.b32 %r2700, %r2698, %r2699; - xor.b32 %r2701, %r2656, %r2655; - and.b32 %r2702, %r2683, %r2701; - xor.b32 %r2703, %r2702, %r2677; - add.s32 %r2704, %r2700, %r2703; - add.s32 %r2705, %r2695, %r2485; - cvt.u64.u32 %rd1136, %r2684; - cvt.u64.u32 %rd1137, %r2705; - cvt.u64.u32 %rd1138, %r2683; - add.s32 %r2706, %r2704, %r2695; - cvt.u64.u32 %rd1139, %r2706; - bfi.b64 %rd1140, %rd1138, %rd1139, 32, 32; - bfi.b64 %rd1141, %rd1136, %rd1137, 32, 32; - mov.b64 {%r2707, %r2708}, %rd1140; - mov.b64 {%r2709, %r2710}, %rd1141; - mov.b64 {%r2711, %r2712}, %rd1129; - cvt.u64.u32 %rd1142, %r2712; - bfi.b64 %rd1143, %rd1142, %rd1128, 32, 32; - cvt.u64.u32 
%rd1144, %r2710; - cvt.u64.u32 %rd1145, %r2708; - cvt.u64.u32 %rd1146, %r2709; - bfi.b64 %rd1147, %rd1145, %rd1139, 32, 32; - bfi.b64 %rd1148, %rd1144, %rd1146, 32, 32; - mov.b64 {%r2713, %r2714}, %rd1147; - mov.b64 {%r2715, %r2716}, %rd1148; - mov.b64 {%r2717, %r2718}, %rd1143; - shf.r.wrap.b32 %r2719, %r2715, %r2715, 6; - shf.r.wrap.b32 %r2720, %r2715, %r2715, 11; - xor.b32 %r2721, %r2719, %r2720; - shf.r.wrap.b32 %r2722, %r2715, %r2715, 25; - xor.b32 %r2723, %r2721, %r2722; - xor.b32 %r2724, %r2716, %r2657; - and.b32 %r2725, %r2724, %r2715; - xor.b32 %r2726, %r2725, %r2657; - add.s32 %r2727, %r2658, %r2718; - add.s32 %r2728, %r2727, %r2723; - add.s32 %r2729, %r2728, %r2726; - shf.r.wrap.b32 %r2730, %r2713, %r2713, 2; - shf.r.wrap.b32 %r2731, %r2713, %r2713, 13; - xor.b32 %r2732, %r2730, %r2731; - shf.r.wrap.b32 %r2733, %r2713, %r2713, 22; - xor.b32 %r2734, %r2732, %r2733; - and.b32 %r2735, %r2714, %r2713; - and.b32 %r2736, %r2706, %r2536; - xor.b32 %r2737, %r2735, %r2736; - and.b32 %r2738, %r2714, %r2655; - xor.b32 %r2739, %r2737, %r2738; - add.s32 %r2740, %r2739, %r2734; - add.s32 %r2741, %r2740, %r2729; - add.s32 %r2742, %r2729, %r2656; - shf.r.wrap.b32 %r2743, %r2742, %r2742, 6; - shf.r.wrap.b32 %r2744, %r2742, %r2742, 11; - xor.b32 %r2745, %r2743, %r2744; - shf.r.wrap.b32 %r2746, %r2742, %r2742, 25; - xor.b32 %r2747, %r2745, %r2746; - xor.b32 %r2748, %r2716, %r2715; - and.b32 %r2749, %r2742, %r2748; - xor.b32 %r2750, %r2749, %r2716; - add.s32 %r2751, %r2657, %r2717; - add.s32 %r2752, %r2751, %r2750; - add.s32 %r2753, %r2752, %r2747; - shf.r.wrap.b32 %r2754, %r2741, %r2741, 2; - shf.r.wrap.b32 %r2755, %r2741, %r2741, 13; - xor.b32 %r2756, %r2754, %r2755; - shf.r.wrap.b32 %r2757, %r2741, %r2741, 22; - xor.b32 %r2758, %r2756, %r2757; - xor.b32 %r2759, %r2714, %r2713; - and.b32 %r2760, %r2741, %r2759; - xor.b32 %r2761, %r2760, %r2735; - add.s32 %r2762, %r2758, %r2761; - add.s32 %r2763, %r2753, %r2655; - cvt.u64.u32 %rd1149, %r2742; - cvt.u64.u32 %rd1150, %r2763; 
- cvt.u64.u32 %rd1151, %r2741; - add.s32 %r2764, %r2762, %r2753; - cvt.u64.u32 %rd1152, %r2764; - bfi.b64 %rd1153, %rd1151, %rd1152, 32, 32; - bfi.b64 %rd1154, %rd1149, %rd1150, 32, 32; - mov.b64 {%r2765, %r2766}, %rd1153; - mov.b64 {%r2767, %r2768}, %rd1154; - shr.u32 %r2769, %r2380, 7; - shr.u32 %r2770, %r2381, 7; - shr.u32 %r2771, %r2382, 7; - cvt.u64.u32 %rd1155, %r2771; - cvt.u64.u32 %rd1156, %r2769; - shr.u32 %r2772, %r2379, 7; - cvt.u64.u32 %rd1157, %r2772; - cvt.u64.u32 %rd1158, %r2770; - bfi.b64 %rd1159, %rd1156, %rd1157, 32, 32; - bfi.b64 %rd1160, %rd1155, %rd1158, 32, 32; - shl.b32 %r2773, %r2380, 25; - shl.b32 %r2774, %r2381, 25; - cvt.u64.u32 %rd1161, %r2773; - shl.b32 %r2775, %r2379, 25; - cvt.u64.u32 %rd1162, %r2775; - cvt.u64.u32 %rd1163, %r2774; - bfi.b64 %rd1164, %rd1161, %rd1162, 32, 32; - cvt.u64.u32 %rd1165, %r2382; - bfi.b64 %rd1166, %rd1165, %rd1163, 57, 7; - mov.b64 {%r2776, %r2777}, %rd1159; - mov.b64 {%r2778, %r2779}, %rd1160; - mov.b64 {%r2780, %r2781}, %rd1164; - mov.b64 {%r2782, %r2783}, %rd1166; - or.b64 %rd1167, %rd1164, %rd1159; - or.b32 %r2784, %r2781, %r2777; - or.b32 %r2785, %r2782, %r2778; - or.b32 %r2786, %r2783, %r2779; - cvt.u64.u32 %rd1168, %r2786; - cvt.u64.u32 %rd1169, %r2784; - and.b64 %rd1170, %rd1167, 4294967295; - cvt.u64.u32 %rd1171, %r2785; - bfi.b64 %rd1172, %rd1169, %rd1170, 32, 32; - bfi.b64 %rd1173, %rd1168, %rd1171, 32, 32; - shr.u32 %r2787, %r2380, 18; - shr.u32 %r2788, %r2381, 18; - shr.u32 %r2789, %r2382, 18; - cvt.u64.u32 %rd1174, %r2789; - cvt.u64.u32 %rd1175, %r2787; - shr.u32 %r2790, %r2379, 18; - cvt.u64.u32 %rd1176, %r2790; - cvt.u64.u32 %rd1177, %r2788; - bfi.b64 %rd1178, %rd1175, %rd1176, 32, 32; - bfi.b64 %rd1179, %rd1174, %rd1177, 32, 32; - shl.b32 %r2791, %r2380, 14; - shl.b32 %r2792, %r2381, 14; - cvt.u64.u32 %rd1180, %r2791; - shl.b32 %r2793, %r2379, 14; - cvt.u64.u32 %rd1181, %r2793; - cvt.u64.u32 %rd1182, %r2792; - bfi.b64 %rd1183, %rd1180, %rd1181, 32, 32; - bfi.b64 %rd1184, %rd1165, %rd1182, 
46, 18; - mov.b64 {%r2794, %r2795}, %rd1178; - mov.b64 {%r2796, %r2797}, %rd1179; - mov.b64 {%r2798, %r2799}, %rd1183; - mov.b64 {%r2800, %r2801}, %rd1184; - or.b64 %rd1185, %rd1183, %rd1178; - or.b32 %r2802, %r2799, %r2795; - or.b32 %r2803, %r2800, %r2796; - or.b32 %r2804, %r2801, %r2797; - cvt.u64.u32 %rd1186, %r2804; - cvt.u64.u32 %rd1187, %r2802; - and.b64 %rd1188, %rd1185, 4294967295; - cvt.u64.u32 %rd1189, %r2803; - bfi.b64 %rd1190, %rd1187, %rd1188, 32, 32; - bfi.b64 %rd1191, %rd1186, %rd1189, 32, 32; - shr.u32 %r2805, %r2380, 3; - shr.u32 %r2806, %r2381, 3; - shr.u32 %r2807, %r2382, 3; - cvt.u64.u32 %rd1192, %r2807; - cvt.u64.u32 %rd1193, %r2805; - shr.u32 %r2808, %r2379, 3; - cvt.u64.u32 %rd1194, %r2808; - cvt.u64.u32 %rd1195, %r2806; - bfi.b64 %rd1196, %rd1193, %rd1194, 32, 32; - bfi.b64 %rd1197, %rd1192, %rd1195, 32, 32; - mov.b64 {%r2809, %r2810}, %rd1172; - mov.b64 {%r2811, %r2812}, %rd1173; - mov.b64 {%r2813, %r2814}, %rd1190; - mov.b64 {%r2815, %r2816}, %rd1191; - xor.b64 %rd1198, %rd1190, %rd1172; - xor.b32 %r2817, %r2814, %r2810; - xor.b32 %r2818, %r2815, %r2811; - xor.b32 %r2819, %r2816, %r2812; - cvt.u64.u32 %rd1199, %r2819; - cvt.u64.u32 %rd1200, %r2817; - and.b64 %rd1201, %rd1198, 4294967295; - cvt.u64.u32 %rd1202, %r2818; - bfi.b64 %rd1203, %rd1200, %rd1201, 32, 32; - bfi.b64 %rd1204, %rd1199, %rd1202, 32, 32; - mov.b64 {%r2820, %r2821}, %rd1203; - mov.b64 {%r2822, %r2823}, %rd1204; - mov.b64 {%r2824, %r2825}, %rd1196; - mov.b64 {%r2826, %r2827}, %rd1197; - shf.l.wrap.b32 %r2828, %r2379, %r2379, 25; - shf.l.wrap.b32 %r2829, %r2379, %r2379, 14; - xor.b32 %r2830, %r2829, %r2828; - xor.b32 %r2831, %r2830, %r2808; - xor.b32 %r2832, %r2821, %r2825; - xor.b32 %r2833, %r2822, %r2826; - xor.b32 %r2834, %r2823, %r2827; - cvt.u64.u32 %rd1205, %r2421; - cvt.u64.u32 %rd1206, %r2420; - cvt.u64.u32 %rd1207, %r2650; - bfi.b64 %rd1208, %rd1021, %rd1207, 32, 32; - bfi.b64 %rd1209, %rd1205, %rd1206, 32, 32; - mov.b64 {%r2835, %r2836}, %rd1208; - mov.b64 
{%r2837, %r2838}, %rd1209; - shf.r.wrap.b32 %r2839, %r2648, %r2648, 17; - shf.r.wrap.b32 %r2840, %r2648, %r2648, 19; - xor.b32 %r2841, %r2839, %r2840; - shr.u32 %r2842, %r2648, 10; - xor.b32 %r2843, %r2841, %r2842; - add.s32 %r2844, %r2834, %r1966; - add.s32 %r2845, %r2844, %r2843; - add.s32 %r2846, %r2845, %r2838; - shf.r.wrap.b32 %r2847, %r2647, %r2647, 17; - shf.r.wrap.b32 %r2848, %r2647, %r2647, 19; - xor.b32 %r2849, %r2847, %r2848; - shr.u32 %r2850, %r2647, 10; - xor.b32 %r2851, %r2849, %r2850; - add.s32 %r2852, %r2833, %r1965; - add.s32 %r2853, %r2852, %r2851; - add.s32 %r2854, %r2853, %r2837; - shf.r.wrap.b32 %r2855, %r2846, %r2846, 17; - shf.r.wrap.b32 %r2856, %r2846, %r2846, 19; - xor.b32 %r2857, %r2855, %r2856; - shr.u32 %r2858, %r2846, 10; - xor.b32 %r2859, %r2857, %r2858; - add.s32 %r2860, %r2832, %r1964; - add.s32 %r2861, %r2860, %r2836; - add.s32 %r2862, %r2861, %r2859; - shf.r.wrap.b32 %r2863, %r2854, %r2854, 17; - shf.r.wrap.b32 %r2864, %r2854, %r2854, 19; - xor.b32 %r2865, %r2863, %r2864; - shr.u32 %r2866, %r2854, 10; - xor.b32 %r2867, %r2865, %r2866; - add.s32 %r2868, %r2831, %r1963; - add.s32 %r2869, %r2868, %r2835; - add.s32 %r2870, %r2869, %r2867; - cvt.u64.u32 %rd1210, %r2846; - cvt.u64.u32 %rd1211, %r2854; - cvt.u64.u32 %rd1212, %r2862; - cvt.u64.u32 %rd1213, %r2870; - bfi.b64 %rd1214, %rd1212, %rd1213, 32, 32; - bfi.b64 %rd1215, %rd1210, %rd1211, 32, 32; - mov.b64 {%r2871, %r2872}, %rd1214; - mov.b64 {%r2873, %r2874}, %rd1215; - cvt.u64.u32 %rd1216, %r2874; - cvt.u64.u32 %rd1217, %r2872; - cvt.u64.u32 %rd1218, %r2873; - bfi.b64 %rd1219, %rd1216, %rd1218, 32, 32; - bfi.b64 %rd1220, %rd1217, %rd1213, 32, 32; - mov.b64 {%r2875, %r2876}, %rd1220; - mov.b64 {%r2877, %r2878}, %rd1219; - add.s32 %r2879, %r2875, 1747873779; - add.s32 %r2880, %r2876, 1537002063; - add.s32 %r2881, %r2877, 1322822218; - add.s32 %r2882, %r2878, 958139571; - cvt.u64.u32 %rd1221, %r2882; - cvt.u64.u32 %rd1222, %r2880; - cvt.u64.u32 %rd1223, %r2881; - cvt.u64.u32 %rd1224, 
%r2879; - bfi.b64 %rd1225, %rd1222, %rd1224, 32, 32; - bfi.b64 %rd1226, %rd1221, %rd1223, 32, 32; - cvt.u64.u32 %rd1227, %r2768; - cvt.u64.u32 %rd1228, %r2766; - cvt.u64.u32 %rd1229, %r2767; - bfi.b64 %rd1230, %rd1228, %rd1152, 32, 32; - bfi.b64 %rd1231, %rd1227, %rd1229, 32, 32; - mov.b64 {%r2883, %r2884}, %rd1230; - mov.b64 {%r2885, %r2886}, %rd1231; - mov.b64 {%r2887, %r2888}, %rd1226; - shf.r.wrap.b32 %r2889, %r2885, %r2885, 6; - shf.r.wrap.b32 %r2890, %r2885, %r2885, 11; - xor.b32 %r2891, %r2889, %r2890; - shf.r.wrap.b32 %r2892, %r2885, %r2885, 25; - xor.b32 %r2893, %r2891, %r2892; - xor.b32 %r2894, %r2886, %r2715; - and.b32 %r2895, %r2894, %r2885; - xor.b32 %r2896, %r2895, %r2715; - add.s32 %r2897, %r2716, %r2888; - add.s32 %r2898, %r2897, %r2893; - add.s32 %r2899, %r2898, %r2896; - shf.r.wrap.b32 %r2900, %r2883, %r2883, 2; - shf.r.wrap.b32 %r2901, %r2883, %r2883, 13; - xor.b32 %r2902, %r2900, %r2901; - shf.r.wrap.b32 %r2903, %r2883, %r2883, 22; - xor.b32 %r2904, %r2902, %r2903; - and.b32 %r2905, %r2884, %r2883; - and.b32 %r2906, %r2764, %r2706; - xor.b32 %r2907, %r2905, %r2906; - and.b32 %r2908, %r2884, %r2713; - xor.b32 %r2909, %r2907, %r2908; - add.s32 %r2910, %r2909, %r2904; - add.s32 %r2911, %r2910, %r2899; - add.s32 %r2912, %r2899, %r2714; - shf.r.wrap.b32 %r2913, %r2912, %r2912, 6; - shf.r.wrap.b32 %r2914, %r2912, %r2912, 11; - xor.b32 %r2915, %r2913, %r2914; - shf.r.wrap.b32 %r2916, %r2912, %r2912, 25; - xor.b32 %r2917, %r2915, %r2916; - xor.b32 %r2918, %r2886, %r2885; - and.b32 %r2919, %r2912, %r2918; - xor.b32 %r2920, %r2919, %r2886; - add.s32 %r2921, %r2715, %r2887; - add.s32 %r2922, %r2921, %r2920; - add.s32 %r2923, %r2922, %r2917; - shf.r.wrap.b32 %r2924, %r2911, %r2911, 2; - shf.r.wrap.b32 %r2925, %r2911, %r2911, 13; - xor.b32 %r2926, %r2924, %r2925; - shf.r.wrap.b32 %r2927, %r2911, %r2911, 22; - xor.b32 %r2928, %r2926, %r2927; - xor.b32 %r2929, %r2884, %r2883; - and.b32 %r2930, %r2911, %r2929; - xor.b32 %r2931, %r2930, %r2905; - add.s32 %r2932, 
%r2928, %r2931; - add.s32 %r2933, %r2923, %r2713; - cvt.u64.u32 %rd1232, %r2912; - cvt.u64.u32 %rd1233, %r2933; - cvt.u64.u32 %rd1234, %r2911; - add.s32 %r2934, %r2932, %r2923; - cvt.u64.u32 %rd1235, %r2934; - bfi.b64 %rd1236, %rd1234, %rd1235, 32, 32; - bfi.b64 %rd1237, %rd1232, %rd1233, 32, 32; - mov.b64 {%r2935, %r2936}, %rd1236; - mov.b64 {%r2937, %r2938}, %rd1237; - mov.b64 {%r2939, %r2940}, %rd1225; - cvt.u64.u32 %rd1238, %r2940; - bfi.b64 %rd1239, %rd1238, %rd1224, 32, 32; - cvt.u64.u32 %rd1240, %r2938; - cvt.u64.u32 %rd1241, %r2936; - cvt.u64.u32 %rd1242, %r2937; - bfi.b64 %rd1243, %rd1241, %rd1235, 32, 32; - bfi.b64 %rd1244, %rd1240, %rd1242, 32, 32; - mov.b64 {%r2941, %r2942}, %rd1243; - mov.b64 {%r2943, %r2944}, %rd1244; - mov.b64 {%r2945, %r2946}, %rd1239; - shf.r.wrap.b32 %r2947, %r2943, %r2943, 6; - shf.r.wrap.b32 %r2948, %r2943, %r2943, 11; - xor.b32 %r2949, %r2947, %r2948; - shf.r.wrap.b32 %r2950, %r2943, %r2943, 25; - xor.b32 %r2951, %r2949, %r2950; - xor.b32 %r2952, %r2944, %r2885; - and.b32 %r2953, %r2952, %r2943; - xor.b32 %r2954, %r2953, %r2885; - add.s32 %r2955, %r2886, %r2946; - add.s32 %r2956, %r2955, %r2951; - add.s32 %r2957, %r2956, %r2954; - shf.r.wrap.b32 %r2958, %r2941, %r2941, 2; - shf.r.wrap.b32 %r2959, %r2941, %r2941, 13; - xor.b32 %r2960, %r2958, %r2959; - shf.r.wrap.b32 %r2961, %r2941, %r2941, 22; - xor.b32 %r2962, %r2960, %r2961; - and.b32 %r2963, %r2942, %r2941; - and.b32 %r2964, %r2934, %r2764; - xor.b32 %r2965, %r2963, %r2964; - and.b32 %r2966, %r2942, %r2883; - xor.b32 %r2967, %r2965, %r2966; - add.s32 %r2968, %r2967, %r2962; - add.s32 %r2969, %r2968, %r2957; - add.s32 %r2970, %r2957, %r2884; - shf.r.wrap.b32 %r2971, %r2970, %r2970, 6; - shf.r.wrap.b32 %r2972, %r2970, %r2970, 11; - xor.b32 %r2973, %r2971, %r2972; - shf.r.wrap.b32 %r2974, %r2970, %r2970, 25; - xor.b32 %r2975, %r2973, %r2974; - xor.b32 %r2976, %r2944, %r2943; - and.b32 %r2977, %r2970, %r2976; - xor.b32 %r2978, %r2977, %r2944; - add.s32 %r2979, %r2885, %r2945; - 
add.s32 %r2980, %r2979, %r2978; - add.s32 %r2981, %r2980, %r2975; - shf.r.wrap.b32 %r2982, %r2969, %r2969, 2; - shf.r.wrap.b32 %r2983, %r2969, %r2969, 13; - xor.b32 %r2984, %r2982, %r2983; - shf.r.wrap.b32 %r2985, %r2969, %r2969, 22; - xor.b32 %r2986, %r2984, %r2985; - xor.b32 %r2987, %r2942, %r2941; - and.b32 %r2988, %r2969, %r2987; - xor.b32 %r2989, %r2988, %r2963; - add.s32 %r2990, %r2986, %r2989; - add.s32 %r2991, %r2981, %r2883; - cvt.u64.u32 %rd1245, %r2970; - cvt.u64.u32 %rd1246, %r2991; - cvt.u64.u32 %rd1247, %r2969; - add.s32 %r2992, %r2990, %r2981; - cvt.u64.u32 %rd1248, %r2992; - bfi.b64 %rd1249, %rd1247, %rd1248, 32, 32; - bfi.b64 %rd1250, %rd1245, %rd1246, 32, 32; - mov.b64 {%r2993, %r2994}, %rd1249; - mov.b64 {%r2995, %r2996}, %rd1250; - shr.u32 %r2997, %r2608, 7; - shr.u32 %r2998, %r2609, 7; - shr.u32 %r2999, %r2610, 7; - cvt.u64.u32 %rd1251, %r2999; - cvt.u64.u32 %rd1252, %r2997; - shr.u32 %r3000, %r2607, 7; - cvt.u64.u32 %rd1253, %r3000; - cvt.u64.u32 %rd1254, %r2998; - bfi.b64 %rd1255, %rd1252, %rd1253, 32, 32; - bfi.b64 %rd1256, %rd1251, %rd1254, 32, 32; - shl.b32 %r3001, %r2608, 25; - shl.b32 %r3002, %r2609, 25; - cvt.u64.u32 %rd1257, %r3001; - shl.b32 %r3003, %r2607, 25; - cvt.u64.u32 %rd1258, %r3003; - cvt.u64.u32 %rd1259, %r3002; - bfi.b64 %rd1260, %rd1257, %rd1258, 32, 32; - cvt.u64.u32 %rd1261, %r2610; - bfi.b64 %rd1262, %rd1261, %rd1259, 57, 7; - mov.b64 {%r3004, %r3005}, %rd1255; - mov.b64 {%r3006, %r3007}, %rd1256; - mov.b64 {%r3008, %r3009}, %rd1260; - mov.b64 {%r3010, %r3011}, %rd1262; - or.b64 %rd1263, %rd1260, %rd1255; - or.b32 %r3012, %r3009, %r3005; - or.b32 %r3013, %r3010, %r3006; - or.b32 %r3014, %r3011, %r3007; - cvt.u64.u32 %rd1264, %r3014; - cvt.u64.u32 %rd1265, %r3012; - and.b64 %rd1266, %rd1263, 4294967295; - cvt.u64.u32 %rd1267, %r3013; - bfi.b64 %rd1268, %rd1265, %rd1266, 32, 32; - bfi.b64 %rd1269, %rd1264, %rd1267, 32, 32; - shr.u32 %r3015, %r2608, 18; - shr.u32 %r3016, %r2609, 18; - shr.u32 %r3017, %r2610, 18; - 
cvt.u64.u32 %rd1270, %r3017; - cvt.u64.u32 %rd1271, %r3015; - shr.u32 %r3018, %r2607, 18; - cvt.u64.u32 %rd1272, %r3018; - cvt.u64.u32 %rd1273, %r3016; - bfi.b64 %rd1274, %rd1271, %rd1272, 32, 32; - bfi.b64 %rd1275, %rd1270, %rd1273, 32, 32; - shl.b32 %r3019, %r2608, 14; - shl.b32 %r3020, %r2609, 14; - cvt.u64.u32 %rd1276, %r3019; - shl.b32 %r3021, %r2607, 14; - cvt.u64.u32 %rd1277, %r3021; - cvt.u64.u32 %rd1278, %r3020; - bfi.b64 %rd1279, %rd1276, %rd1277, 32, 32; - bfi.b64 %rd1280, %rd1261, %rd1278, 46, 18; - mov.b64 {%r3022, %r3023}, %rd1274; - mov.b64 {%r3024, %r3025}, %rd1275; - mov.b64 {%r3026, %r3027}, %rd1279; - mov.b64 {%r3028, %r3029}, %rd1280; - or.b64 %rd1281, %rd1279, %rd1274; - or.b32 %r3030, %r3027, %r3023; - or.b32 %r3031, %r3028, %r3024; - or.b32 %r3032, %r3029, %r3025; - cvt.u64.u32 %rd1282, %r3032; - cvt.u64.u32 %rd1283, %r3030; - and.b64 %rd1284, %rd1281, 4294967295; - cvt.u64.u32 %rd1285, %r3031; - bfi.b64 %rd1286, %rd1283, %rd1284, 32, 32; - bfi.b64 %rd1287, %rd1282, %rd1285, 32, 32; - shr.u32 %r3033, %r2608, 3; - shr.u32 %r3034, %r2609, 3; - shr.u32 %r3035, %r2610, 3; - cvt.u64.u32 %rd1288, %r3035; - cvt.u64.u32 %rd1289, %r3033; - shr.u32 %r3036, %r2607, 3; - cvt.u64.u32 %rd1290, %r3036; - cvt.u64.u32 %rd1291, %r3034; - bfi.b64 %rd1292, %rd1289, %rd1290, 32, 32; - bfi.b64 %rd1293, %rd1288, %rd1291, 32, 32; - mov.b64 {%r3037, %r3038}, %rd1268; - mov.b64 {%r3039, %r3040}, %rd1269; - mov.b64 {%r3041, %r3042}, %rd1286; - mov.b64 {%r3043, %r3044}, %rd1287; - xor.b64 %rd1294, %rd1286, %rd1268; - xor.b32 %r3045, %r3042, %r3038; - xor.b32 %r3046, %r3043, %r3039; - xor.b32 %r3047, %r3044, %r3040; - cvt.u64.u32 %rd1295, %r3047; - cvt.u64.u32 %rd1296, %r3045; - and.b64 %rd1297, %rd1294, 4294967295; - cvt.u64.u32 %rd1298, %r3046; - bfi.b64 %rd1299, %rd1296, %rd1297, 32, 32; - bfi.b64 %rd1300, %rd1295, %rd1298, 32, 32; - mov.b64 {%r3048, %r3049}, %rd1299; - mov.b64 {%r3050, %r3051}, %rd1300; - mov.b64 {%r3052, %r3053}, %rd1292; - mov.b64 {%r3054, %r3055}, 
%rd1293; - shf.l.wrap.b32 %r3056, %r2607, %r2607, 25; - shf.l.wrap.b32 %r3057, %r2607, %r2607, 14; - xor.b32 %r3058, %r3057, %r3056; - xor.b32 %r3059, %r3058, %r3036; - xor.b32 %r3060, %r3049, %r3053; - xor.b32 %r3061, %r3050, %r3054; - xor.b32 %r3062, %r3051, %r3055; - cvt.u64.u32 %rd1301, %r2649; - cvt.u64.u32 %rd1302, %r2648; - cvt.u64.u32 %rd1303, %r2878; - bfi.b64 %rd1304, %rd1117, %rd1303, 32, 32; - bfi.b64 %rd1305, %rd1301, %rd1302, 32, 32; - mov.b64 {%r3063, %r3064}, %rd1304; - mov.b64 {%r3065, %r3066}, %rd1305; - shf.r.wrap.b32 %r3067, %r2876, %r2876, 17; - shf.r.wrap.b32 %r3068, %r2876, %r2876, 19; - xor.b32 %r3069, %r3067, %r3068; - shr.u32 %r3070, %r2876, 10; - xor.b32 %r3071, %r3069, %r3070; - add.s32 %r3072, %r3062, %r2194; - add.s32 %r3073, %r3072, %r3071; - add.s32 %r3074, %r3073, %r3066; - shf.r.wrap.b32 %r3075, %r2875, %r2875, 17; - shf.r.wrap.b32 %r3076, %r2875, %r2875, 19; - xor.b32 %r3077, %r3075, %r3076; - shr.u32 %r3078, %r2875, 10; - xor.b32 %r3079, %r3077, %r3078; - add.s32 %r3080, %r3061, %r2193; - add.s32 %r3081, %r3080, %r3079; - add.s32 %r3082, %r3081, %r3065; - shf.r.wrap.b32 %r3083, %r3074, %r3074, 17; - shf.r.wrap.b32 %r3084, %r3074, %r3074, 19; - xor.b32 %r3085, %r3083, %r3084; - shr.u32 %r3086, %r3074, 10; - xor.b32 %r3087, %r3085, %r3086; - add.s32 %r3088, %r3060, %r2192; - add.s32 %r3089, %r3088, %r3064; - add.s32 %r3090, %r3089, %r3087; - shf.r.wrap.b32 %r3091, %r3082, %r3082, 17; - shf.r.wrap.b32 %r3092, %r3082, %r3082, 19; - xor.b32 %r3093, %r3091, %r3092; - shr.u32 %r3094, %r3082, 10; - xor.b32 %r3095, %r3093, %r3094; - add.s32 %r3096, %r3059, %r2191; - add.s32 %r3097, %r3096, %r3063; - add.s32 %r3098, %r3097, %r3095; - add.s32 %r3099, %r3098, -1933114872; - add.s32 %r3100, %r3090, -2067236844; - add.s32 %r3101, %r3082, 2024104815; - add.s32 %r3102, %r3074, 1955562222; - cvt.u64.u32 %rd1306, %r3102; - cvt.u64.u32 %rd1307, %r3101; - cvt.u64.u32 %rd1308, %r3100; - cvt.u64.u32 %rd1309, %r3099; - bfi.b64 %rd1310, %rd1308, 
%rd1309, 32, 32; - bfi.b64 %rd1311, %rd1306, %rd1307, 32, 32; - cvt.u64.u32 %rd1312, %r2996; - cvt.u64.u32 %rd1313, %r2994; - cvt.u64.u32 %rd1314, %r2995; - bfi.b64 %rd1315, %rd1313, %rd1248, 32, 32; - bfi.b64 %rd1316, %rd1312, %rd1314, 32, 32; - mov.b64 {%r3103, %r3104}, %rd1315; - mov.b64 {%r3105, %r3106}, %rd1316; - mov.b64 {%r3107, %r3108}, %rd1311; - shf.r.wrap.b32 %r3109, %r3105, %r3105, 6; - shf.r.wrap.b32 %r3110, %r3105, %r3105, 11; - xor.b32 %r3111, %r3109, %r3110; - shf.r.wrap.b32 %r3112, %r3105, %r3105, 25; - xor.b32 %r3113, %r3111, %r3112; - xor.b32 %r3114, %r3106, %r2943; - and.b32 %r3115, %r3114, %r3105; - xor.b32 %r3116, %r3115, %r2943; - add.s32 %r3117, %r2944, %r3108; - add.s32 %r3118, %r3117, %r3113; - add.s32 %r3119, %r3118, %r3116; - shf.r.wrap.b32 %r3120, %r3103, %r3103, 2; - shf.r.wrap.b32 %r3121, %r3103, %r3103, 13; - xor.b32 %r3122, %r3120, %r3121; - shf.r.wrap.b32 %r3123, %r3103, %r3103, 22; - xor.b32 %r3124, %r3122, %r3123; - and.b32 %r3125, %r3104, %r3103; - and.b32 %r3126, %r2992, %r2934; - xor.b32 %r3127, %r3125, %r3126; - and.b32 %r3128, %r3104, %r2941; - xor.b32 %r3129, %r3127, %r3128; - add.s32 %r3130, %r3129, %r3124; - add.s32 %r3131, %r3130, %r3119; - add.s32 %r3132, %r3119, %r2942; - shf.r.wrap.b32 %r3133, %r3132, %r3132, 6; - shf.r.wrap.b32 %r3134, %r3132, %r3132, 11; - xor.b32 %r3135, %r3133, %r3134; - shf.r.wrap.b32 %r3136, %r3132, %r3132, 25; - xor.b32 %r3137, %r3135, %r3136; - xor.b32 %r3138, %r3106, %r3105; - and.b32 %r3139, %r3132, %r3138; - xor.b32 %r3140, %r3139, %r3106; - add.s32 %r3141, %r2943, %r3107; - add.s32 %r3142, %r3141, %r3140; - add.s32 %r3143, %r3142, %r3137; - shf.r.wrap.b32 %r3144, %r3131, %r3131, 2; - shf.r.wrap.b32 %r3145, %r3131, %r3131, 13; - xor.b32 %r3146, %r3144, %r3145; - shf.r.wrap.b32 %r3147, %r3131, %r3131, 22; - xor.b32 %r3148, %r3146, %r3147; - xor.b32 %r3149, %r3104, %r3103; - and.b32 %r3150, %r3131, %r3149; - xor.b32 %r3151, %r3150, %r3125; - add.s32 %r3152, %r3148, %r3151; - add.s32 %r3153, 
%r3143, %r2941; - cvt.u64.u32 %rd1317, %r3132; - cvt.u64.u32 %rd1318, %r3153; - cvt.u64.u32 %rd1319, %r3131; - add.s32 %r3154, %r3152, %r3143; - cvt.u64.u32 %rd1320, %r3154; - bfi.b64 %rd1321, %rd1319, %rd1320, 32, 32; - bfi.b64 %rd1322, %rd1317, %rd1318, 32, 32; - mov.b64 {%r3155, %r3156}, %rd1321; - mov.b64 {%r3157, %r3158}, %rd1322; - mov.b64 {%r3159, %r3160}, %rd1310; - cvt.u64.u32 %rd1323, %r3160; - bfi.b64 %rd1324, %rd1323, %rd1309, 32, 32; - cvt.u64.u32 %rd1325, %r3158; - cvt.u64.u32 %rd1326, %r3156; - cvt.u64.u32 %rd1327, %r3157; - bfi.b64 %rd1328, %rd1326, %rd1320, 32, 32; - bfi.b64 %rd1329, %rd1325, %rd1327, 32, 32; - mov.b64 {%r3161, %r3162}, %rd1328; - mov.b64 {%r3163, %r3164}, %rd1329; - mov.b64 {%r3165, %r3166}, %rd1324; - shf.r.wrap.b32 %r3167, %r3163, %r3163, 6; - shf.r.wrap.b32 %r3168, %r3163, %r3163, 11; - xor.b32 %r3169, %r3167, %r3168; - shf.r.wrap.b32 %r3170, %r3163, %r3163, 25; - xor.b32 %r3171, %r3169, %r3170; - xor.b32 %r3172, %r3164, %r3105; - and.b32 %r3173, %r3172, %r3163; - xor.b32 %r3174, %r3173, %r3105; - add.s32 %r3175, %r3106, %r3166; - add.s32 %r3176, %r3175, %r3171; - add.s32 %r3177, %r3176, %r3174; - shf.r.wrap.b32 %r3178, %r3161, %r3161, 2; - shf.r.wrap.b32 %r3179, %r3161, %r3161, 13; - xor.b32 %r3180, %r3178, %r3179; - shf.r.wrap.b32 %r3181, %r3161, %r3161, 22; - xor.b32 %r3182, %r3180, %r3181; - and.b32 %r3183, %r3162, %r3161; - and.b32 %r3184, %r3154, %r2992; - xor.b32 %r3185, %r3183, %r3184; - and.b32 %r3186, %r3162, %r3103; - xor.b32 %r3187, %r3185, %r3186; - add.s32 %r3188, %r3187, %r3182; - add.s32 %r3189, %r3188, %r3177; - add.s32 %r3190, %r3177, %r3104; - shf.r.wrap.b32 %r3191, %r3190, %r3190, 6; - shf.r.wrap.b32 %r3192, %r3190, %r3190, 11; - xor.b32 %r3193, %r3191, %r3192; - shf.r.wrap.b32 %r3194, %r3190, %r3190, 25; - xor.b32 %r3195, %r3193, %r3194; - xor.b32 %r3196, %r3164, %r3163; - and.b32 %r3197, %r3190, %r3196; - xor.b32 %r3198, %r3197, %r3164; - add.s32 %r3199, %r3105, %r3165; - add.s32 %r3200, %r3199, %r3198; - 
add.s32 %r3201, %r3200, %r3195; - shf.r.wrap.b32 %r3202, %r3189, %r3189, 2; - shf.r.wrap.b32 %r3203, %r3189, %r3189, 13; - xor.b32 %r3204, %r3202, %r3203; - shf.r.wrap.b32 %r3205, %r3189, %r3189, 22; - xor.b32 %r3206, %r3204, %r3205; - xor.b32 %r3207, %r3162, %r3161; - and.b32 %r3208, %r3189, %r3207; - xor.b32 %r3209, %r3208, %r3183; - add.s32 %r3210, %r3206, %r3209; - add.s32 %r3211, %r3201, %r3103; - cvt.u64.u32 %rd1330, %r3190; - cvt.u64.u32 %rd1331, %r3211; - cvt.u64.u32 %rd1332, %r3189; - add.s32 %r3212, %r3210, %r3201; - cvt.u64.u32 %rd1333, %r3212; - bfi.b64 %rd1334, %rd1332, %rd1333, 32, 32; - bfi.b64 %rd1335, %rd1330, %rd1331, 32, 32; - mov.b64 {%r3213, %r3214}, %rd1334; - mov.b64 {%r3215, %r3216}, %rd1335; - shr.u32 %r3217, %r2836, 7; - shr.u32 %r3218, %r2837, 7; - shr.u32 %r3219, %r2838, 7; - cvt.u64.u32 %rd1336, %r3219; - cvt.u64.u32 %rd1337, %r3217; - shr.u32 %r3220, %r2835, 7; - cvt.u64.u32 %rd1338, %r3220; - cvt.u64.u32 %rd1339, %r3218; - bfi.b64 %rd1340, %rd1337, %rd1338, 32, 32; - bfi.b64 %rd1341, %rd1336, %rd1339, 32, 32; - shl.b32 %r3221, %r2836, 25; - shl.b32 %r3222, %r2837, 25; - cvt.u64.u32 %rd1342, %r3221; - shl.b32 %r3223, %r2835, 25; - cvt.u64.u32 %rd1343, %r3223; - cvt.u64.u32 %rd1344, %r3222; - bfi.b64 %rd1345, %rd1342, %rd1343, 32, 32; - cvt.u64.u32 %rd1346, %r2838; - bfi.b64 %rd1347, %rd1346, %rd1344, 57, 7; - mov.b64 {%r3224, %r3225}, %rd1340; - mov.b64 {%r3226, %r3227}, %rd1341; - mov.b64 {%r3228, %r3229}, %rd1345; - mov.b64 {%r3230, %r3231}, %rd1347; - or.b64 %rd1348, %rd1345, %rd1340; - or.b32 %r3232, %r3229, %r3225; - or.b32 %r3233, %r3230, %r3226; - or.b32 %r3234, %r3231, %r3227; - cvt.u64.u32 %rd1349, %r3234; - cvt.u64.u32 %rd1350, %r3232; - and.b64 %rd1351, %rd1348, 4294967295; - cvt.u64.u32 %rd1352, %r3233; - bfi.b64 %rd1353, %rd1350, %rd1351, 32, 32; - bfi.b64 %rd1354, %rd1349, %rd1352, 32, 32; - shr.u32 %r3235, %r2836, 18; - shr.u32 %r3236, %r2837, 18; - shr.u32 %r3237, %r2838, 18; - cvt.u64.u32 %rd1355, %r3237; - cvt.u64.u32 
%rd1356, %r3235; - shr.u32 %r3238, %r2835, 18; - cvt.u64.u32 %rd1357, %r3238; - cvt.u64.u32 %rd1358, %r3236; - bfi.b64 %rd1359, %rd1356, %rd1357, 32, 32; - bfi.b64 %rd1360, %rd1355, %rd1358, 32, 32; - shl.b32 %r3239, %r2836, 14; - shl.b32 %r3240, %r2837, 14; - cvt.u64.u32 %rd1361, %r3239; - shl.b32 %r3241, %r2835, 14; - cvt.u64.u32 %rd1362, %r3241; - cvt.u64.u32 %rd1363, %r3240; - bfi.b64 %rd1364, %rd1361, %rd1362, 32, 32; - bfi.b64 %rd1365, %rd1346, %rd1363, 46, 18; - mov.b64 {%r3242, %r3243}, %rd1359; - mov.b64 {%r3244, %r3245}, %rd1360; - mov.b64 {%r3246, %r3247}, %rd1364; - mov.b64 {%r3248, %r3249}, %rd1365; - or.b64 %rd1366, %rd1364, %rd1359; - or.b32 %r3250, %r3247, %r3243; - or.b32 %r3251, %r3248, %r3244; - or.b32 %r3252, %r3249, %r3245; - cvt.u64.u32 %rd1367, %r3252; - cvt.u64.u32 %rd1368, %r3250; - and.b64 %rd1369, %rd1366, 4294967295; - cvt.u64.u32 %rd1370, %r3251; - bfi.b64 %rd1371, %rd1368, %rd1369, 32, 32; - bfi.b64 %rd1372, %rd1367, %rd1370, 32, 32; - shr.u32 %r3253, %r2836, 3; - shr.u32 %r3254, %r2837, 3; - shr.u32 %r3255, %r2838, 3; - cvt.u64.u32 %rd1373, %r3255; - cvt.u64.u32 %rd1374, %r3253; - shr.u32 %r3256, %r2835, 3; - cvt.u64.u32 %rd1375, %r3256; - cvt.u64.u32 %rd1376, %r3254; - bfi.b64 %rd1377, %rd1374, %rd1375, 32, 32; - bfi.b64 %rd1378, %rd1373, %rd1376, 32, 32; - mov.b64 {%r3257, %r3258}, %rd1353; - mov.b64 {%r3259, %r3260}, %rd1354; - mov.b64 {%r3261, %r3262}, %rd1371; - mov.b64 {%r3263, %r3264}, %rd1372; - xor.b64 %rd1379, %rd1371, %rd1353; - xor.b32 %r3265, %r3262, %r3258; - xor.b32 %r3266, %r3263, %r3259; - xor.b32 %r3267, %r3264, %r3260; - cvt.u64.u32 %rd1380, %r3267; - cvt.u64.u32 %rd1381, %r3265; - and.b64 %rd1382, %rd1379, 4294967295; - cvt.u64.u32 %rd1383, %r3266; - bfi.b64 %rd1384, %rd1381, %rd1382, 32, 32; - bfi.b64 %rd1385, %rd1380, %rd1383, 32, 32; - mov.b64 {%r3268, %r3269}, %rd1384; - mov.b64 {%r3270, %r3271}, %rd1385; - mov.b64 {%r3272, %r3273}, %rd1377; - mov.b64 {%r3274, %r3275}, %rd1378; - shf.l.wrap.b32 %r3276, %r2835, 
%r2835, 25; - shf.l.wrap.b32 %r3277, %r2835, %r2835, 14; - xor.b32 %r3278, %r3277, %r3276; - xor.b32 %r3279, %r3278, %r3256; - xor.b32 %r3280, %r3269, %r3273; - xor.b32 %r3281, %r3270, %r3274; - xor.b32 %r3282, %r3271, %r3275; - cvt.u64.u32 %rd1386, %r2877; - cvt.u64.u32 %rd1387, %r2876; - cvt.u64.u32 %rd1388, %r3074; - bfi.b64 %rd1389, %rd1386, %rd1387, 32, 32; - bfi.b64 %rd1390, %rd1213, %rd1388, 32, 32; - mov.b64 {%r3283, %r3284}, %rd1390; - mov.b64 {%r3285, %r3286}, %rd1389; - shf.r.wrap.b32 %r3287, %r3090, %r3090, 17; - shf.r.wrap.b32 %r3288, %r3090, %r3090, 19; - xor.b32 %r3289, %r3287, %r3288; - shr.u32 %r3290, %r3090, 10; - xor.b32 %r3291, %r3289, %r3290; - add.s32 %r3292, %r3282, %r2422; - add.s32 %r3293, %r3292, %r3286; - add.s32 %r3294, %r3293, %r3291; - shf.r.wrap.b32 %r3295, %r3098, %r3098, 17; - shf.r.wrap.b32 %r3296, %r3098, %r3098, 19; - xor.b32 %r3297, %r3295, %r3296; - shr.u32 %r3298, %r3098, 10; - xor.b32 %r3299, %r3297, %r3298; - add.s32 %r3300, %r3281, %r2421; - add.s32 %r3301, %r3300, %r3285; - add.s32 %r3302, %r3301, %r3299; - shf.r.wrap.b32 %r3303, %r3294, %r3294, 17; - shf.r.wrap.b32 %r3304, %r3294, %r3294, 19; - xor.b32 %r3305, %r3303, %r3304; - shr.u32 %r3306, %r3294, 10; - xor.b32 %r3307, %r3305, %r3306; - add.s32 %r3308, %r3280, %r2420; - add.s32 %r3309, %r3308, %r3284; - add.s32 %r3310, %r3309, %r3307; - shf.r.wrap.b32 %r3311, %r3302, %r3302, 17; - shf.r.wrap.b32 %r3312, %r3302, %r3302, 19; - xor.b32 %r3313, %r3311, %r3312; - shr.u32 %r3314, %r3302, 10; - xor.b32 %r3315, %r3313, %r3314; - add.s32 %r3316, %r3279, %r2419; - add.s32 %r3317, %r3316, %r3283; - add.s32 %r3318, %r3317, %r3315; - cvt.u64.u32 %rd1391, %r3294; - cvt.u64.u32 %rd1392, %r3302; - cvt.u64.u32 %rd1393, %r3310; - cvt.u64.u32 %rd1394, %r3318; - bfi.b64 %rd1395, %rd1393, %rd1394, 32, 32; - bfi.b64 %rd1396, %rd1391, %rd1392, 32, 32; - mov.b64 {%r3319, %r3320}, %rd1395; - mov.b64 {%r3321, %r3322}, %rd1396; - cvt.u64.u32 %rd1397, %r3322; - cvt.u64.u32 %rd1398, %r3320; - 
cvt.u64.u32 %rd1399, %r3321; - bfi.b64 %rd1400, %rd1397, %rd1399, 32, 32; - bfi.b64 %rd1401, %rd1398, %rd1394, 32, 32; - mov.b64 {%r3323, %r3324}, %rd1401; - mov.b64 {%r3325, %r3326}, %rd1400; - add.s32 %r3327, %r3323, -965641998; - add.s32 %r3328, %r3324, -1090935817; - add.s32 %r3329, %r3325, -1538233109; - add.s32 %r3330, %r3326, -1866530822; - cvt.u64.u32 %rd1402, %r3330; - cvt.u64.u32 %rd1403, %r3328; - cvt.u64.u32 %rd1404, %r3329; - cvt.u64.u32 %rd1405, %r3327; - bfi.b64 %rd1406, %rd1403, %rd1405, 32, 32; - bfi.b64 %rd1407, %rd1402, %rd1404, 32, 32; - cvt.u64.u32 %rd1408, %r3216; - cvt.u64.u32 %rd1409, %r3214; - cvt.u64.u32 %rd1410, %r3215; - bfi.b64 %rd1411, %rd1409, %rd1333, 32, 32; - bfi.b64 %rd1412, %rd1408, %rd1410, 32, 32; - mov.b64 {%r3331, %r3332}, %rd1411; - mov.b64 {%r3333, %r3334}, %rd1412; - mov.b64 {%r3335, %r3336}, %rd1407; - shf.r.wrap.b32 %r3337, %r3333, %r3333, 6; - shf.r.wrap.b32 %r3338, %r3333, %r3333, 11; - xor.b32 %r3339, %r3337, %r3338; - shf.r.wrap.b32 %r3340, %r3333, %r3333, 25; - xor.b32 %r3341, %r3339, %r3340; - xor.b32 %r3342, %r3334, %r3163; - and.b32 %r3343, %r3342, %r3333; - xor.b32 %r3344, %r3343, %r3163; - add.s32 %r3345, %r3164, %r3336; - add.s32 %r3346, %r3345, %r3341; - add.s32 %r3347, %r3346, %r3344; - shf.r.wrap.b32 %r3348, %r3331, %r3331, 2; - shf.r.wrap.b32 %r3349, %r3331, %r3331, 13; - xor.b32 %r3350, %r3348, %r3349; - shf.r.wrap.b32 %r3351, %r3331, %r3331, 22; - xor.b32 %r3352, %r3350, %r3351; - and.b32 %r3353, %r3332, %r3331; - and.b32 %r3354, %r3212, %r3154; - xor.b32 %r3355, %r3353, %r3354; - and.b32 %r3356, %r3332, %r3161; - xor.b32 %r3357, %r3355, %r3356; - add.s32 %r3358, %r3357, %r3352; - add.s32 %r3359, %r3358, %r3347; - add.s32 %r3360, %r3347, %r3162; - shf.r.wrap.b32 %r3361, %r3360, %r3360, 6; - shf.r.wrap.b32 %r3362, %r3360, %r3360, 11; - xor.b32 %r3363, %r3361, %r3362; - shf.r.wrap.b32 %r3364, %r3360, %r3360, 25; - xor.b32 %r3365, %r3363, %r3364; - xor.b32 %r3366, %r3334, %r3333; - and.b32 %r3367, %r3360, 
%r3366; - xor.b32 %r3368, %r3367, %r3334; - add.s32 %r3369, %r3163, %r3335; - add.s32 %r3370, %r3369, %r3368; - add.s32 %r3371, %r3370, %r3365; - shf.r.wrap.b32 %r3372, %r3359, %r3359, 2; - shf.r.wrap.b32 %r3373, %r3359, %r3359, 13; - xor.b32 %r3374, %r3372, %r3373; - shf.r.wrap.b32 %r3375, %r3359, %r3359, 22; - xor.b32 %r3376, %r3374, %r3375; - xor.b32 %r3377, %r3332, %r3331; - and.b32 %r3378, %r3359, %r3377; - xor.b32 %r3379, %r3378, %r3353; - add.s32 %r3380, %r3376, %r3379; - add.s32 %r3381, %r3371, %r3161; - cvt.u64.u32 %rd1413, %r3360; - cvt.u64.u32 %rd1414, %r3381; - cvt.u64.u32 %rd1415, %r3359; - add.s32 %r3382, %r3380, %r3371; - cvt.u64.u32 %rd1416, %r3382; - bfi.b64 %rd1417, %rd1415, %rd1416, 32, 32; - bfi.b64 %rd1418, %rd1413, %rd1414, 32, 32; - mov.b64 {%r3383, %r3384}, %rd1417; - mov.b64 {%r3385, %r3386}, %rd1418; - mov.b64 {%r3387, %r3388}, %rd1406; - cvt.u64.u32 %rd1419, %r3388; - bfi.b64 %rd1420, %rd1419, %rd1405, 32, 32; - cvt.u64.u32 %rd1421, %r3386; - cvt.u64.u32 %rd1422, %r3384; - cvt.u64.u32 %rd1423, %r3385; - bfi.b64 %rd1424, %rd1422, %rd1416, 32, 32; - bfi.b64 %rd1425, %rd1421, %rd1423, 32, 32; - mov.b64 {%r3389, %r3390}, %rd1424; - mov.b64 {%r3391, %r3392}, %rd1425; - mov.b64 {%r3393, %r3394}, %rd1420; - shf.r.wrap.b32 %r3395, %r3391, %r3391, 6; - shf.r.wrap.b32 %r3396, %r3391, %r3391, 11; - xor.b32 %r3397, %r3395, %r3396; - shf.r.wrap.b32 %r3398, %r3391, %r3391, 25; - xor.b32 %r3399, %r3397, %r3398; - xor.b32 %r3400, %r3392, %r3333; - and.b32 %r3401, %r3400, %r3391; - xor.b32 %r3402, %r3401, %r3333; - add.s32 %r3403, %r3334, %r3394; - add.s32 %r3404, %r3403, %r3399; - add.s32 %r3405, %r3404, %r3402; - shf.r.wrap.b32 %r3406, %r3389, %r3389, 2; - shf.r.wrap.b32 %r3407, %r3389, %r3389, 13; - xor.b32 %r3408, %r3406, %r3407; - shf.r.wrap.b32 %r3409, %r3389, %r3389, 22; - xor.b32 %r3410, %r3408, %r3409; - and.b32 %r3411, %r3390, %r3389; - and.b32 %r3412, %r3382, %r3212; - xor.b32 %r3413, %r3411, %r3412; - and.b32 %r3414, %r3390, %r3331; - xor.b32 
%r3415, %r3413, %r3414; - add.s32 %r3416, %r3415, %r3410; - add.s32 %r3417, %r3416, %r3405; - add.s32 %r3418, %r3405, %r3332; - shf.r.wrap.b32 %r3419, %r3418, %r3418, 6; - shf.r.wrap.b32 %r3420, %r3418, %r3418, 11; - xor.b32 %r3421, %r3419, %r3420; - shf.r.wrap.b32 %r3422, %r3418, %r3418, 25; - xor.b32 %r3423, %r3421, %r3422; - xor.b32 %r3424, %r3392, %r3391; - and.b32 %r3425, %r3418, %r3424; - xor.b32 %r3426, %r3425, %r3392; - add.s32 %r3427, %r3333, %r3393; - add.s32 %r3428, %r3427, %r3426; - add.s32 %r3429, %r3428, %r3423; - shf.r.wrap.b32 %r3430, %r3417, %r3417, 2; - shf.r.wrap.b32 %r3431, %r3417, %r3417, 13; - xor.b32 %r3432, %r3430, %r3431; - shf.r.wrap.b32 %r3433, %r3417, %r3417, 22; - xor.b32 %r3434, %r3432, %r3433; - xor.b32 %r3435, %r3390, %r3389; - and.b32 %r3436, %r3417, %r3435; - xor.b32 %r3437, %r3436, %r3411; - add.s32 %r3438, %r3437, %r3448; - add.s32 %r3439, %r3438, %r3434; - add.s32 %r3448, %r3439, %r3429; - add.s32 %r3447, %r3417, %r3447; - add.s32 %r3446, %r3382, %r3446; - add.s32 %r3445, %r3384, %r3445; - add.s32 %r3440, %r3331, %r3444; - add.s32 %r3444, %r3440, %r3429; - add.s32 %r3443, %r3418, %r3443; - add.s32 %r3442, %r3385, %r3442; - add.s32 %r3441, %r3386, %r3441; - setp.ne.s64 %p18, %rd1428, %rd3; - @%p18 bra $L__BB2_2; - -$L__BB2_20: - ld.param.u64 %rd1427, [_ZN4sha26sha25611compress25617h9eb7f017ff169f1fE_param_0]; - cvta.to.local.u64 %rd1426, %rd1427; - st.local.u32 [%rd1426], %r3448; - st.local.u32 [%rd1426+4], %r3447; - st.local.u32 [%rd1426+8], %r3446; - st.local.u32 [%rd1426+12], %r3445; - st.local.u32 [%rd1426+16], %r3444; - st.local.u32 [%rd1426+20], %r3443; - st.local.u32 [%rd1426+24], %r3442; - st.local.u32 [%rd1426+28], %r3441; - ret; - -$L__BB2_18: - { // callseq 48, 0 - .reg .b32 temp_param_reg; - call.uni - _ZN4core6result13unwrap_failed17h995d1a0127e5a880E, - ( - ); - } // callseq 48 - -} -.func _ZN4core5slice5index24slice_end_index_len_fail17habecc7827e70e1d9E() -.noreturn -{ - - - - trap; - -} -.func 
_ZN4core5slice5index26slice_start_index_len_fail17h31c4387487c2b57aE() -.noreturn -{ - - - - trap; - -} -.func _ZN4core6result13unwrap_failed17h995d1a0127e5a880E() -.noreturn -{ - - - - trap; - -} -