From 56b920329f379cbb8b2e6ed5e41264d92454cebc Mon Sep 17 00:00:00 2001 From: Charles Kawczynski Date: Wed, 15 May 2024 15:35:24 -0400 Subject: [PATCH] Reduce global memory reads --- src/MatrixFields/single_field_solver.jl | 17 ++++++++++++----- 1 file changed, 12 insertions(+), 5 deletions(-) diff --git a/src/MatrixFields/single_field_solver.jl b/src/MatrixFields/single_field_solver.jl index 4354c2a30f..a5f6a22bc0 100644 --- a/src/MatrixFields/single_field_solver.jl +++ b/src/MatrixFields/single_field_solver.jl @@ -125,13 +125,20 @@ function band_matrix_solve!(::Type{<:TridiagonalMatrixRow}, cache, x, Aⱼs, b) n = length(x) @inbounds begin inv_D₀ = inv(A₀[1]) - Ux[1] = inv_D₀ ⊠ b[1] - U₊₁[1] = inv_D₀ ⊠ A₊₁[1] + U₊₁ᵢ₋₁ = inv_D₀ ⊠ A₊₁[1] + Uxᵢ₋₁ = inv_D₀ ⊠ b[1] + Ux[1] = Uxᵢ₋₁ + U₊₁[1] = U₊₁ᵢ₋₁ for i in 2:n - inv_D₀ = inv(A₀[i] ⊟ A₋₁[i] ⊠ U₊₁[i - 1]) - Ux[i] = inv_D₀ ⊠ (b[i] ⊟ A₋₁[i] ⊠ Ux[i - 1]) - i < n && (U₊₁[i] = inv_D₀ ⊠ A₊₁[i]) # U₊₁[n] is outside the matrix. + A₋₁ᵢ = A₋₁[i] + inv_D₀ = inv(A₀[i] ⊟ A₋₁ᵢ ⊠ U₊₁ᵢ₋₁) + Uxᵢ₋₁ = inv_D₀ ⊠ (b[i] ⊟ A₋₁ᵢ ⊠ Uxᵢ₋₁) + Ux[i] = Uxᵢ₋₁ + if i < n + U₊₁ᵢ₋₁ = inv_D₀ ⊠ A₊₁[i] # U₊₁[n] is outside the matrix. + U₊₁[i] = U₊₁ᵢ₋₁ + end end x[n] = Ux[n]