|
98 | 98 | end
|
99 | 99 |
|
100 | 100 |
|
101 |
| - |
102 |
| -@inline function materialize!(M::MatLdivVec{<:TriangularLayout{'U',UNIT,<:AbstractBlockBandedLayout}, |
103 |
| - <:AbstractStridedLayout}) where UNIT |
104 |
| - U,dest = M.A,M.B |
105 |
| - T = eltype(dest) |
106 |
| - |
107 |
| - A = triangulardata(U) |
108 |
| - @assert hasmatchingblocks(A) |
109 |
| - |
110 |
| - @boundscheck size(A,1) == size(dest,1) || throw(BoundsError()) |
111 |
| - |
112 |
| - # impose block structure |
113 |
| - b = PseudoBlockArray(dest, BlockSizes((cumulsizes(blocksizes(A),1),))) |
114 |
| - |
115 |
| - Bs = blocksizes(A) |
116 |
| - N = nblocks(Bs,1) |
117 |
| - |
118 |
| - for K = N:-1:1 |
119 |
| - b_2 = view(b, Block(K)) |
120 |
| - Ũ = _triangular_matrix(Val('U'), Val(UNIT), view(A, Block(K,K))) |
121 |
| - apply!(\, Ũ, b_2) |
122 |
| - |
123 |
| - if K ≥ 2 |
124 |
| - KR = blockcolstart(A, K):Block(K-1) |
125 |
| - V_12 = view(A, KR, Block(K)) |
126 |
| - b̃_1 = view(b, KR) |
127 |
| - b̃_1 .= (-one(T)).*Mul(V_12, b_2) .+ b̃_1 |
| 101 | +for UNIT in ('U', 'N') |
| 102 | + @eval begin |
| 103 | + @inline function materialize!(M::MatLdivVec{<:TriangularLayout{'U',$UNIT,<:AbstractBlockBandedLayout}, |
| 104 | + <:AbstractStridedLayout}) |
| 105 | + U,dest = M.A,M.B |
| 106 | + T = eltype(dest) |
| 107 | + |
| 108 | + A = triangulardata(U) |
| 109 | + @assert hasmatchingblocks(A) |
| 110 | + |
| 111 | + @boundscheck size(A,1) == size(dest,1) || throw(BoundsError()) |
| 112 | + |
| 113 | + # impose block structure |
| 114 | + b = PseudoBlockArray(dest, BlockSizes((cumulsizes(blocksizes(A),1),))) |
| 115 | + |
| 116 | + Bs = blocksizes(A) |
| 117 | + N = nblocks(Bs,1) |
| 118 | + |
| 119 | + for K = N:-1:1 |
| 120 | + b_2 = view(b, Block(K)) |
| 121 | + Ũ = _triangular_matrix(Val('U'), Val($UNIT), view(A, Block(K,K))) |
| 122 | + apply!(\, Ũ, b_2) |
| 123 | + |
| 124 | + if K ≥ 2 |
| 125 | + KR = blockcolstart(A, K):Block(K-1) |
| 126 | + V_12 = view(A, KR, Block(K)) |
| 127 | + b̃_1 = view(b, KR) |
| 128 | + materialize!(MulAdd(-one(T), V_12, b_2, one(T), b̃_1)) |
| 129 | + end |
| 130 | + end |
| 131 | + |
| 132 | + dest |
128 | 133 | end
|
129 |
| - end |
130 | 134 |
|
131 |
| - dest |
132 |
| -end |
| 135 | + @inline function materialize!(M::MatLdivVec{<:TriangularLayout{'L',$UNIT,<:AbstractBlockBandedLayout}, |
| 136 | + <:AbstractStridedLayout}) |
| 137 | + L,dest = M.A, M.B |
| 138 | + T = eltype(dest) |
| 139 | + A = triangulardata(L) |
| 140 | + @assert hasmatchingblocks(A) |
133 | 141 |
|
134 |
| -@inline function materialize!(M::MatLdivVec{<:TriangularLayout{'L',UNIT,<:AbstractBlockBandedLayout}, |
135 |
| - <:AbstractStridedLayout}) where UNIT |
136 |
| - L,dest = M.A, M.B |
137 |
| - T = eltype(dest) |
138 |
| - A = triangulardata(L) |
139 |
| - @assert hasmatchingblocks(A) |
| 142 | + @boundscheck size(A,1) == size(dest,1) || throw(BoundsError()) |
140 | 143 |
|
141 |
| - @boundscheck size(A,1) == size(dest,1) || throw(BoundsError()) |
| 144 | + # impose block structure |
| 145 | + b = PseudoBlockArray(dest, BlockSizes((cumulsizes(blocksizes(A),1),))) |
142 | 146 |
|
143 |
| - # impose block structure |
144 |
| - b = PseudoBlockArray(dest, BlockSizes((cumulsizes(blocksizes(A),1),))) |
| 147 | + Bs = blocksizes(A) |
| 148 | + N = nblocks(Bs,1) |
145 | 149 |
|
146 |
| - Bs = blocksizes(A) |
147 |
| - N = nblocks(Bs,1) |
| 150 | + for K = 1:N |
| 151 | + b_2 = view(b, Block(K)) |
| 152 | + L̃ = _triangular_matrix(Val('L'), Val($UNIT), view(A, Block(K,K))) |
| 153 | + b_2 .= Ldiv(L̃, b_2) |
148 | 154 |
|
149 |
| - for K = 1:N |
150 |
| - b_2 = view(b, Block(K)) |
151 |
| - L̃ = _triangular_matrix(Val('L'), Val(UNIT), view(A, Block(K,K))) |
152 |
| - b_2 .= Ldiv(L̃, b_2) |
153 |
| - |
154 |
| - if K < N |
155 |
| - KR = Block(K+1):blockcolstop(A, K) |
156 |
| - V_12 = view(A, KR, Block(K)) |
157 |
| - b̃_1 = view(b, KR) |
158 |
| - b̃_1 .= (-one(T)).*Mul(V_12, b_2) .+ b̃_1 |
159 |
| - end |
160 |
| - end |
| 155 | + if K < N |
| 156 | + KR = Block(K+1):blockcolstop(A, K) |
| 157 | + V_12 = view(A, KR, Block(K)) |
| 158 | + b̃_1 = view(b, KR) |
| 159 | + materialize!(MulAdd(-one(T), V_12, b_2, one(T), b̃_1)) |
| 160 | + end |
| 161 | + end |
161 | 162 |
|
162 |
| - dest |
| 163 | + dest |
| 164 | + end |
| 165 | + end |
163 | 166 | end
|
164 | 167 |
|
165 | 168 |
|
|
0 commit comments