Context Navigation

← Previous Revision
Latest Revision
Next Revision →
Normal
Revision Log

radiation_matrix.F90 @ 5325

Last change on this file since 5325 was 4773, checked in by idelkadi, 19 months ago

Update of Ecrad in LMDZ The same organization of the Ecrad offline version is retained in order to facilitate the updating of Ecrad in LMDZ and the comparison between online and offline results. version 1.6.1 of Ecrad (https://github.com/lguez/ecrad.git)

Implementation of the double call of Ecrad in LMDZ

File size: 33.4 KB

Rev	Line
[4773]	1	! radiation_matrix.F90 - SPARTACUS matrix operations
	2	!
	3	! (C) Copyright 2014- ECMWF.
	4	!
	5	! This software is licensed under the terms of the Apache Licence Version 2.0
	6	! which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
	7	!
	8	! In applying this licence, ECMWF does not waive the privileges and immunities
	9	! granted to it by virtue of its status as an intergovernmental organisation
	10	! nor does it submit to any jurisdiction.
	11	!
	12	! Author: Robin Hogan
	13	! Email: r.j.hogan@ecmwf.int
	14	!
	15	! Modifications
	16	! 2018-10-15 R. Hogan Added fast_expm_exchange_[23]
	17	!
	18	! This module provides the neccessary mathematical functions for the
	19	! SPARTACUS radiation scheme: matrix multiplication, matrix solvers
	20	! and matrix exponentiation, but (a) multiple matrices are operated on
	21	! at once with array access indended to facilitate vectorization, and
	22	! (b) optimization for 2x2 and 3x3 matrices. There is probably
	23	! considerable scope for further optimization. Note that this module
	24	! is not used by the McICA solver.
	25
	26	module radiation_matrix
	27
	28	use parkind1, only : jprb
	29
	30	implicit none
	31	public
	32
	33	! Codes to describe sparseness pattern, where the SHORTWAVE
	34	! pattern is of the form:
	35	! (x x x)
	36	! (x x x)
	37	! (0 0 x)
	38	! where each element may itself be a square matrix.
	39	integer, parameter :: IMatrixPatternDense = 0
	40	integer, parameter :: IMatrixPatternShortwave = 1
	41
	42	public :: mat_x_vec, singlemat_x_vec, mat_x_mat, &
	43	& singlemat_x_mat, mat_x_singlemat, &
	44	& identity_minus_mat_x_mat, solve_vec, solve_mat, expm, &
	45	& fast_expm_exchange_2, fast_expm_exchange_3, &
	46	& sparse_x_dense
	47
	48	private :: solve_vec_2, solve_vec_3, solve_mat_2, &
	49	& solve_mat_3, lu_factorization, lu_substitution, solve_mat_n, &
	50	& diag_mat_right_divide_3
	51
	52	interface fast_expm_exchange
	53	module procedure fast_expm_exchange_2, fast_expm_exchange_3
	54	end interface fast_expm_exchange
	55
	56	contains
	57
	58	! --- MATRIX-VECTOR MULTIPLICATION ---
	59
	60	!---------------------------------------------------------------------
	61	! Treat A as n m-by-m square matrices (with the n dimension varying
	62	! fastest) and b as n m-element vectors, and perform matrix-vector
	63	! multiplications on first iend pairs
	64	function mat_x_vec(n,iend,m,A,b,do_top_left_only_in)
	65
	66	use yomhook, only : lhook, dr_hook, jphook
	67
	68	integer, intent(in) :: n, m, iend
	69	real(jprb), intent(in), dimension(:,:,:) :: A
	70	real(jprb), intent(in), dimension(:,:) :: b
	71	logical, intent(in), optional :: do_top_left_only_in
	72	real(jprb), dimension(iend,m):: mat_x_vec
	73
	74	integer :: j1, j2
	75	logical :: do_top_left_only
	76
	77	real(jphook) :: hook_handle
	78
	79	if (lhook) call dr_hook('radiation_matrix:mat_x_vec',0,hook_handle)
	80
	81	if (present(do_top_left_only_in)) then
	82	do_top_left_only = do_top_left_only_in
	83	else
	84	do_top_left_only = .false.
	85	end if
	86
	87	! Array-wise assignment
	88	mat_x_vec = 0.0_jprb
	89
	90	if (do_top_left_only) then
	91	mat_x_vec(1:iend,1) = A(1:iend,1,1)*b(1:iend,1)
	92	else
	93	do j1 = 1,m
	94	do j2 = 1,m
	95	mat_x_vec(1:iend,j1) = mat_x_vec(1:iend,j1) &
	96	& + A(1:iend,j1,j2)*b(1:iend,j2)
	97	end do
	98	end do
	99	end if
	100
	101	if (lhook) call dr_hook('radiation_matrix:mat_x_vec',1,hook_handle)
	102
	103	end function mat_x_vec
	104
	105
	106	!---------------------------------------------------------------------
	107	! Treat A as an m-by-m square matrix and b as n m-element vectors
	108	! (with the n dimension varying fastest), and perform matrix-vector
	109	! multiplications on first iend pairs
	110	function singlemat_x_vec(n,iend,m,A,b)
	111
	112	! use yomhook, only : lhook, dr_hook, jphook
	113
	114	integer, intent(in) :: n, m, iend
	115	real(jprb), intent(in), dimension(m,m) :: A
	116	real(jprb), intent(in), dimension(:,:) :: b
	117	real(jprb), dimension(iend,m) :: singlemat_x_vec
	118
	119	integer :: j1, j2
	120	! real(jphook) :: hook_handle
	121
	122	! if (lhook) call dr_hook('radiation_matrix:single_mat_x_vec',0,hook_handle)
	123
	124	! Array-wise assignment
	125	singlemat_x_vec = 0.0_jprb
	126
	127	do j1 = 1,m
	128	do j2 = 1,m
	129	singlemat_x_vec(1:iend,j1) = singlemat_x_vec(1:iend,j1) &
	130	& + A(j1,j2)*b(1:iend,j2)
	131	end do
	132	end do
	133
	134	! if (lhook) call dr_hook('radiation_matrix:single_mat_x_vec',1,hook_handle)
	135
	136	end function singlemat_x_vec
	137
	138
	139	! --- SQUARE MATRIX-MATRIX MULTIPLICATION ---
	140
	141	!---------------------------------------------------------------------
	142	! Treat A and B each as n m-by-m square matrices (with the n
	143	! dimension varying fastest) and perform matrix multiplications on
	144	! all n matrix pairs
	145	function mat_x_mat(n,iend,m,A,B,i_matrix_pattern)
	146
	147	use yomhook, only : lhook, dr_hook, jphook
	148
	149	integer, intent(in) :: n, m, iend
	150	integer, intent(in), optional :: i_matrix_pattern
	151	real(jprb), intent(in), dimension(:,:,:) :: A, B
	152
	153	real(jprb), dimension(iend,m,m) :: mat_x_mat
	154	integer :: j1, j2, j3
	155	integer :: mblock, m2block
	156	integer :: i_actual_matrix_pattern
	157	real(jphook) :: hook_handle
	158
	159	if (lhook) call dr_hook('radiation_matrix:mat_x_mat',0,hook_handle)
	160
	161	if (present(i_matrix_pattern)) then
	162	i_actual_matrix_pattern = i_matrix_pattern
	163	else
	164	i_actual_matrix_pattern = IMatrixPatternDense
	165	end if
	166
	167	! Array-wise assignment
	168	mat_x_mat = 0.0_jprb
	169
	170	if (i_actual_matrix_pattern == IMatrixPatternShortwave) then
	171	! Matrix has a sparsity pattern
	172	! (C D E)
	173	! A = (F G H)
	174	! (0 0 I)
	175	mblock = m/3
	176	m2block = 2*mblock
	177	! Do the top-left (C, D, F, G)
	178	do j2 = 1,m2block
	179	do j1 = 1,m2block
	180	do j3 = 1,m2block
	181	mat_x_mat(1:iend,j1,j2) = mat_x_mat(1:iend,j1,j2) &
	182	& + A(1:iend,j1,j3)*B(1:iend,j3,j2)
	183	end do
	184	end do
	185	end do
	186	do j2 = m2block+1,m
	187	! Do the top-right (E & H)
	188	do j1 = 1,m2block
	189	do j3 = 1,m
	190	mat_x_mat(1:iend,j1,j2) = mat_x_mat(1:iend,j1,j2) &
	191	& + A(1:iend,j1,j3)*B(1:iend,j3,j2)
	192	end do
	193	end do
	194	! Do the bottom-right (I)
	195	do j1 = m2block+1,m
	196	do j3 = m2block+1,m
	197	mat_x_mat(1:iend,j1,j2) = mat_x_mat(1:iend,j1,j2) &
	198	& + A(1:iend,j1,j3)*B(1:iend,j3,j2)
	199	end do
	200	end do
	201	end do
	202	else
	203	! Ordinary dense matrix
	204	do j2 = 1,m
	205	do j1 = 1,m
	206	do j3 = 1,m
	207	mat_x_mat(1:iend,j1,j2) = mat_x_mat(1:iend,j1,j2) &
	208	& + A(1:iend,j1,j3)*B(1:iend,j3,j2)
	209	end do
	210	end do
	211	end do
	212	end if
	213
	214	if (lhook) call dr_hook('radiation_matrix:mat_x_mat',1,hook_handle)
	215
	216	end function mat_x_mat
	217
	218
	219	!---------------------------------------------------------------------
	220	! Treat A as an m-by-m matrix and B as n m-by-m square matrices
	221	! (with the n dimension varying fastest) and perform matrix
	222	! multiplications on the first iend matrix pairs
	223	function singlemat_x_mat(n,iend,m,A,B)
	224
	225	use yomhook, only : lhook, dr_hook, jphook
	226
	227	integer, intent(in) :: n, m, iend
	228	real(jprb), intent(in), dimension(m,m) :: A
	229	real(jprb), intent(in), dimension(:,:,:) :: B
	230	real(jprb), dimension(iend,m,m) :: singlemat_x_mat
	231
	232	integer :: j1, j2, j3
	233	real(jphook) :: hook_handle
	234
	235	if (lhook) call dr_hook('radiation_matrix:singlemat_x_mat',0,hook_handle)
	236
	237	! Array-wise assignment
	238	singlemat_x_mat = 0.0_jprb
	239
	240	do j2 = 1,m
	241	do j1 = 1,m
	242	do j3 = 1,m
	243	singlemat_x_mat(1:iend,j1,j2) = singlemat_x_mat(1:iend,j1,j2) &
	244	& + A(j1,j3)*B(1:iend,j3,j2)
	245	end do
	246	end do
	247	end do
	248
	249	if (lhook) call dr_hook('radiation_matrix:singlemat_x_mat',1,hook_handle)
	250
	251	end function singlemat_x_mat
	252
	253
	254	!---------------------------------------------------------------------
	255	! Treat B as an m-by-m matrix and A as n m-by-m square matrices
	256	! (with the n dimension varying fastest) and perform matrix
	257	! multiplications on the first iend matrix pairs
	258	function mat_x_singlemat(n,iend,m,A,B)
	259
	260	use yomhook, only : lhook, dr_hook, jphook
	261
	262	integer, intent(in) :: n, m, iend
	263	real(jprb), intent(in), dimension(:,:,:) :: A
	264	real(jprb), intent(in), dimension(m,m) :: B
	265
	266	real(jprb), dimension(iend,m,m) :: mat_x_singlemat
	267	integer :: j1, j2, j3
	268	real(jphook) :: hook_handle
	269
	270	if (lhook) call dr_hook('radiation_matrix:mat_x_singlemat',0,hook_handle)
	271
	272	! Array-wise assignment
	273	mat_x_singlemat = 0.0_jprb
	274
	275	do j2 = 1,m
	276	do j1 = 1,m
	277	do j3 = 1,m
	278	mat_x_singlemat(1:iend,j1,j2) = mat_x_singlemat(1:iend,j1,j2) &
	279	& + A(1:iend,j1,j3)*B(j3,j2)
	280	end do
	281	end do
	282	end do
	283
	284	if (lhook) call dr_hook('radiation_matrix:mat_x_singlemat',1,hook_handle)
	285
	286	end function mat_x_singlemat
	287
	288
	289	!---------------------------------------------------------------------
	290	! Compute I-A*B where I is the identity matrix and A & B are n
	291	! m-by-m square matrices
	292	function identity_minus_mat_x_mat(n,iend,m,A,B,i_matrix_pattern)
	293
	294	use yomhook, only : lhook, dr_hook, jphook
	295
	296	integer, intent(in) :: n, m, iend
	297	integer, intent(in), optional :: i_matrix_pattern
	298	real(jprb), intent(in), dimension(:,:,:) :: A, B
	299	real(jprb), dimension(iend,m,m) :: identity_minus_mat_x_mat
	300
	301	integer :: j
	302	real(jphook) :: hook_handle
	303
	304	if (lhook) call dr_hook('radiation_matrix:identity_mat_x_mat',0,hook_handle)
	305
	306	if (present(i_matrix_pattern)) then
	307	identity_minus_mat_x_mat = mat_x_mat(n,iend,m,A,B,i_matrix_pattern)
	308	else
	309	identity_minus_mat_x_mat = mat_x_mat(n,iend,m,A,B)
	310	end if
	311
	312	identity_minus_mat_x_mat = - identity_minus_mat_x_mat
	313	do j = 1,m
	314	identity_minus_mat_x_mat(1:iend,j,j) &
	315	& = 1.0_jprb + identity_minus_mat_x_mat(1:iend,j,j)
	316	end do
	317
	318	if (lhook) call dr_hook('radiation_matrix:identity_mat_x_mat',1,hook_handle)
	319
	320	end function identity_minus_mat_x_mat
	321
	322
	323
	324	!---------------------------------------------------------------------
	325	! Replacement for matmul in the case that the first matrix is sparse
	326	function sparse_x_dense(sparse, dense)
	327
	328	real(jprb), intent(in) :: sparse(:,:), dense(:,:)
	329	real(jprb) :: sparse_x_dense(size(sparse,1),size(dense,2))
	330
	331	integer :: j1, j2, j3 ! Loop indices
	332	integer :: n1, n2, n3 ! Array sizes
	333
	334	n1 = size(sparse,1)
	335	n2 = size(sparse,2)
	336	n3 = size(dense,2)
	337
	338	sparse_x_dense = 0.0_jprb
	339	do j2 = 1,n2
	340	do j1 = 1,n1
	341	if (sparse(j1,j2) /= 0.0_jprb) then
	342	sparse_x_dense(j1,:) = sparse_x_dense(j1,:) + sparse(j1,j2)*dense(j2,:)
	343	end if
	344	end do
	345	end do
	346
	347	end function sparse_x_dense
	348
	349
	350	! --- REPEATEDLY SQUARE A MATRIX ---
	351
	352	!---------------------------------------------------------------------
	353	! Square m-by-m matrix "A" nrepeat times. A will be corrupted by
	354	! this function.
	355	function repeated_square(m,A,nrepeat,i_matrix_pattern)
	356	integer, intent(in) :: m, nrepeat
	357	real(jprb), intent(inout) :: A(m,m)
	358	integer, intent(in), optional :: i_matrix_pattern
	359	real(jprb) :: repeated_square(m,m)
	360
	361	integer :: j1, j2, j3, j4
	362	integer :: mblock, m2block
	363	integer :: i_actual_matrix_pattern
	364
	365	if (present(i_matrix_pattern)) then
	366	i_actual_matrix_pattern = i_matrix_pattern
	367	else
	368	i_actual_matrix_pattern = IMatrixPatternDense
	369	end if
	370
	371	if (i_actual_matrix_pattern == IMatrixPatternShortwave) then
	372	! Matrix has a sparsity pattern
	373	! (C D E)
	374	! A = (F G H)
	375	! (0 0 I)
	376	mblock = m/3
	377	m2block = 2*mblock
	378	do j4 = 1,nrepeat
	379	repeated_square = 0.0_jprb
	380	! Do the top-left (C, D, F & G)
	381	do j2 = 1,m2block
	382	do j1 = 1,m2block
	383	do j3 = 1,m2block
	384	repeated_square(j1,j2) = repeated_square(j1,j2) &
	385	& + A(j1,j3)*A(j3,j2)
	386	end do
	387	end do
	388	end do
	389	do j2 = m2block+1, m
	390	! Do the top-right (E & H)
	391	do j1 = 1,m2block
	392	do j3 = 1,m
	393	repeated_square(j1,j2) = repeated_square(j1,j2) &
	394	& + A(j1,j3)*A(j3,j2)
	395	end do
	396	end do
	397	! Do the bottom-right (I)
	398	do j1 = m2block+1, m
	399	do j3 = m2block+1,m
	400	repeated_square(j1,j2) = repeated_square(j1,j2) &
	401	& + A(j1,j3)*A(j3,j2)
	402	end do
	403	end do
	404	end do
	405	if (j4 < nrepeat) then
	406	A = repeated_square
	407	end if
	408	end do
	409	else
	410	! Ordinary dense matrix
	411	do j4 = 1,nrepeat
	412	repeated_square = 0.0_jprb
	413	do j2 = 1,m
	414	do j1 = 1,m
	415	do j3 = 1,m
	416	repeated_square(j1,j2) = repeated_square(j1,j2) &
	417	& + A(j1,j3)*A(j3,j2)
	418	end do
	419	end do
	420	end do
	421	if (j4 < nrepeat) then
	422	A = repeated_square
	423	end if
	424	end do
	425	end if
	426
	427	end function repeated_square
	428
	429
	430	! --- SOLVE LINEAR EQUATIONS ---
	431
	432	!---------------------------------------------------------------------
	433	! Solve Ax=b to obtain x. Version optimized for 2x2 matrices using
	434	! Cramer's method: "A" contains n 2x2 matrices and "b" contains n
	435	! 2-element vectors; returns A^-1 b.
	436	pure subroutine solve_vec_2(n,iend,A,b,x)
	437
	438	integer, intent(in) :: n, iend
	439	real(jprb), intent(in) :: A(:,:,:)
	440	real(jprb), intent(in) :: b(:,:)
	441	real(jprb), intent(out) :: x(:,:)
	442
	443	real(jprb) :: inv_det(iend)
	444
	445	inv_det = 1.0_jprb / ( A(1:iend,1,1)*A(1:iend,2,2) &
	446	& - A(1:iend,1,2)*A(1:iend,2,1))
	447
	448	x(1:iend,1) = inv_det(A(1:iend,2,2)b(1:iend,1)-A(1:iend,1,2)*b(1:iend,2))
	449	x(1:iend,2) = inv_det(A(1:iend,1,1)b(1:iend,2)-A(1:iend,2,1)*b(1:iend,1))
	450
	451	end subroutine solve_vec_2
	452
	453
	454	!---------------------------------------------------------------------
	455	! Solve AX=B to obtain X, i.e. the matrix right-hand-side version of
	456	! solve_vec_2, with A, X and B all containing n 2x2 matrices;
	457	! returns A^-1 B using Cramer's method.
	458	pure subroutine solve_mat_2(n,iend,A,B,X)
	459	integer, intent(in) :: n, iend
	460	real(jprb), intent(in) :: A(:,:,:)
	461	real(jprb), intent(in) :: B(:,:,:)
	462	real(jprb), intent(out) :: X(:,:,:)
	463
	464	real(jprb) :: inv_det(iend)
	465
	466	inv_det = 1.0_jprb / ( A(1:iend,1,1)*A(1:iend,2,2) &
	467	& - A(1:iend,1,2)*A(1:iend,2,1))
	468
	469	X(1:iend,1,1) = inv_det( A(1:iend,2,2)B(1:iend,1,1) &
	470	& -A(1:iend,1,2)*B(1:iend,2,1))
	471	X(1:iend,2,1) = inv_det( A(1:iend,1,1)B(1:iend,2,1) &
	472	& -A(1:iend,2,1)*B(1:iend,1,1))
	473	X(1:iend,1,2) = inv_det( A(1:iend,2,2)B(1:iend,1,2) &
	474	& -A(1:iend,1,2)*B(1:iend,2,2))
	475	X(1:iend,2,2) = inv_det( A(1:iend,1,1)B(1:iend,2,2) &
	476	& -A(1:iend,2,1)*B(1:iend,1,2))
	477
	478	end subroutine solve_mat_2
	479
	480
	481	!---------------------------------------------------------------------
	482	! Solve Ax=b optimized for 3x3 matrices, using LU
	483	! factorization and substitution without pivoting.
	484	pure subroutine solve_vec_3(n,iend,A,b,x)
	485	integer, intent(in) :: n, iend
	486	real(jprb), intent(in) :: A(:,:,:)
	487	real(jprb), intent(in) :: b(:,:)
	488	real(jprb), intent(out) :: x(:,:)
	489
	490	real(jprb), dimension(iend) :: L21, L31, L32
	491	real(jprb), dimension(iend) :: U22, U23, U33
	492	real(jprb), dimension(iend) :: y2, y3
	493
	494	! Some compilers unfortunately don't support assocate
	495	! associate (U11 => A(:,1,1), U12 => A(:,1,2), U13 => A(1,3), &
	496	! y1 => b(:,1), x1 => solve_vec3(:,1), &
	497	! x2 => solve_vec3(:,2), x3 => solve_vec3(:,3))
	498
	499	! LU decomposition:
	500	! ( 1 ) (U11 U12 U13)
	501	! A = (L21 1 ) * ( U22 U23)
	502	! (L31 L32 1) ( U33)
	503	L21 = A(1:iend,2,1) / A(1:iend,1,1)
	504	L31 = A(1:iend,3,1) / A(1:iend,1,1)
	505	U22 = A(1:iend,2,2) - L21*A(1:iend,1,2)
	506	U23 = A(1:iend,2,3) - L21*A(1:iend,1,3)
	507	L32 =(A(1:iend,3,2) - L31*A(1:iend,1,2)) / U22
	508	U33 = A(1:iend,3,3) - L31A(1:iend,1,3) - L32U23
	509
	510	! Solve Ly = b by forward substitution
	511	y2 = b(1:iend,2) - L21*b(1:iend,1)
	512	y3 = b(1:iend,3) - L31b(1:iend,1) - L32y2
	513
	514	! Solve Ux = y by back substitution
	515	x(1:iend,3) = y3/U33
	516	x(1:iend,2) = (y2 - U23*x(1:iend,3)) / U22
	517	x(1:iend,1) = (b(1:iend,1) - A(1:iend,1,2)*x(1:iend,2) &
	518	& - A(1:iend,1,3)*x(1:iend,3)) / A(1:iend,1,1)
	519	! end associate
	520
	521	end subroutine solve_vec_3
	522
	523
	524	!---------------------------------------------------------------------
	525	! Solve AX=B optimized for 3x3 matrices, using LU factorization and
	526	! substitution with no pivoting.
	527	pure subroutine solve_mat_3(n,iend,A,B,X)
	528	integer, intent(in) :: n, iend
	529	real(jprb), intent(in) :: A(:,:,:)
	530	real(jprb), intent(in) :: B(:,:,:)
	531	real(jprb), intent(out) :: X(:,:,:)
	532
	533	real(jprb), dimension(iend) :: L21, L31, L32
	534	real(jprb), dimension(iend) :: U22, U23, U33
	535	real(jprb), dimension(iend) :: y2, y3
	536
	537	integer :: j
	538
	539	! associate (U11 => A(:,1,1), U12 => A(:,1,2), U13 => A(1,3))
	540	! LU decomposition:
	541	! ( 1 ) (U11 U12 U13)
	542	! A = (L21 1 ) * ( U22 U23)
	543	! (L31 L32 1) ( U33)
	544	L21 = A(1:iend,2,1) / A(1:iend,1,1)
	545	L31 = A(1:iend,3,1) / A(1:iend,1,1)
	546	U22 = A(1:iend,2,2) - L21*A(1:iend,1,2)
	547	U23 = A(1:iend,2,3) - L21*A(1:iend,1,3)
	548	L32 =(A(1:iend,3,2) - L31*A(1:iend,1,2)) / U22
	549	U33 = A(1:iend,3,3) - L31A(1:iend,1,3) - L32U23
	550
	551	do j = 1,3
	552	! Solve Ly = B(:,:,j) by forward substitution
	553	! y1 = B(:,1,j)
	554	y2 = B(1:iend,2,j) - L21*B(1:iend,1,j)
	555	y3 = B(1:iend,3,j) - L31B(1:iend,1,j) - L32y2
	556	! Solve UX(:,:,j) = y by back substitution
	557	X(1:iend,3,j) = y3 / U33
	558	X(1:iend,2,j) = (y2 - U23*X(1:iend,3,j)) / U22
	559	X(1:iend,1,j) = (B(1:iend,1,j) - A(1:iend,1,2)*X(1:iend,2,j) &
	560	& - A(1:iend,1,3)*X(1:iend,3,j)) / A(1:iend,1,1)
	561	end do
	562
	563	end subroutine solve_mat_3
	564
	565
	566	!---------------------------------------------------------------------
	567	! Return X = B A^-1 = (A^-T B)^T optimized for 3x3 matrices, where B
	568	! is a diagonal matrix, using LU factorization and substitution with
	569	! no pivoting.
	570	pure subroutine diag_mat_right_divide_3(n,iend,A,B,X)
	571	integer, intent(in) :: n, iend
	572	real(jprb), intent(in) :: A(iend,3,3)
	573	real(jprb), intent(in) :: B(iend,3)
	574	real(jprb), intent(out) :: X(n,3,3)
	575
	576	real(jprb), dimension(iend) :: L21, L31, L32
	577	real(jprb), dimension(iend) :: U22, U23, U33
	578	real(jprb), dimension(iend) :: y2, y3
	579
	580	! associate (U11 => A(:,1,1), U12 => A(:,1,2), U13 => A(1,3))
	581	! LU decomposition of the transpose of A:
	582	! ( 1 ) (U11 U12 U13)
	583	! A^T = (L21 1 ) * ( U22 U23)
	584	! (L31 L32 1) ( U33)
	585	L21 = A(1:iend,1,2) / A(1:iend,1,1)
	586	L31 = A(1:iend,1,3) / A(1:iend,1,1)
	587	U22 = A(1:iend,2,2) - L21*A(1:iend,2,1)
	588	U23 = A(1:iend,3,2) - L21*A(1:iend,3,1)
	589	L32 =(A(1:iend,2,3) - L31*A(1:iend,2,1)) / U22
	590	U33 = A(1:iend,3,3) - L31A(1:iend,3,1) - L32U23
	591
	592	! Solve X(1,:) = A^-T ( B(1) )
	593	! ( 0 )
	594	! ( 0 )
	595	! Solve Ly = B(:,:,j) by forward substitution
	596	! y1 = B(:,1)
	597	y2 = - L21*B(1:iend,1)
	598	y3 = - L31B(1:iend,1) - L32y2
	599	! Solve UX(:,:,j) = y by back substitution
	600	X(1:iend,1,3) = y3 / U33
	601	X(1:iend,1,2) = (y2 - U23*X(1:iend,1,3)) / U22
	602	X(1:iend,1,1) = (B(1:iend,1) - A(1:iend,2,1)*X(1:iend,1,2) &
	603	& - A(1:iend,3,1)*X(1:iend,1,3)) / A(1:iend,1,1)
	604
	605	! Solve X(2,:) = A^-T ( 0 )
	606	! ( B(2) )
	607	! ( 0 )
	608	! Solve Ly = B(:,:,j) by forward substitution
	609	! y1 = 0
	610	! y2 = B(1:iend,2)
	611	y3 = - L32*B(1:iend,2)
	612	! Solve UX(:,:,j) = y by back substitution
	613	X(1:iend,2,3) = y3 / U33
	614	X(1:iend,2,2) = (B(1:iend,2) - U23*X(1:iend,2,3)) / U22
	615	X(1:iend,2,1) = (-A(1:iend,2,1)*X(1:iend,2,2) &
	616	& -A(1:iend,3,1)*X(1:iend,2,3)) / A(1:iend,1,1)
	617
	618	! Solve X(3,:) = A^-T ( 0 )
	619	! ( 0 )
	620	! ( B(3) )
	621	! Solve Ly = B(:,:,j) by forward substitution
	622	! y1 = 0
	623	! y2 = 0
	624	! y3 = B(1:iend,3)
	625	! Solve UX(:,:,j) = y by back substitution
	626	X(1:iend,3,3) = B(1:iend,3) / U33
	627	X(1:iend,3,2) = -U23*X(1:iend,3,3) / U22
	628	X(1:iend,3,1) = (-A(1:iend,2,1)*X(1:iend,3,2) &
	629	& - A(1:iend,3,1)*X(1:iend,3,3)) / A(1:iend,1,1)
	630
	631	end subroutine diag_mat_right_divide_3
	632
	633
	634	!---------------------------------------------------------------------
	635	! Treat A as n m-by-m matrices and return the LU factorization of A
	636	! compressed into a single matrice (with L below the diagonal and U
	637	! on and above the diagonal; the diagonal elements of L are 1). No
	638	! pivoting is performed.
	639	pure subroutine lu_factorization(n, iend, m, A, LU)
	640	integer, intent(in) :: n, m, iend
	641	real(jprb), intent(in) :: A(:,:,:)
	642	real(jprb), intent(out) :: LU(iend,m,m)
	643
	644	real(jprb) :: s(iend)
	645	integer :: j1, j2, j3
	646
	647	! This routine is adapted from an in-place one, so we first copy
	648	! the input into the output.
	649	LU(1:iend,1:m,1:m) = A(1:iend,1:m,1:m)
	650
	651	do j2 = 1, m
	652	do j1 = 1, j2-1
	653	s = LU(1:iend,j1,j2)
	654	do j3 = 1, j1-1
	655	s = s - LU(1:iend,j1,j3) * LU(1:iend,j3,j2)
	656	end do
	657	LU(1:iend,j1,j2) = s
	658	end do
	659	do j1 = j2, m
	660	s = LU(1:iend,j1,j2)
	661	do j3 = 1, j2-1
	662	s = s - LU(1:iend,j1,j3) * LU(1:iend,j3,j2)
	663	end do
	664	LU(1:iend,j1,j2) = s
	665	end do
	666	if (j2 /= m) then
	667	s = 1.0_jprb / LU(1:iend,j2,j2)
	668	do j1 = j2+1, m
	669	LU(1:iend,j1,j2) = LU(1:iend,j1,j2) * s
	670	end do
	671	end if
	672	end do
	673
	674	end subroutine lu_factorization
	675
	676
	677	!---------------------------------------------------------------------
	678	! Treat LU as an LU-factorization of an original matrix A, and
	679	! return x where Ax=b. LU consists of n m-by-m matrices and b as n
	680	! m-element vectors.
	681	pure subroutine lu_substitution(n,iend,m,LU,b,x)
	682	! CHECK: dimensions should be ":"?
	683	integer, intent(in) :: n, m, iend
	684	real(jprb), intent(in) :: LU(iend,m,m)
	685	real(jprb), intent(in) :: b(:,:)
	686	real(jprb), intent(out):: x(iend,m)
	687
	688	integer :: j1, j2
	689
	690	x(1:iend,1:m) = b(1:iend,1:m)
	691
	692	! First solve Ly=b
	693	do j2 = 2, m
	694	do j1 = 1, j2-1
	695	x(1:iend,j2) = x(1:iend,j2) - x(1:iend,j1)*LU(1:iend,j2,j1)
	696	end do
	697	end do
	698	! Now solve Ux=y
	699	do j2 = m, 1, -1
	700	do j1 = j2+1, m
	701	x(1:iend,j2) = x(1:iend,j2) - x(1:iend,j1)*LU(1:iend,j2,j1)
	702	end do
	703	x(1:iend,j2) = x(1:iend,j2) / LU(1:iend,j2,j2)
	704	end do
	705
	706	end subroutine lu_substitution
	707
	708
	709	!---------------------------------------------------------------------
	710	! Return matrix X where AX=B. LU, A, X, B all consist of n m-by-m
	711	! matrices.
	712	pure subroutine solve_mat_n(n,iend,m,A,B,X)
	713	integer, intent(in) :: n, m, iend
	714	real(jprb), intent(in) :: A(:,:,:)
	715	real(jprb), intent(in) :: B(:,:,:)
	716	real(jprb), intent(out):: X(iend,m,m)
	717
	718	real(jprb) :: LU(iend,m,m)
	719
	720	integer :: j
	721
	722	call lu_factorization(n,iend,m,A,LU)
	723
	724	do j = 1, m
	725	call lu_substitution(n,iend,m,LU,B(1:,1:m,j),X(1:iend,1:m,j))
	726	! call lu_substitution(n,iend,m,LU,B(1:n,1:m,j),X(1:iend,1:m,j))
	727	end do
	728
	729	end subroutine solve_mat_n
	730
	731
	732	!---------------------------------------------------------------------
	733	! Solve Ax=b, where A consists of n m-by-m matrices and x and b
	734	! consist of n m-element vectors. For m=2 or m=3, this function
	735	! calls optimized versions, otherwise it uses general LU
	736	! decomposition without pivoting.
	737	function solve_vec(n,iend,m,A,b)
	738
	739	use yomhook, only : lhook, dr_hook, jphook
	740
	741	integer, intent(in) :: n, m, iend
	742	real(jprb), intent(in) :: A(:,:,:)
	743	real(jprb), intent(in) :: b(:,:)
	744
	745	real(jprb) :: solve_vec(iend,m)
	746	real(jprb) :: LU(iend,m,m)
	747	real(jphook) :: hook_handle
	748
	749	if (lhook) call dr_hook('radiation_matrix:solve_vec',0,hook_handle)
	750
	751	if (m == 2) then
	752	call solve_vec_2(n,iend,A,b,solve_vec)
	753	elseif (m == 3) then
	754	call solve_vec_3(n,iend,A,b,solve_vec)
	755	else
	756	call lu_factorization(n,iend,m,A,LU)
	757	call lu_substitution(n,iend,m,LU,b,solve_vec)
	758	end if
	759
	760	if (lhook) call dr_hook('radiation_matrix:solve_vec',1,hook_handle)
	761
	762	end function solve_vec
	763
	764
	765	!---------------------------------------------------------------------
	766	! Solve AX=B, where A, X and B consist of n m-by-m matrices. For m=2
	767	! or m=3, this function calls optimized versions, otherwise it uses
	768	! general LU decomposition without pivoting.
	769	function solve_mat(n,iend,m,A,B)
	770
	771	use yomhook, only : lhook, dr_hook, jphook
	772
	773	integer, intent(in) :: n, m, iend
	774	real(jprb), intent(in) :: A(:,:,:)
	775	real(jprb), intent(in) :: B(:,:,:)
	776
	777	real(jprb) :: solve_mat(iend,m,m)
	778	real(jphook) :: hook_handle
	779
	780	if (lhook) call dr_hook('radiation_matrix:solve_mat',0,hook_handle)
	781
	782	if (m == 2) then
	783	call solve_mat_2(n,iend,A,B,solve_mat)
	784	elseif (m == 3) then
	785	call solve_mat_3(n,iend,A,B,solve_mat)
	786	else
	787	call solve_mat_n(n,iend,m,A,B,solve_mat)
	788	end if
	789
	790	if (lhook) call dr_hook('radiation_matrix:solve_mat',1,hook_handle)
	791
	792	end function solve_mat
	793
	794
	795	! --- MATRIX EXPONENTIATION ---
	796
	797	!---------------------------------------------------------------------
	798	! Perform matrix exponential of n m-by-m matrices stored in A (where
	799	! index n varies fastest) using the Higham scaling and squaring
	800	! method. The result is placed in A. This routine is intended for
	801	! speed so is accurate only to single precision. For simplicity and
	802	! to aid vectorization, the Pade approximant of order 7 is used for
	803	! all input matrices, perhaps leading to a few too many
	804	! multiplications for matrices with a small norm.
	805	subroutine expm(n,iend,m,A,i_matrix_pattern)
	806
	807	use yomhook, only : lhook, dr_hook, jphook
	808
	809	integer, intent(in) :: n, m, iend
	810	real(jprb), intent(inout) :: A(n,m,m)
	811	integer, intent(in) :: i_matrix_pattern
	812
	813	real(jprb), parameter :: theta(3) = (/4.258730016922831e-01_jprb, &
	814	& 1.880152677804762e+00_jprb, &
	815	& 3.925724783138660e+00_jprb/)
	816	real(jprb), parameter :: c(8) = (/17297280.0_jprb, 8648640.0_jprb, &
	817	& 1995840.0_jprb, 277200.0_jprb, 25200.0_jprb, &
	818	& 1512.0_jprb, 56.0_jprb, 1.0_jprb/)
	819
	820	real(jprb), dimension(iend,m,m) :: A2, A4, A6
	821	real(jprb), dimension(iend,m,m) :: U, V
	822
	823	real(jprb) :: normA(iend), sum_column(iend)
	824
	825	integer :: j1, j2, j3
	826	real(jprb) :: frac(iend)
	827	integer :: expo(iend)
	828	real(jprb) :: scaling(iend)
	829
	830	real(jphook) :: hook_handle
	831
	832	if (lhook) call dr_hook('radiation_matrix:expm',0,hook_handle)
	833
	834	normA = 0.0_jprb
	835
	836	! Compute the 1-norms of A
	837	do j3 = 1,m
	838	sum_column(:) = 0.0_jprb
	839	do j2 = 1,m
	840	do j1 = 1,iend
	841	sum_column(j1) = sum_column(j1) + abs(A(j1,j2,j3))
	842	end do
	843	end do
	844	do j1 = 1,iend
	845	if (sum_column(j1) > normA(j1)) then
	846	normA(j1) = sum_column(j1)
	847	end if
	848	end do
	849	end do
	850
	851	frac = fraction(normA/theta(3))
	852	expo = exponent(normA/theta(3))
	853	where (frac == 0.5_jprb)
	854	expo = expo - 1
	855	end where
	856
	857	where (expo < 0)
	858	expo = 0
	859	end where
	860
	861	! Scale the input matrices by a power of 2
	862	scaling = 2.0_jprb**(-expo)
	863	do j3 = 1,m
	864	do j2 = 1,m
	865	A(1:iend,j2,j3) = A(1:iend,j2,j3) * scaling
	866	end do
	867	end do
	868	! Pade approximant of degree 7
	869	A2 = mat_x_mat(n,iend,m,A, A, i_matrix_pattern)
	870	A4 = mat_x_mat(n,iend,m,A2,A2,i_matrix_pattern)
	871	A6 = mat_x_mat(n,iend,m,A2,A4,i_matrix_pattern)
	872
	873	V = c(8)A6 + c(6)A4 + c(4)*A2
	874	do j3 = 1,m
	875	V(:,j3,j3) = V(:,j3,j3) + c(2)
	876	end do
	877	U = mat_x_mat(n,iend,m,A,V,i_matrix_pattern)
	878	V = c(7)A6 + c(5)A4 + c(3)*A2
	879	! Add a multiple of the identity matrix
	880	do j3 = 1,m
	881	V(:,j3,j3) = V(:,j3,j3) + c(1)
	882	end do
	883
	884	V = V-U
	885	U = 2.0_jprb*U
	886	A(1:iend,1:m,1:m) = solve_mat(n,iend,m,V,U)
	887
	888	! Add the identity matrix
	889	do j3 = 1,m
	890	A(1:iend,j3,j3) = A(1:iend,j3,j3) + 1.0_jprb
	891	end do
	892
	893	! Loop through the matrices
	894	do j1 = 1,iend
	895	if (expo(j1) > 0) then
	896	! Square matrix j1 expo(j1) times
	897	A(j1,:,:) = repeated_square(m,A(j1,:,:),expo(j1),i_matrix_pattern)
	898	end if
	899	end do
	900
	901	if (lhook) call dr_hook('radiation_matrix:expm',1,hook_handle)
	902
	903	end subroutine expm
	904
	905
	906	!---------------------------------------------------------------------
	907	! Return the matrix exponential of n 2x2 matrices representing
	908	! conservative exchange between SPARTACUS regions, where the
	909	! matrices have the structure
	910	! (-a b)
	911	! ( a -b)
	912	! and a and b are assumed to be positive or zero. The solution uses
	913	! Putzer's algorithm - see the appendix of Hogan et al. (GMD 2018)
	914	subroutine fast_expm_exchange_2(n,iend,a,b,R)
	915
	916	use yomhook, only : lhook, dr_hook, jphook
	917
	918	integer, intent(in) :: n, iend
	919	real(jprb), dimension(n), intent(in) :: a, b
	920	real(jprb), dimension(n,2,2), intent(out) :: R
	921
	922	real(jprb), dimension(iend) :: factor
	923
	924	real(jphook) :: hook_handle
	925
	926	if (lhook) call dr_hook('radiation_matrix:fast_expm_exchange_2',0,hook_handle)
	927
	928	! Security to ensure that if a==b==0 then the identity matrix is returned
	929	factor = (1.0_jprb - exp(-(a(1:iend)+b(1:iend))))/max(1.0e-12_jprb,a(1:iend)+b(1:iend))
	930
	931	R(1:iend,1,1) = 1.0_jprb - factor*a(1:iend)
	932	R(1:iend,2,1) = factor*a(1:iend)
	933	R(1:iend,1,2) = factor*b(1:iend)
	934	R(1:iend,2,2) = 1.0_jprb - factor*b(1:iend)
	935
	936	if (lhook) call dr_hook('radiation_matrix:fast_expm_exchange_2',1,hook_handle)
	937
	938	end subroutine fast_expm_exchange_2
	939
	940
	941	!---------------------------------------------------------------------
	942	! Return the matrix exponential of n 3x3 matrices representing
	943	! conservative exchange between SPARTACUS regions, where the
	944	! matrices have the structure
	945	! (-a b 0)
	946	! ( a -b-c d)
	947	! ( 0 c -d)
	948	! and a-d are assumed to be positive or zero. The solution uses the
	949	! diagonalization method and is a slight generalization of the
	950	! solution provided in the appendix of Hogan et al. (GMD 2018),
	951	! which assumed c==d.
	952	subroutine fast_expm_exchange_3(n,iend,a,b,c,d,R)
	953
	954	use yomhook, only : lhook, dr_hook, jphook
	955
	956	real(jprb), parameter :: my_epsilon = 1.0e-12_jprb
	957
	958	integer, intent(in) :: n, iend
	959	real(jprb), dimension(n), intent(in) :: a, b, c, d
	960	real(jprb), dimension(n,3,3), intent(out) :: R
	961
	962	! Eigenvectors
	963	real(jprb), dimension(iend,3,3) :: V
	964
	965	! Non-zero Eigenvalues
	966	real(jprb), dimension(iend) :: lambda1, lambda2
	967
	968	! Diagonal matrix of the exponential of the eigenvalues
	969	real(jprb), dimension(iend,3) :: diag
	970
	971	! Result of diag right-divided by V
	972	real(jprb), dimension(iend,3,3) :: diag_rdivide_V
	973
	974	! Intermediate arrays
	975	real(jprb), dimension(iend) :: tmp1, tmp2
	976
	977	integer :: j1, j2
	978
	979	real(jphook) :: hook_handle
	980
	981	if (lhook) call dr_hook('radiation_matrix:fast_expm_exchange_3',0,hook_handle)
	982
	983	! Eigenvalues lambda1 and lambda2
	984	tmp1 = 0.5_jprb * (a(1:iend)+b(1:iend)+c(1:iend)+d(1:iend))
	985	tmp2 = sqrt(max(0.0_jprb, tmp1tmp1 - (a(1:iend)c(1:iend) &
	986	& + a(1:iend)d(1:iend) + b(1:iend)d(1:iend))))
	987	! The eigenvalues must not be the same or the LU decomposition
	988	! fails; this can occur occasionally in single precision, which we
	989	! avoid by limiting the minimum value of tmp2
	990	tmp2 = max(tmp2, epsilon(1.0_jprb) * tmp1)
	991	lambda1 = -tmp1 + tmp2
	992	lambda2 = -tmp1 - tmp2
	993
	994	! Eigenvectors, with securities such that if a--d are all zero
	995	! then V is non-singular and the identity matrix is returned in R;
	996	! note that lambdaX is typically negative so we need a
	997	! sign-preserving security
	998	V(1:iend,1,1) = max(my_epsilon, b(1:iend)) &
	999	& / sign(max(my_epsilon, abs(a(1:iend) + lambda1)), a(1:iend) + lambda1)
	1000	V(1:iend,1,2) = b(1:iend) &
	1001	& / sign(max(my_epsilon, abs(a(1:iend) + lambda2)), a(1:iend) + lambda2)
	1002	V(1:iend,1,3) = b(1:iend) / max(my_epsilon, a(1:iend))
	1003	V(1:iend,2,:) = 1.0_jprb
	1004	V(1:iend,3,1) = c(1:iend) &
	1005	& / sign(max(my_epsilon, abs(d(1:iend) + lambda1)), d(1:iend) + lambda1)
	1006	V(1:iend,3,2) = c(1:iend) &
	1007	& / sign(max(my_epsilon, abs(d(1:iend) + lambda2)), d(1:iend) + lambda2)
	1008	V(1:iend,3,3) = max(my_epsilon, c(1:iend)) / max(my_epsilon, d(1:iend))
	1009
	1010	diag(:,1) = exp(lambda1)
	1011	diag(:,2) = exp(lambda2)
	1012	diag(:,3) = 1.0_jprb
	1013
	1014	! Compute diag_rdivide_V = diag * V^-1
	1015	call diag_mat_right_divide_3(iend,iend,V,diag,diag_rdivide_V)
	1016
	1017	! Compute V * diag_rdivide_V
	1018	do j1 = 1,3
	1019	do j2 = 1,3
	1020	R(1:iend,j2,j1) = V(1:iend,j2,1)*diag_rdivide_V(1:iend,1,j1) &
	1021	& + V(1:iend,j2,2)*diag_rdivide_V(1:iend,2,j1) &
	1022	& + V(1:iend,j2,3)*diag_rdivide_V(1:iend,3,j1)
	1023	end do
	1024	end do
	1025
	1026	if (lhook) call dr_hook('radiation_matrix:fast_expm_exchange_3',1,hook_handle)
	1027
	1028	end subroutine fast_expm_exchange_3
	1029
	1030	! generic :: fast_expm_exchange => fast_expm_exchange_2, fast_expm_exchange_3
	1031
	1032
	1033	end module radiation_matrix

Note: See TracBrowser for help on using the repository browser.

Download in other formats:

Original Format