!-------------------------------------- LICENCE BEGIN ------------------------------------ !Environment Canada - Atmospheric Science and Technology License/Disclaimer, ! version 3; Last Modified: May 7, 2008. !This is free but copyrighted software; you can use/redistribute/modify it under the terms !of the Environment Canada - Atmospheric Science and Technology License/Disclaimer !version 3 or (at your option) any later version that should be found at: !http://collaboration.cmc.ec.gc.ca/science/rpn.comm/license.html ! !This software is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; !without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. !See the above mentioned License/Disclaimer for more details. !You should have received a copy of the License/Disclaimer along with this software; !if not, you can write to: EC-RPN COMM Group, 2121 TransCanada, suite 500, Dorval (Quebec), !CANADA, H9P 1J3; or send e-mail to service.rpn@ec.gc.ca !-------------------------------------- LICENCE END -------------------------------------- ***s/r hzd_solparite_u_ad - ADJ of hzd_solparite_u * #include "model_macros_f.h"*
subroutine hzd_solparite_u_ad ( 1 $ F_sol, F_Rhs_8, F_evxevec_8 ,F_oddxevec_8, % F_a_8, F_c_8 ,F_deltai_8, % minx1, maxx1, minx2, maxx2, nx1, nx2, nx3, F_pwr, % Minx,Maxx,Miny,Maxy,Gnk,Gni,nil,njl,nkl, % F_opsxp0_8, F_opsyp0_8,F_cdiff,F_npex,F_npey,NSTOR,nev) * implicit none * integer minx1, maxx1, minx2, maxx2, nx1, nx2, nx3 , $ Minx , Maxx , Miny , Maxy , Gnk, Gni, F_pwr, $ njl , nkl , nil , F_npex, F_npey,NSTOR,nev real*8 F_opsxp0_8(*), F_opsyp0_8(*), $ F_a_8(1:F_pwr,1:F_pwr,minx2:maxx2,nx3), $ F_c_8(1:F_pwr,1:F_pwr,minx2:maxx2,nx3), $ F_deltai_8(1:F_pwr,1:F_pwr,minx2:maxx2,nx3), $ F_Rhs_8 real*8 F_evxevec_8(NSTOR*NSTOR),F_oddxevec_8(NSTOR*NSTOR) real F_cdiff, F_sol(Minx:Maxx,Miny:Maxy,Gnk) * *author * M.Tanguay * *revision * v3_02 - Tanguay M. - initial version * v3_11 - Tanguay M. - AIXport+Opti+OpenMP for TLM-ADJ * v3_20 - Tanguay M. - Correction for transpose48 when NPEX.GT.1 * v3_30 - Tanguay M. - adjust OPENMP * *object * *ADJ of *arguments * Name I/O Description *---------------------------------------------------------------- * F_sol I/O r.h.s. and result of horizontal diffusion * F_Rhs_8 I work vector * *---------------------------------------------------------------- * *implicits #include "ptopo.cdk"
* real*8 fdg1_8 ( Miny:Maxy ,minx1:maxx1,Gni+F_npex), $ fdg2_8 (minx1:maxx1,minx2:maxx2,nx3+F_npey), $ dn3_8 (minx1:maxx1,minx2:maxx2,F_pwr,nx3 ), $ sol_8 (minx1:maxx1,minx2:maxx2,F_pwr,nx3 ), $ fwft_8 ( Miny:Maxy ,minx1:maxx1,Gni) real*8 fdg12_8( Miny:Maxy ,minx1:maxx1,Gni) * real*8 ZERO_8, fact_8 parameter( ZERO_8 = 0.0 ) integer m,o1,o2,i,j,k,nevi,gnii,kkii,ki0,kin,kilon,pi0,pin * * __________________________________________________________________ * kilon = (maxx2-minx2 +1+Ptopo_npeOpenMP)/Ptopo_npeOpenMP * * Zero adjoint variables * ---------------------- * !$omp parallel * !$omp do do k= 1,Gni+F_npex do j= minx1,maxx1 do i= Miny ,Maxy fdg1_8(i,j,k) = ZERO_8 end do end do end do !$omp enddo * !$omp do do k= 1,Gni do j= minx1,maxx1 do i= Miny ,Maxy fwft_8(i,j,k) = ZERO_8 end do end do end do !$omp enddo * !$omp do do k= 1,nx3+F_npey do j= minx2,maxx2 do i= minx1,maxx1 fdg2_8(i,j,k) = ZERO_8 end do end do end do !$omp enddo * !$omp do do m= 1,nx3 do k= 1,F_pwr do j= minx2,maxx2 do i= minx1,maxx1 dn3_8(i,j,k,m) = ZERO_8 sol_8(i,j,k,m) = ZERO_8 end do end do end do end do !$omp enddo * !$omp do do k= 1,Gni do j= minx1,maxx1 do i= Miny ,Maxy fdg12_8(i,j,k) = ZERO_8 end do end do end do !$omp enddo * * ADJ of * combine even and odd parts * !$omp end parallel * call rpn_comm_transpose48(F_sol, Minx, Maxx, Gni,1, (Maxy-Miny+1), % (Maxy-Miny+1), Minx1, Maxx1, gnk, fdg1_8, % 1,1.0d0,0.d0 ) * !$omp parallel private(kkii,pi0,pin,ki0,kin,gnii,nevi) !$omp$ shared (kilon,nev,nstor) * * if( Gni.ne.(2*(Gni/2)) ) then !$omp do do k= Nkl,1,-1 do j= njl,1,-1 fdg12_8(j,k,nev) = fdg1_8(j,k,nev) + fdg12_8(j,k,nev) fdg1_8 (j,k,nev) = ZERO_8 enddo enddo !$omp end do else gnii=Gni+1-nev nevi=nev+nev !$omp do do k= Nkl,1,-1 do j= njl,1,-1 fdg12_8(j,k,nev) = fdg1_8(j,k,gnii) + fdg12_8(j,k,nev) fdg12_8(j,k,nevi) = -fdg1_8(j,k,gnii) + fdg12_8(j,k,nevi) fdg1_8 (j,k,gnii) = ZERO_8 * fdg12_8(j,k,nev) = fdg1_8(j,k,nev) + fdg12_8(j,k,nev) fdg12_8(j,k,nevi) = fdg1_8(j,k,nev) + fdg12_8(j,k,nevi) fdg1_8 (j,k,nev) = ZERO_8 enddo enddo !$omp end do endif * !$omp do do k= Nkl,1,-1 do i= nev-1,1,-1 gnii=Gni+1-i nevi=nev+i do j= njl,1,-1 fdg12_8(j,k,i) = fdg1_8(j,k,gnii) + fdg12_8(j,k,i) fdg12_8(j,k,nevi) = -fdg1_8(j,k,gnii) + fdg12_8(j,k,nevi) fdg1_8 (j,k,gnii) = ZERO_8 * fdg12_8(j,k,i) = fdg1_8(j,k,i) + fdg12_8(j,k,i) fdg12_8(j,k,nevi) = fdg1_8(j,k,i) + fdg12_8(j,k,nevi) fdg1_8 (j,k,i) = ZERO_8 enddo enddo enddo !$omp end do * * ADJ of * resolution du systeme blok-tridiagonal * * ADJ of * retour * * ADJ of * inverse projection ( r = x * w ) * c call mxma8( F_oddxevec_8, NSTOR,1, c % fdg12_8(1,1,nev+1),(Maxy-Miny+1) * (maxx1-minx1+1), 1, c % fwft_8 (1,1,nev+1),(Maxy-Miny+1) * (maxx1-minx1+1), 1, c % Gni-nev, Gni-nev, (Maxy-Miny+1) * Nkl ) * !$omp do do k=1,Nkl call dgemm('N','N', (Maxy-Miny+1), Gni-nev, Gni-nev, . 1._8, fdg12_8(1,k,nev+1), . (Maxy-Miny+1)* (Maxx1-Minx1+1),F_oddxevec_8, NSTOR, . 0._8, fwft_8(1,k,nev+1), . (Maxy-Miny+1)* (Maxx1-Minx1+1)) enddo !$omp enddo * c call mxma8( F_evxevec_8, NSTOR,1, c % fdg12_8(1,1,1), (Maxy-Miny+1) * (maxx1-minx1+1), 1, c % fwft_8 (1,1,1), (Maxy-Miny+1) * (maxx1-minx1+1), 1, c % nev, nev, (Maxy-Miny+1) * Nkl ) * !$omp do do k=1,Nkl call dgemm('N','N', (Maxy-Miny+1), nev, nev, . 1._8, fdg12_8(1,k,1), . (Maxy-Miny+1)* (Maxx1-Minx1+1),F_evxevec_8, NSTOR, . 0._8, fwft_8(1,k,1), . (Maxy-Miny+1)* (Maxx1-Minx1+1)) enddo !$omp enddo * !$omp do do i = 1, gni do k = minx1, maxx1 do j = njl+1, maxy fwft_8(j,k,i)= ZERO_8 enddo enddo * do k = minx1, maxx1 do j = miny , 0 fwft_8(j,k,i)= ZERO_8 enddo enddo * enddo !$omp enddo * !$omp single call rpn_comm_transpose(fwft_8,Miny,Maxy,nx3,(maxx1-minx1+1), % minx2, maxx2,Gni,fdg2_8,2,2) !$omp end single * !$omp do do j = 1, nx3 do i = 1, nx2 do k = 1, nx1 sol_8 (k,i,F_pwr,j) = fdg2_8(k,i,j) + sol_8(k,i,F_pwr,j) fdg2_8(k,i,j) = ZERO_8 enddo enddo enddo !$omp enddo * * !$omp do do kkii = Ptopo_npeOpenMP,1,-1 ki0 = minx2 + kilon*(kkii-1) kin = min(ki0+kilon-1, maxx2) pi0 = 1 + kilon*(kkii-1) pin = min(pi0+kilon-1,nx2) * do j = 1,nx3-1 do o1= F_pwr,1,-1 do i = pin,pi0,-1 do k = nx1,1,-1 dn3_8(k,i,o1,j)= sol_8(k,i,o1,j) + dn3_8(k,i,o1,j) sol_8(k,i,o1,j)= -sol_8(k,i,o1,j) enddo enddo enddo * do o1= F_pwr,1,-1 do o2= F_pwr,1,-1 do i = kin,ki0,-1 do k = maxx1,minx1,-1 sol_8(k,i,o2,j+1)=F_c_8(o1,o2,i,j)*sol_8(k,i,o1,j) + sol_8(k,i,o2,j+1) enddo enddo enddo enddo enddo * enddo !$omp enddo * !$omp do do j = 1, nx3 if(j.eq.nx3) then do o1= 1, F_pwr do i = 1, nx2 do k = 1, nx1 dn3_8(k,i,o1,j) = sol_8(k,i,o1,j) + dn3_8(k,i,o1,j) sol_8(k,i,o1,j) = ZERO_8 enddo enddo enddo else do o1= 1, F_pwr do i = 1, nx2 do k = 1, nx1 sol_8(k,i,o1,j)= 0.0 enddo enddo enddo endif enddo !$omp enddo * * ADJ of * scale le cote droit pour retour * !$omp do do j= nx3,1,-1 * do o1= F_pwr,1,-1 do o2= F_pwr,1,-1 do i = maxx2,minx2,-1 do k = maxx1,minx1,-1 sol_8(k,i,o2,j)= F_deltai_8(o1,o2,i,j)*dn3_8(k,i,o1,j) + sol_8(k,i,o2,j) enddo enddo enddo enddo * do o1= F_pwr,1,-1 do i= maxx2,minx2,-1 do k= maxx1,minx1,-1 C dn3_8(k,i,o1,j)= 0.0 dn3_8(k,i,o1,j)= ZERO_8 enddo enddo enddo enddo !$omp end do * * ADJ of * aller * * !$omp do do kkii = Ptopo_npeOpenMP,1,-1 ki0 = minx2+ kilon*(kkii-1) kin = min(ki0+kilon-1,maxx2) pi0 = 1 + kilon*(kkii-1) pin = min(pi0+kilon-1,nx2) * do j = nx3,2,-1 do o1= F_pwr,1,-1 do i = pin,pi0,-1 do k = nx1,1,-1 dn3_8(k,i,o1,j)= sol_8(k,i,o1,j) + dn3_8(k,i,o1,j) sol_8(k,i,o1,j)= -sol_8(k,i,o1,j) enddo enddo enddo * do o1= F_pwr,1,-1 do o2= F_pwr,1,-1 do i = kin,ki0,-1 do k = nx1,1,-1 sol_8(k,i,o2,j-1) = F_a_8(o1,o2,i,j)*sol_8(k,i,o1,j) % + sol_8(k,i,o2,j-1) enddo enddo enddo enddo enddo * enddo !$omp end do * !$omp do do i = 1, nx2 do o1= 1, F_pwr do k = 1, nx1 dn3_8(k,i,o1,1)= sol_8(k,i,o1,1) + dn3_8(k,i,o1,1) sol_8(k,i,o1,1)= ZERO_8 enddo enddo enddo !$omp end do * * ADJ of * cote droit * !$omp do do j = nx3,1,-1 do i = nx2,1,-1 do k = nx1,1,-1 fdg2_8(k,i,j) = F_opsyp0_8(nx3+j)*dn3_8(k,i,1,j) + fdg2_8(k,i,j) dn3_8 (k,i,1,j) = ZERO_8 enddo enddo enddo !$omp enddo * !$omp do do j = nx3,1,-1 do o1 = F_pwr,1,-1 do i = maxx2,minx2,-1 do k = maxx1,minx1,-1 sol_8(k,i,o1,j)= ZERO_8 dn3_8(k,i,o1,j)= ZERO_8 enddo enddo enddo enddo !$omp enddo * * projection ( wfft = x transposed * g ) * !$omp single call rpn_comm_transpose(fwft_8,Miny,Maxy,nx3,(Maxx1-Minx1+1), % minx2, maxx2,Gni,fdg2_8,-2,2) !$omp end single * c call mxma8( F_oddxevec_8, 1,NSTOR, c % fwft_8 (1,1,nev+1),(Maxy-Miny+1) * (maxx1-minx1+1), 1, c % fdg12_8(1,1,nev+1),(Maxy-Miny+1) * (maxx1-minx1+1), 1, c % Gni-nev, Gni-nev, (Maxy-Miny+1) * Nkl ) * !$omp do do k=1,Nkl call dgemm('N','T', (Maxy-Miny+1),Gni-nev,Gni-nev, . 1._8, fwft_8(1,k,nev+1), . (Maxy-Miny+1) * (Maxx1-Minx1+1),F_oddxevec_8, NSTOR, . 0._8, fdg12_8(1,k,nev+1), . (Maxy-Miny+1) * (Maxx1-Minx1+1)) enddo !$omp end do * c call mxma8( F_evxevec_8, 1,NSTOR, c % fwft_8 (1,1,1), (Maxy-Miny+1) * (maxx1-minx1+1), 1, c % fdg12_8(1,1,1), (Maxy-Miny+1) * (maxx1-minx1+1), 1, c % nev, nev, (Maxy-Miny+1) * Nkl ) * !$omp do do k=1,Nkl call dgemm('N','T', (Maxy-Miny+1), nev, nev, . 1._8, fwft_8(1,k,1), . (Maxy-Miny+1) * (Maxx1-Minx1+1),F_evxevec_8, NSTOR, . 0._8, fdg12_8(1,k,1), . (Maxy-Miny+1) * (Maxx1-Minx1+1)) enddo !$omp end do * * ADJ of * odd part of rhs * !$omp do do k=Nkl,1,-1 do i=Gni-nev,1,-1 do j=njl,1,-1 fdg1_8 (j,k,i) = fdg12_8(j,k,i+nev) + fdg1_8(j,k,i) fdg1_8 (j,k,Gni+1-i) =-fdg12_8(j,k,i+nev) + fdg1_8(j,k,Gni+1-i) fdg12_8(j,k,i+nev) = ZERO_8 enddo enddo enddo !$omp enddo * * ADJ of * even part of rhs * if (Gni.ne.(2*(Gni/2)) ) then !$omp do do k=Nkl,1,-1 do j=njl,1,-1 fdg1_8 (j,k,nev) = fdg12_8(j,k,nev) + fdg1_8(j,k,nev) fdg12_8(j,k,nev) = ZERO_8 enddo enddo !$omp enddo endif * !$omp do do k=Nkl,1,-1 do i=nev,1,-1 do j=njl,1,-1 fdg1_8 (j,k,i) = fdg12_8(j,k,i) + fdg1_8(j,k,i) fdg1_8 (j,k,Gni+1-i) = fdg12_8(j,k,i) + fdg1_8(j,k,Gni+1-i) fdg12_8(j,k,i) = ZERO_8 enddo enddo enddo !$omp enddo * * ADJ of * Resolution * !$omp do do i = 1, Gni do k = minx1, maxx1 do j = Miny , Maxy fwft_8(j,k,i)=ZERO_8 enddo do j = njl+1, Maxy fdg1_8 (j,k,i)= ZERO_8 fdg12_8(j,k,i)= ZERO_8 enddo do j = Miny , 0 fdg1_8 (j,k,i)= ZERO_8 fdg12_8(j,k,i)= ZERO_8 enddo enddo enddo !$omp enddo * !$omp do do k = 1, nkl do i = 1, Gni do j = 1, njl fdg1_8(j,k,i) = F_opsxp0_8(Gni+i)*fdg1_8(j,k,i) enddo enddo enddo !$omp enddo * !$omp end parallel * fact_8 = ((-1)**F_pwr)*dble(F_cdiff) call rpn_comm_transpose48 ( F_sol, Minx, Maxx, Gni,1,(Maxy-Miny+1), % (Maxy-Miny+1),Minx1, Maxx1, gnk, fdg1_8, C % -1,fact_8,0.d0 ) % -1,1.d0,0.d0 ) * !$omp parallel do do k = 1, Gnk do j = 1, njl do i = 1, nil F_sol(i,j,k) = fact_8*F_sol(i,j,k) enddo enddo enddo !$omp end parallel do * __________________________________________________________________ * return end