quantum-espresso/PP/cft.f90

!
! (C) Copyright CERN except where explicitly stated otherwise.
!     Permission to use and/or redistribute this work is granted
!     under the terms of the GNU General Public License, The software
!     and documentation made available under the terms of this license
!     are provided with no warranty.
!
! Slightly modified version of routine D702 of CERN lib
!
!----------------------------------------------------------------------
subroutine cft (a, b, ntot, n, nspan, isn)
  !----------------------------------------------------------------------
  !
  !     multivariate complex fourier transform, computed in place
  !     using mixed-radix fast fourier transform algorithm.
  !     by R. C. Singleton, Stanford Research Institute, oct. 1968
  !     arrays a and b originally hold the real and imaginary
  !     components of the data, and return the real and
  !     imaginary components of the resulting fourier coefficients.
  !     multivariate data is indexed according to the fortran
  !     array element successor function, without limit
  !     on the number of implied multiple subscripts.
  !     the subroutine is called once for each variate.
  !     the calls for a multivariate transform may be in any order.
  !     ntot is the total number of complex data values.
  !     n is the dimension of the current variable.
  !     nspan/n is the spacing of consucutive data values
  !     while indexing the current variable.
  !     the sign of isn determines the sign of the complex
  !     exponential, and the magnitude of isn is normally one.
  !
  !     for a single-variate transform,
  !     ntot = n = nspan = (number of complex data values), f.g.
  !     call cft(a,b,n,n,n,1)
  !
  !     a tri-variate transform with a(n1,n2,n3), b(n1,n2,n3)
  !     is computed by
  !     call cft(a,b,n1*n2*n3,n1,n1,1)
  !     call cft(a,b,n1*n2*n3,n2,n1*n2,1)
  !     call cft(a,b,n1*n2*n3,n3,n1*n2*n3,1)
  !
  !     the data may alternatively be stored in a single complex
  !     array a, then the magnitude of isn changed to two to
  !     give the correct indexing increment and the second parameter
  !     used to pass the initial address for the sequence of
  !     imaginary values, e.g.
  !
  !        real s(2)
  !        equivalence (a,s)
  !        ....
  !        ....
  !        call cft(a,s(2),ntot,n,nspan,2)
  !
  !     arrays at(maxf), ck(maxf), bt(maxf), sk(maxf), and np(maxp)
  !     are used for temporary storage. if the available storage
  !     is insufficient, the program is terminated by a stop.
  !     maxf must be .ge. the maximum prime factor of n.
  !     maxp must be .gt. the number of prime factors of n.
  !     in addition, if the square-free portion k cf n has two or
  !     more prime factors, then maxp must be .ge. k-1.
  !     array storage in nfac for a maximum of 11 factors of n.
  !     if n has more than one square-free factor, the product of the
  !     square-free factors must be .le. 210
  !
  USE kinds
  implicit real(DP)(a - h, o - z)
  dimension a ( * ), b ( * )
  dimension nfac (11), np (209)
  !     array storage for maximum prime factor of 23
  dimension at (23), ck (23), bt (23), sk (23)
  equivalence (i, ii)
  !     the following two constants should agree with the array dimension
  maxf = 23
  maxp = 209
  if (n.lt.2) return
  inc = isn
  !     the following constants are rad = 2.*pi , s72 = sin(0.4*pi) ,
  !     c72 = cos(0.4*pi) and s120 = sqrt(0.75)
  rad = 6.2831853071796d0
  s72 = 0.95105651629515d0
  c72 = 0.30901699437495d0
  s120 = 0.86602540378444d0
  if (isn.ge.0) goto 10
  s72 = - s72
  s120 = - s120
  rad = - rad
  inc = - inc
10 nt = inc * ntot
  ks = inc * nspan
  kspan = ks
  nn = nt - inc
  jc = ks / n
  radf = rad * DBLE (jc) * 0.5d0
  i = 0
  jf = 0
  !     determine the factors of n
  m = 0
  k = n
  goto 20
15 m = m + 1
  nfac (m) = 4
  k = k / 16
20 if (k - (k / 16) * 16.eq.0) goto 15
  j = 3
  jj = 9
  goto 30
25 m = m + 1
  nfac (m) = j
  k = k / jj
30 if (mod (k, jj) .eq.0) goto 25
  j = j + 2
  jj = j**2
  if (jj.le.k) goto 30
  if (k.gt.4) goto 40
  kt = m
  nfac (m + 1) = k
  if (k.ne.1) m = m + 1
  goto 80
40 if (k - (k / 4) * 4.ne.0) goto 50
  m = m + 1
  nfac (m) = 2
  k = k / 4
50 kt = m
  j = 2
60 if (mod (k, j) .ne.0) goto 70
  m = m + 1
  nfac (m) = j
  k = k / j
70 j = ( (j + 1) / 2) * 2 + 1
  if (j.le.k) goto 60
80 if (kt.eq.0) goto 100
  j = kt
90 m = m + 1
  nfac (m) = nfac (j)
  j = j - 1
  if (j.ne.0) goto 90
  !     compute fourier transform
100 sd = radf / DBLE (kspan)
  cd = 2.0d0 * sin (sd) **2
  sd = sin (sd+sd)
  kk = 1
  i = i + 1
  if (nfac (i) .ne.2) goto 400
  !     transform for factor of 2 (including rotation factor)
  kspan = kspan / 2
  k1 = kspan + 2
210 k2 = kk + kspan
  ak = a (k2)
  bk = b (k2)
  a (k2) = a (kk) - ak
  b (k2) = b (kk) - bk
  a (kk) = a (kk) + ak
  b (kk) = b (kk) + bk
  kk = k2 + kspan
  if (kk.le.nn) goto 210
  kk = kk - nn
  if (kk.le.jc) goto 210
  if (kk.gt.kspan) goto 800
220 c1 = 1.0d0 - cd
  s1 = sd
230 k2 = kk + kspan
  ak = a (kk) - a (k2)
  bk = b (kk) - b (k2)
  a (kk) = a (kk) + a (k2)
  b (kk) = b (kk) + b (k2)
  a (k2) = c1 * ak - s1 * bk
  b (k2) = s1 * ak + c1 * bk
  kk = k2 + kspan
  if (kk.lt.nt) goto 230
  k2 = kk - nt
  c1 = - c1
  kk = k1 - k2
  if (kk.gt.k2) goto 230
  ak = c1 - (cd * c1 + sd * s1)
  s1 = (sd * c1 - cd * s1) + s1
  !     the following three statements compensate for truncation
  !     error. if rounded arithmetic is used, they may be deleted.
  c1 = 0.5d0 / (ak**2 + s1**2) + 0.5d0
  s1 = c1 * s1
  c1 = c1 * ak
  !     next statement should be deleted if non-rounded arithmetic is use
  !     c1=ak
  kk = kk + jc
  if (kk.lt.k2) goto 230
  k1 = k1 + inc + inc
  kk = (k1 - kspan) / 2 + jc
  if (kk.le.jc + jc) goto 220
  goto 100
  !     transform for factor of 3 (optional code)
320 k1 = kk + kspan
  k2 = k1 + kspan
  ak = a (kk)
  bk = b (kk)
  aj = a (k1) + a (k2)
  bj = b (k1) + b (k2)
  a (kk) = ak + aj
  b (kk) = bk + bj
  ak = - 0.5d0 * aj + ak
  bk = - 0.5d0 * bj + bk
  aj = (a (k1) - a (k2) ) * s120
  bj = (b (k1) - b (k2) ) * s120
  a (k1) = ak - bj
  b (k1) = bk + aj
  a (k2) = ak + bj
  b (k2) = bk - aj
  kk = k2 + kspan
  if (kk.lt.nn) goto 320
  kk = kk - nn
  if (kk.le.kspan) goto 320
  goto 700
  !     transform for factor of 4
400 if (nfac (i) .ne.4) goto 600
  kspnn = kspan
  kspan = kspan / 4
410 c1 = 1.0d0
  s1 = 0
420 k1 = kk + kspan
  k2 = k1 + kspan
  k3 = k2 + kspan
  akp = a (kk) + a (k2)
  akm = a (kk) - a (k2)
  ajp = a (k1) + a (k3)
  ajm = a (k1) - a (k3)
  a (kk) = akp + ajp
  ajp = akp - ajp
  bkp = b (kk) + b (k2)
  bkm = b (kk) - b (k2)
  bjp = b (k1) + b (k3)
  bjm = b (k1) - b (k3)
  b (kk) = bkp + bjp
  bjp = bkp - bjp
  if (isn.lt.0) goto 450
  akp = akm - bjm
  akm = akm + bjm
  bkp = bkm + ajm
  bkm = bkm - ajm
  if (s1.eq.0.0d0) goto 460
430 a (k1) = akp * c1 - bkp * s1
  b (k1) = akp * s1 + bkp * c1
  a (k2) = ajp * c2 - bjp * s2
  b (k2) = ajp * s2 + bjp * c2
  a (k3) = akm * c3 - bkm * s3
  b (k3) = akm * s3 + bkm * c3
  kk = k3 + kspan
  if (kk.le.nt) goto 420
440 c2 = c1 - (cd * c1 + sd * s1)
  s1 = (sd * c1 - cd * s1) + s1
  !     the following three statements compensate for truncation
  !     error. if rounded arithmetic is used, they may be deleted.
  c1 = 0.5d0 / (c2**2 + s1**2) + 0.5d0
  s1 = c1 * s1
  c1 = c1 * c2
  !     next statement should be deleted if non-rounded arithmetic is use
  !     c1=c2
  c2 = c1**2 - s1**2
  s2 = 2.0d0 * c1 * s1
  c3 = c2 * c1 - s2 * s1
  s3 = c2 * s1 + s2 * c1
  kk = kk - nt + jc
  if (kk.le.kspan) goto 420
  kk = kk - kspan + inc
  if (kk.le.jc) goto 410
  if (kspan.eq.jc) goto 800
  goto 100
450 akp = akm + bjm
  akm = akm - bjm
  bkp = bkm - ajm
  bkm = bkm + ajm
  if (s1.ne.0.0) goto 430
460 a (k1) = akp
  b (k1) = bkp
  a (k2) = ajp
  b (k2) = bjp
  a (k3) = akm
  b (k3) = bkm
  kk = k3 + kspan
  if (kk.le.nt) goto 420
  goto 440
  !     transform for factor of 5 (optional code)
510 c2 = c72**2 - s72**2
  s2 = 2.0d0 * c72 * s72
520 k1 = kk + kspan
  k2 = k1 + kspan
  k3 = k2 + kspan
  k4 = k3 + kspan
  akp = a (k1) + a (k4)
  akm = a (k1) - a (k4)
  bkp = b (k1) + b (k4)
  bkm = b (k1) - b (k4)
  ajp = a (k2) + a (k3)
  ajm = a (k2) - a (k3)
  bjp = b (k2) + b (k3)
  bjm = b (k2) - b (k3)
  aa = a (kk)
  bb = b (kk)
  a (kk) = aa + akp + ajp
  b (kk) = bb + bkp + bjp
  ak = akp * c72 + ajp * c2 + aa
  bk = bkp * c72 + bjp * c2 + bb
  aj = akm * s72 + ajm * s2
  bj = bkm * s72 + bjm * s2
  a (k1) = ak - bj
  a (k4) = ak + bj
  b (k1) = bk + aj
  b (k4) = bk - aj
  ak = akp * c2 + ajp * c72 + aa
  bk = bkp * c2 + bjp * c72 + bb
  aj = akm * s2 - ajm * s72
  bj = bkm * s2 - bjm * s72
  a (k2) = ak - bj
  a (k3) = ak + bj
  b (k2) = bk + aj
  b (k3) = bk - aj
  kk = k4 + kspan
  if (kk.lt.nn) goto 520
  kk = kk - nn
  if (kk.le.kspan) goto 520
  goto 700
  !     transform for odd factors
600 k = nfac (i)
  kspnn = kspan
  kspan = kspan / k
  if (k.eq.3) goto 320
  if (k.eq.5) goto 510
  if (k.eq.jf) goto 640
  jf = k
  s1 = rad / DBLE (k)
  c1 = cos (s1)
  s1 = sin (s1)
  if (jf.gt.maxf) goto 998
  ck (jf) = 1.0d0
  sk (jf) = 0.0d0
  j = 1
630 ck (j) = ck (k) * c1 + sk (k) * s1
  sk (j) = ck (k) * s1 - sk (k) * c1
  k = k - 1
  ck (k) = ck (j)
  sk (k) = - sk (j)
  j = j + 1
  if (j.lt.k) goto 630
640 k1 = kk
  k2 = kk + kspnn
  aa = a (kk)
  bb = b (kk)
  ak = aa
  bk = bb
  j = 1
  k1 = k1 + kspan
650 k2 = k2 - kspan
  j = j + 1
  at (j) = a (k1) + a (k2)
  ak = at (j) + ak
  bt (j) = b (k1) + b (k2)
  bk = bt (j) + bk
  j = j + 1
  at (j) = a (k1) - a (k2)
  bt (j) = b (k1) - b (k2)
  k1 = k1 + kspan
  if (k1.lt.k2) goto 650
  a (kk) = ak
  b (kk) = bk
  k1 = kk
  k2 = kk + kspnn
  j = 1
660 k1 = k1 + kspan
  k2 = k2 - kspan
  jj = j
  ak = aa
  bk = bb
  aj = 0.0d0
  bj = 0.0d0
  k = 1
670 k = k + 1
  ak = at (k) * ck (jj) + ak
  bk = bt (k) * ck (jj) + bk
  k = k + 1
  aj = at (k) * sk (jj) + aj
  bj = bt (k) * sk (jj) + bj
  jj = jj + j
  if (jj.gt.jf) jj = jj - jf
  if (k.lt.jf) goto 670
  k = jf - j
  a (k1) = ak - bj
  b (k1) = bk + aj
  a (k2) = ak + bj
  b (k2) = bk - aj
  j = j + 1
  if (j.lt.k) goto 660
  kk = kk + kspnn
  if (kk.le.nn) goto 640
  kk = kk - nn
  if (kk.le.kspan) goto 640
  !     multiply by rotation factor (except for factors of 2 and 4)
700 if (i.eq.m) goto 800
  kk = jc + 1
710 c2 = 1.0d0 - cd
  s1 = sd
720 c1 = c2
  s2 = s1
  kk = kk + kspan
730 ak = a (kk)
  a (kk) = c2 * ak - s2 * b (kk)
  b (kk) = s2 * ak + c2 * b (kk)
  kk = kk + kspnn
  if (kk.le.nt) goto 730
  ak = s1 * s2
  s2 = s1 * c2 + c1 * s2
  c2 = c1 * c2 - ak
  kk = kk - nt + kspan
  if (kk.le.kspnn) goto 730
  c2 = c1 - (cd * c1 + sd * s1)
  s1 = s1 + (sd * c1 - cd * s1)
  !     the following three statements compensate for truncation
  !     error. if rounded arithmetic is used, they may
  !     be deleted.
  c1 = 0.5d0 / (c2**2 + s1**2) + 0.5d0
  s1 = c1 * s1
  c2 = c1 * c2
  kk = kk - kspnn + jc
  if (kk.le.kspan) goto 720
  kk = kk - kspan + jc + inc
  if (kk.le.jc + jc) goto 710
  goto 100
  !     permute the results to normal order---done in two stages
  !     permutation for square factors of n
800 np (1) = ks
  if (kt.eq.0) goto 890
  k = kt + kt + 1
  if (m.lt.k) k = k - 1
  j = 1
  np (k + 1) = jc
810 np (j + 1) = np (j) / nfac (j)
  np (k) = np (k + 1) * nfac (j)
  j = j + 1
  k = k - 1
  if (j.lt.k) goto 810
  k3 = np (k + 1)
  kspan = np (2)
  kk = jc + 1
  k2 = kspan + 1
  j = 1
  if (n.ne.ntot) goto 850
  !     permutation for single-variate transform (optional code)
820 ak = a (kk)
  a (kk) = a (k2)
  a (k2) = ak
  bk = b (kk)
  b (kk) = b (k2)
  b (k2) = bk
  kk = kk + inc
  k2 = kspan + k2
  if (k2.lt.ks) goto 820
830 k2 = k2 - np (j)
  j = j + 1
  k2 = np (j + 1) + k2
  if (k2.gt.np (j) ) goto 830
  j = 1
840 if (kk.lt.k2) goto 820
  kk = kk + inc
  k2 = kspan + k2
  if (k2.lt.ks) goto 840
  if (kk.lt.ks) goto 830
  jc = k3
  goto 890
  !     permutation for multivariate transform
850 k = kk + jc
860 ak = a (kk)
  a (kk) = a (k2)
  a (k2) = ak
  bk = b (kk)
  b (kk) = b (k2)
  b (k2) = bk
  kk = kk + inc
  k2 = k2 + inc
  if (kk.lt.k) goto 860
  kk = kk + ks - jc
  k2 = k2 + ks - jc
  if (kk.lt.nt) goto 850
  k2 = k2 - nt + kspan
  kk = kk - nt + jc
  if (k2.lt.ks) goto 850
870 k2 = k2 - np (j)
  j = j + 1
  k2 = np (j + 1) + k2
  if (k2.gt.np (j) ) goto 870
  j = 1
880 if (kk.lt.k2) goto 850
  kk = kk + jc
  k2 = kspan + k2
  if (k2.lt.ks) goto 880
  if (kk.lt.ks) goto 870
  jc = k3
890 if (2 * kt + 1.ge.m) return
  kspnn = np (kt + 1)
  !     permutation for square-free factors of n
  j = m - kt
  nfac (j + 1) = 1
900 nfac (j) = nfac (j) * nfac (j + 1)
  j = j - 1
  if (j.ne.kt) goto 900
  kt = kt + 1
  nn = nfac (kt) - 1
  if (nn.gt.maxp) goto 998
  jj = 0
  j = 0
  goto 906
902 jj = jj - k2
  k2 = kk
  k = k + 1
  kk = nfac (k)
904 jj = kk + jj
  if (jj.ge.k2) goto 902
  np (j) = jj
906 k2 = nfac (kt)
  k = kt + 1
  kk = nfac (k)
  j = j + 1
  if (j.le.nn) goto 904
  !     determine the permutation cycles of length greater than 1
  j = 0
  goto 914
910 k = kk
  kk = np (k)
  np (k) = - kk
  if (kk.ne.j) goto 910
  k3 = kk
914 j = j + 1
  kk = np (j)
  if (kk.lt.0) goto 914
  if (kk.ne.j) goto 910
  np (j) = - j
  if (j.ne.nn) goto 914
  maxf = inc * maxf
  !     reorder a and b, following the permutation cycles
  goto 950
924 j = j - 1
  if (np (j) .lt.0) goto 924
  jj = jc
926 kspan = jj
  if (jj.gt.maxf) kspan = maxf
  jj = jj - kspan
  k = np (j)
  kk = jc * k + ii + jj
  k1 = kk + kspan
  k2 = 0
928 k2 = k2 + 1
  at (k2) = a (k1)
  bt (k2) = b (k1)
  k1 = k1 - inc
  if (k1.ne.kk) goto 928
932 k1 = kk + kspan
  k2 = k1 - jc * (k + np (k) )
  k = - np (k)
936 a (k1) = a (k2)
  b (k1) = b (k2)
  k1 = k1 - inc
  k2 = k2 - inc
  if (k1.ne.kk) goto 936
  kk = k2
  if (k.ne.j) goto 932
  k1 = kk + kspan
  k2 = 0
940 k2 = k2 + 1
  a (k1) = at (k2)
  b (k1) = bt (k2)
  k1 = k1 - inc
  if (k1.ne.kk) goto 940
  if (jj.ne.0) goto 926
  if (j.ne.1) goto 924
950 j = k3 + 1
  nt = nt - kspnn
  ii = nt - inc + 1
  if (nt.ge.0) goto 924
  return
  !     error finish, insufficient array storage
998 isn = 0
!  print 999
  print*,'Array bounds exceeded within subroutine cft'
  stop
!999 format(44h0array bounds exceeded within subroutine cft)
  end subroutine cft