////////////////////////////////////////////////////////////////////////////////
//
// Copyright (c) 2008 The Regents of the University of California
//
// This file is part of Qbox
//
// Qbox is distributed under the terms of the GNU General Public License
// as published by the Free Software Foundation, either version 2 of
// the License, or (at your option) any later version.
// See the file COPYING in the root directory of this distribution
// or <http://www.gnu.org/licenses/>.
//
////////////////////////////////////////////////////////////////////////////////
//
// ChargeDensity.cpp
//
////////////////////////////////////////////////////////////////////////////////

#include "MPIdata.h"
#include "ChargeDensity.h"
#include "Basis.h"
#include "Wavefunction.h"
#include "FourierTransform.h"
#include "SlaterDet.h"
#include "blas.h" // dasum

#include <iomanip>
#include <algorithm> // fill
#include <functional>
#include <fstream>
using namespace std;

////////////////////////////////////////////////////////////////////////////////
ChargeDensity::ChargeDensity(const Wavefunction& wf) : wf_(wf)
{
  vbasis_ = new Basis(MPIdata::g_comm(), D3vector(0,0,0));
  vbasis_->resize(wf.cell(),wf.refcell(),4.0*wf.ecut());
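  // the density contains products of wavefunctions, i.e. Fourier components
  // up to twice the wavefunction cutoff wavevector, hence the 4*ecut cutoff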
  const Basis& vb = *vbasis_;

  // define vft_, FT on vbasis context for transforming the density

  // add 2 to grid size to avoid aliasing when using non-zero k-points
  // adding 1 would suffice, but add 2 to keep even numbers
  int np0v = vb.np(0)+2;
  int np1v = vb.np(1)+2;
  int np2v = vb.np(2)+2;
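  // increase each dimension in steps of 2 until Basis::factorizable accepts it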
  while (!vb.factorizable(np0v)) np0v += 2;
  while (!vb.factorizable(np1v)) np1v += 2;
  while (!vb.factorizable(np2v)) np2v += 2;
#ifdef DEBUG
  cout << MPIdata::rank() << ": ChargeDensity: vbasis: " << endl;
  cout << MPIdata::rank() << ": idxmin: "
       << vb.idxmin(0) << "/" << vb.idxmin(1) << "/" << vb.idxmin(2) << endl;
  cout << MPIdata::rank() << ": idxmax: "
       << vb.idxmax(0) << "/" << vb.idxmax(1) << "/" << vb.idxmax(2) << endl;
  cout << MPIdata::rank() << ": vft grid: "
       << np0v << "/" << np1v << "/" << np2v << endl;
#endif
  vft_ = new FourierTransform(vb,np0v,np1v,np2v);
  total_charge_.resize(wf.nspin());
  rhor.resize(wf.nspin());
  rhog.resize(wf.nspin());
  for ( int ispin = 0; ispin < wf.nspin(); ispin++ )
  {
    rhor[ispin].resize(vft_->np012loc());
    rhog[ispin].resize(vb.localsize());
  }
  rhotmp.resize(vft_->np012loc());

#ifdef DEBUG
  cout << MPIdata::rank() << ": ChargeDensity::ctor: wf.nsp_loc()="
       << wf.nsp_loc() << " wf.nkp_loc()=" << wf.nkp_loc() << endl;
#endif

  // FT for interpolation of wavefunctions on the fine grid
  if ( wf.nsp_loc() > 0 )
  {
    for ( int ikp_loc = 0; ikp_loc < wf.nkp_loc(); ++ikp_loc )
    {
      // use basis of isp_loc==0
      const Basis& wb = wf.sd(0,ikp_loc)->basis();
#ifdef DEBUG
      cout << MPIdata::rank() << ": ChargeDensity::ctor: ikp_loc="
           << ikp_loc << " wbasis: " << endl;
      cout << MPIdata::rank() << ": idxmin: " << wb.idxmin(0)
           << "/" << wb.idxmin(1) << "/" << wb.idxmin(2) << endl;
      cout << MPIdata::rank() << ": idxmax: " << wb.idxmax(0)
           << "/" << wb.idxmax(1) << "/" << wb.idxmax(2) << endl;
#endif
      // check that no aliasing error can occur
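      // components of |psi|^2 extend to twice the wavefunction basis indices;
      // wrap-around on the fine grid must not fold back onto indices used
      // by the density basis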
      assert(2*np0v > 2*wb.idxmax(0)+vb.idxmax(0));
      assert(2*np1v > 2*wb.idxmax(1)+vb.idxmax(1));
      assert(2*np2v > 2*wb.idxmax(2)+vb.idxmax(2));
      assert(2*np0v > -2*wb.idxmin(0)-vb.idxmin(0));
      assert(2*np1v > -2*wb.idxmin(1)-vb.idxmin(1));
      assert(2*np2v > -2*wb.idxmin(2)-vb.idxmin(2));

      ft_.push_back(new FourierTransform(wb,np0v,np1v,np2v));
    }
  }
  // perform reset operation on timers to introduce them in tmap
  // this is necessary to have a tmap entry even if nsp_loc or nkp_loc == 0
  tmap["charge_compute"].reset();
  tmap["charge_rowsum"].reset();
  tmap["charge_integral"].reset();
  tmap["charge_vft"].reset();
  tmap["update_taur"].reset();
}

////////////////////////////////////////////////////////////////////////////////
ChargeDensity::~ChargeDensity(void)
{
  delete vbasis_;
  delete vft_;
  for ( int ikp_loc = 0; ikp_loc < ft_.size(); ++ikp_loc )
    delete ft_[ikp_loc];

  for ( TimerMap::iterator i = tmap.begin(); i != tmap.end(); i++ )
  {
    double time = i->second.real();
    double tmin, tmax;
    MPI_Reduce(&time,&tmin,1,MPI_DOUBLE,MPI_MIN,0,MPIdata::comm());
    MPI_Reduce(&time,&tmax,1,MPI_DOUBLE,MPI_MAX,0,MPIdata::comm());
    if ( MPIdata::onpe0() && (tmax > 0.0) )
    {
      string s = "name=\"" + (*i).first + "\"";
      cout << "<timing " << left << setw(22) << s
           << " min=\"" << setprecision(3) << tmin << "\""
           << " max=\"" << setprecision(3) << tmax << "\"/>"
           << endl;
    }
  }
}

////////////////////////////////////////////////////////////////////////////////
void ChargeDensity::update_density(void)
{
  assert(rhor.size() == wf_.nspin());
  for ( int ispin = 0; ispin < wf_.nspin(); ++ispin )
    fill(rhor[ispin].begin(),rhor[ispin].end(),0.0);

  for ( int isp_loc = 0; isp_loc < wf_.nsp_loc(); ++isp_loc )
  {
    const int ispg = wf_.isp_global(isp_loc);
    assert(rhor[ispg].size() == vft_->np012loc() );
    assert(rhotmp.size() == vft_->np012loc() );

    tmap["charge_compute"].start();
    for ( int ikp_loc = 0; ikp_loc < wf_.nkp_loc(); ++ikp_loc )
    {
      assert(ft_[ikp_loc]);
      const int ikpg = wf_.ikp_global(ikp_loc);
      assert(rhor[ispg].size()==ft_[ikp_loc]->np012loc());
      wf_.sd(isp_loc,ikp_loc)->compute_density(*ft_[ikp_loc],
          wf_.weight(ikpg), &rhor[ispg][0]);
    }
    tmap["charge_compute"].stop();
  }
  // rhor now contains local contributions from this task

  for ( int ispin = 0; ispin < wf_.nspin(); ++ispin )
  {
    // sum over kpoints, states and spins
    tmap["charge_rowsum"].start();
    vector<double> tmpr(vft_->np012loc());
    MPI_Allreduce(&rhor[ispin][0],&tmpr[0],vft_->np012loc(),
                  MPI_DOUBLE,MPI_SUM,MPIdata::st_kp_sp_comm());
    rhor[ispin] = tmpr;
    tmap["charge_rowsum"].stop();

    // check integral of charge density
    // compute Fourier coefficients of the charge density
    double sum = 0.0;
    const double *const prhor = &rhor[ispin][0];
    tmap["charge_integral"].start();
    const int rhor_size = rhor[ispin].size();
    const double omega = vbasis_->cell().volume();
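    // accumulate the real-space sum of the density for the charge integral
    // and load omega*rho(r) into rhotmp for the forward transform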
    #pragma omp parallel for reduction(+:sum)
    for ( int i = 0; i < rhor_size; i++ )
    {
      const double prh = prhor[i];
      sum += prh;
      rhotmp[i] = complex<double>(omega * prh, 0.0);
    }
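    // convert the grid-point sum to an integral: the volume element
    // of the real-space grid is omega/np012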
    sum *= omega / vft_->np012();
    double tsum = 0.0;
    // sum over g_comm
    MPI_Allreduce(&sum,&tsum,1,MPI_DOUBLE,MPI_SUM,MPIdata::g_comm());
    sum = tsum;
    tmap["charge_integral"].stop();
    total_charge_[ispin] = sum;

    // compute rhog from rhotmp
    tmap["charge_vft"].start();
    vft_->forward(&rhotmp[0],&rhog[ispin][0]);
    tmap["charge_vft"].stop();
  }
}

////////////////////////////////////////////////////////////////////////////////
void ChargeDensity::update_rhor(void)
{
  // recalculate rhor from rhog
  assert(rhor.size() == wf_.nspin());
  const double omega = vbasis_->cell().volume();
  assert(omega!=0.0);
  const double omega_inv = 1.0 / omega;

  for ( int ispin = 0; ispin < wf_.nspin(); ++ispin )
  {
    assert(rhor[ispin].size() == vft_->np012loc() );
    assert(rhotmp.size() == vft_->np012loc() );

    vft_->backward(&rhog[ispin][0],&rhotmp[0]);

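    // the real part of the backward transform, scaled by 1/omega, undoes
    // the omega scaling applied before the forward transform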
    const int rhor_size = rhor[ispin].size();
    double *const prhor = &rhor[ispin][0];
    #pragma omp parallel for
    for ( int i = 0; i < rhor_size; i++ )
      prhor[i] = rhotmp[i].real() * omega_inv;

    // integral of the charge density
    tmap["charge_integral"].start();
    int ione=1;
    int n = rhor_size;
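    // dasum returns the sum of absolute values; rhor is assumed non-negative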
    double sum = dasum(&n,prhor,&ione);
    sum *= omega / vft_->np012();

    // sum over g_comm
    double tsum = 0.0;
    MPI_Allreduce(&sum,&tsum,1,MPI_DOUBLE,MPI_SUM,MPIdata::g_comm());
    tmap["charge_integral"].stop();
    total_charge_[ispin] = tsum;
  }
}

////////////////////////////////////////////////////////////////////////////////
void ChargeDensity::update_taur(double* taur) const
{
  vector<double> tmpr(vft_->np012loc(),0.0);
  tmap["update_taur"].start();
  for ( int isp_loc = 0; isp_loc < wf_.nsp_loc(); ++isp_loc )
  {
    for ( int ikp_loc = 0; ikp_loc < wf_.nkp_loc(); ++ikp_loc )
    {
      assert(ft_[ikp_loc]);
      const int ikpg = wf_.ikp_global(ikp_loc);
      wf_.sd(isp_loc,ikp_loc)->compute_tau(*ft_[ikp_loc],
        wf_.weight(ikpg), &tmpr[0]);
    }
  }
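  // reduce the local contributions so that all tasks in st_kp_sp_comm hold
  // the kinetic energy density summed over states, k-points and spins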
  MPI_Allreduce(&tmpr[0],taur,vft_->np012loc(),
                MPI_DOUBLE,MPI_SUM,MPIdata::st_kp_sp_comm());
  tmap["update_taur"].stop();

  // stop if computing taur with NLCCs
  if ( !rhocore_r.empty() )
    assert(!"ChargeDensity: Cannot compute taur with NLCCs");
}

////////////////////////////////////////////////////////////////////////////////
void ChargeDensity::update_taur(double* taur_up, double* taur_dn) const
{
  assert(wf_.nspin()==2);
  vector<double> tmpr(vft_->np012loc());
  tmap["update_taur"].start();
  for ( int ispin = 0; ispin < wf_.nspin(); ++ispin )
  {
    memset( (void*)&tmpr[0], 0, vft_->np012loc()*sizeof(double) );
    const int isp_loc = wf_.isp_local(ispin);
    if ( isp_loc >= 0 )
    {
      for ( int ikp_loc = 0; ikp_loc < wf_.nkp_loc(); ++ikp_loc )
      {
        assert(ft_[ikp_loc]);
        const int ikpg = wf_.ikp_global(ikp_loc);
        wf_.sd(isp_loc,ikp_loc)->compute_tau(*ft_[ikp_loc],
          wf_.weight(ikpg), &tmpr[0]);
      }
    }
    // tmpr now contains local taur contrib
    // reduce to have both taur_up and taur_dn on all tasks
    if ( ispin == 0 )
    {
      MPI_Allreduce(&tmpr[0],&taur_up[0],vft_->np012loc(),
                    MPI_DOUBLE,MPI_SUM,MPIdata::st_kp_sp_comm());
    }
    else
    {
      MPI_Allreduce(&tmpr[0],&taur_dn[0],vft_->np012loc(),
                    MPI_DOUBLE,MPI_SUM,MPIdata::st_kp_sp_comm());
    }
  }
  tmap["update_taur"].stop();

  // stop if computing taur with NLCCs
  if ( !rhocore_r.empty() )
    assert(!"ChargeDensity: Cannot compute taur with NLCCs");
}

////////////////////////////////////////////////////////////////////////////////
double ChargeDensity::total_charge(void) const
{
  assert((wf_.nspin()==1)||(wf_.nspin()==2));
  if ( wf_.nspin() == 1 )
    return total_charge_[0];
  else
    return total_charge_[0] + total_charge_[1];
}

////////////////////////////////////////////////////////////////////////////////
void ChargeDensity::print(ostream& os) const
{
  os.setf(ios::fixed,ios::floatfield);
  os.setf(ios::right,ios::adjustfield);
  for ( int ispin = 0; ispin < wf_.nspin(); ispin++ )
    os << "  <electronic_charge ispin=\"" << ispin << "\"> "
       << setprecision(8) << total_charge(ispin)
       << " </electronic_charge>\n";
}

////////////////////////////////////////////////////////////////////////////////
ostream& operator<< ( ostream& os, const ChargeDensity& cd )
{
  cd.print(os);
  return os;
}

////////////////////////////////////////////////////////////////////////////////
void ChargeDensity::update_rhog(void)
{
  // recalculate rhog from rhor
  assert(rhor.size() == wf_.nspin());
  const double omega = vbasis_->cell().volume();
  assert(omega!=0.0);

  for ( int isp_loc = 0; isp_loc < wf_.nsp_loc(); ++isp_loc )
  {
    const int ispg = wf_.isp_global(isp_loc);
    const int rhor_size = rhor[ispg].size();
    double *const prhor = &rhor[ispg][0];
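    // as in update_density, load omega*rho(r) into rhotmp; the forward
    // transform then yields the Fourier coefficients rhog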
    #pragma omp parallel for
    for ( int i = 0; i < rhor_size; i++ )
      rhotmp[i] = complex<double> ( omega * prhor[i], 0);

    assert(rhotmp.size() == vft_->np012loc() );

    vft_->forward(&rhotmp[0],&rhog[ispg][0]);
  }
}