diff --git a/capolanco/README.md b/capolanco/README.md new file mode 100644 index 00000000..cbd01009 --- /dev/null +++ b/capolanco/README.md @@ -0,0 +1,37 @@ +# K-point convergence tracker (Materials) + +> Ideal candidate: scientists skilled in Density Functional Theory and proficient in python. + +# Overview + +The aim of this task is to create a python package that implements automatic convergence tracking mechanism for a materials simulations engine. The convergence is tracked with respect to the k-point sampling inside a reciprocal cell of a crystalline compound. + +# Requirements + +1. automatically find the dimensions of a k-point mesh that satisfy a certain criteria for total energy (eg. total energy is converged within dE = 0.01meV) +1. the code shall be written in a way that can facilitate easy addition of convergence wrt other characteristics extracted from simulations (forces, pressures, phonon frequencies etc) +1. the code shall support VASP or Quantum ESPRESSO + +# Expectations + +- correctly find k-point mesh that satisfies total energy convergence parameters for a set of 10 materials, starting from Si2, as simplest, to a 10-20-atom supercell of your choice +- modular and object-oriented implementation +- commit early and often - at least once per 24 hours + +# Timeline + +We leave exact timing to the candidate. Must fit Within 5 days total. + +# User story + +As a user of this software I can start it passing: + +- path to input data (eg. pw.in / POSCAR, INCAR, KPOINTS) and +- kinetic energy cutoff + +as parameters and get the k-point dimensions (eg. 5 5 5). + +# Notes + +- create an account at exabyte.io and use it for the calculation purposes +- suggested modeling engine: Quantum ESPRESSO diff --git a/capolanco/RunConvergence.py b/capolanco/RunConvergence.py new file mode 100644 index 00000000..892ecf6c --- /dev/null +++ b/capolanco/RunConvergence.py @@ -0,0 +1,121 @@ +# This code will run a k-point convergence up to a desire delta energy + +import subprocess +import ioqeclass as qe +import ioclusterclass as cluster + +########################### +##### USER INPUTS +########################### + +# Define the path of the input file +# The k-grid of this file will be set as the starting point +# for the convergence process +filein='Si.scf.in' + +# Define delta energy threshold for +# convergence (eV) +dEthreshold=1.0 # (eV) + + +########################### +##### DEVELOPERS INPUTS +########################### + +## Convergence +# maximum of iterations +Nitermax=20 +# increasing step of kgrid +kstep=2 + +## Cluster +# number of nodes to be used +Nnodes=1 +# number of processors per node +ppn=8 +# queue +queue='OR' +# walltime +walltimehours=5 +walltimeminutes=3 + + +########################### +##### PROGRAM +########################### + + +### Set up initial parameters +# Initialize pw.x input class +qeinput=qe.qepwinput() +# load the pw.x input +qeinput.load(filein) +# Create the input file for initial run +testin='test.scf.in' +testout='test.scf.out' +qeinput.save(filein,testin) +# Create the job to send to the cluster +# Initialize job class +job=cluster.jobclass() +# set up job class +job.name='test' +job.nodes=Nnodes +job.ppn=ppn +job.queue=queue +job.walltimehours=walltimehours +job.walltimeminutes=walltimeminutes +# create the job file +jobname=f'job.test.sh' +job.createjobQEpw(jobname,testin,testout) +# Run initial test +subprocess.run(['echo',f'runing {jobname}']) +##subprocess.run(['qsub',f'{jobname}']) + +# Initialize pw.x output class +qeoutput=qe.qepwoutput() +# Read the Total energy from the output +qeoutput.getenergy(testout) + + +# Loop testing for dE +dE=2.0*dEthreshold +EnergyOld=qeoutput.energy +counter=0 +while ((dE>dEthreshold) and (counter 1.29MB + + Estimated total allocated dynamical RAM > 31.06MB + + Initial potential from superposition of free atoms + + starting charge 7.99901, renormalised to 8.00000 + Starting wfc are 8 randomized atomic wfcs + + total cpu time spent up to now is 0.4 secs + + per-process dynamical memory: 2.9 Mb + + Self-consistent Calculation + + iteration # 1 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-02, avg # of iterations = 2.0 + + Threshold (ethr) on eigenvalues was too large: + Diagonalizing with lowered threshold + + Davidson diagonalization with overlap + ethr = 7.97E-04, avg # of iterations = 1.0 + + total cpu time spent up to now is 0.6 secs + + total energy = -15.84982619 Ry + Harris-Foulkes estimate = -15.87079416 Ry + estimated scf accuracy < 0.06161703 Ry + + iteration # 2 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 7.70E-04, avg # of iterations = 1.0 + + total cpu time spent up to now is 0.7 secs + + total energy = -15.85288351 Ry + Harris-Foulkes estimate = -15.85318795 Ry + estimated scf accuracy < 0.00216687 Ry + + iteration # 3 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 2.71E-05, avg # of iterations = 2.4 + + total cpu time spent up to now is 0.8 secs + + total energy = -15.85332918 Ry + Harris-Foulkes estimate = -15.85336185 Ry + estimated scf accuracy < 0.00007437 Ry + + iteration # 4 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 9.30E-07, avg # of iterations = 2.1 + + total cpu time spent up to now is 0.8 secs + + total energy = -15.85334986 Ry + Harris-Foulkes estimate = -15.85335396 Ry + estimated scf accuracy < 0.00000888 Ry + + iteration # 5 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.11E-07, avg # of iterations = 2.1 + + total cpu time spent up to now is 0.9 secs + + total energy = -15.85335134 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 0.00000011 Ry + + iteration # 6 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.35E-09, avg # of iterations = 2.6 + + total cpu time spent up to now is 1.0 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 2.9E-09 Ry + + iteration # 7 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 3.68E-11, avg # of iterations = 2.6 + + total cpu time spent up to now is 1.1 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 2.9E-11 Ry + + iteration # 8 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 3.65E-13, avg # of iterations = 3.3 + + total cpu time spent up to now is 1.2 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 5.4E-12 Ry + + iteration # 9 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-13, avg # of iterations = 1.7 + + total cpu time spent up to now is 1.3 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 1.2E-13 Ry + + iteration # 10 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-13, avg # of iterations = 1.0 + + total cpu time spent up to now is 1.4 secs + + End of self-consistent calculation + + k = 0.0000 0.0000 0.0000 ( 4477 PWs) bands (ev): + + -5.8300 6.2061 6.2061 6.2061 + + k =-0.1250 0.1250-0.1250 ( 4507 PWs) bands (ev): + + -5.6230 4.6051 5.9132 5.9132 + + k =-0.2500 0.2500-0.2500 ( 4510 PWs) bands (ev): + + -5.0182 2.2559 5.4373 5.4373 + + k =-0.3750 0.3750-0.3750 ( 4501 PWs) bands (ev): + + -4.1058 0.2065 5.1074 5.1074 + + k = 0.5000-0.5000 0.5000 ( 4476 PWs) bands (ev): + + -3.4453 -0.8427 4.9947 4.9947 + + k = 0.0000 0.2500 0.0000 ( 4504 PWs) bands (ev): + + -5.5533 4.8935 5.3857 5.3857 + + k =-0.1250 0.3750-0.1250 ( 4517 PWs) bands (ev): + + -5.0777 2.9801 4.8669 4.9518 + + k =-0.2500 0.5000-0.2500 ( 4508 PWs) bands (ev): + + -4.2481 0.8896 4.3532 4.5964 + + k = 0.6250-0.3750 0.6250 ( 4486 PWs) bands (ev): + + -3.3613 -0.6068 3.9003 4.6231 + + k = 0.5000-0.2500 0.5000 ( 4491 PWs) bands (ev): + + -3.6148 -0.2257 3.7125 4.9256 + + k = 0.3750-0.1250 0.3750 ( 4497 PWs) bands (ev): + + -4.5602 1.5598 3.8591 5.4251 + + k = 0.2500 0.0000 0.2500 ( 4477 PWs) bands (ev): + + -5.2819 3.5267 4.5444 5.9125 + + k = 0.0000 0.5000 0.0000 ( 4520 PWs) bands (ev): + + -4.7329 2.7148 4.2862 4.2862 + + k =-0.1250 0.6250-0.1250 ( 4509 PWs) bands (ev): + + -4.0117 1.2745 3.4881 3.9636 + + k = 0.7500-0.2500 0.7500 ( 4482 PWs) bands (ev): + + -3.0647 -0.1975 2.6082 3.9678 + + k = 0.6250-0.1250 0.6250 ( 4477 PWs) bands (ev): + + -2.8512 -0.4657 2.1376 4.2926 + + k = 0.5000 0.0000 0.5000 ( 4489 PWs) bands (ev): + + -3.7521 0.7207 2.3750 4.8614 + + k = 0.0000 0.7500 0.0000 ( 4484 PWs) bands (ev): + + -3.4015 0.4708 3.5586 3.5586 + + k = 0.8750-0.1250 0.8750 ( 4479 PWs) bands (ev): + + -2.4888 -0.6253 2.7002 3.4815 + + k = 0.7500 0.0000 0.7500 ( 4454 PWs) bands (ev): + + -2.0305 -1.0339 1.8049 3.7440 + + k = 0.0000-1.0000 0.0000 ( 4456 PWs) bands (ev): + + -1.6267 -1.6267 3.3090 3.3090 + + k =-0.2500 0.5000 0.0000 ( 4503 PWs) bands (ev): + + -4.4807 1.9234 3.4393 4.7592 + + k = 0.6250-0.3750 0.8750 ( 4489 PWs) bands (ev): + + -3.5748 0.3447 2.8290 4.2439 + + k = 0.5000-0.2500 0.7500 ( 4486 PWs) bands (ev): + + -2.9014 -0.6278 2.7039 4.0076 + + k = 0.7500-0.2500 1.0000 ( 4484 PWs) bands (ev): + + -3.1970 0.2501 2.7770 3.3923 + + k = 0.6250-0.1250 0.8750 ( 4486 PWs) bands (ev): + + -2.3006 -0.7332 2.0576 3.1860 + + k = 0.5000 0.0000 0.7500 ( 4490 PWs) bands (ev): + + -2.6570 -0.3670 1.8851 3.5717 + + k =-0.2500-1.0000 0.0000 ( 4472 PWs) bands (ev): + + -1.5427 -1.5427 2.7194 2.7194 + + k =-0.5000-1.0000 0.0000 ( 4488 PWs) bands (ev): + + -1.4495 -1.4495 2.2655 2.2655 + + highest occupied level (ev): 6.2061 + +! total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 4.0E-15 Ry + + The total energy is the sum of the following terms: + + one-electron contribution = 4.76680131 Ry + hartree contribution = 1.08149972 Ry + xc contribution = -4.81476914 Ry + ewald contribution = -16.88688327 Ry + + convergence has been achieved in 10 iterations + + Forces acting on atoms (cartesian axes, Ry/au): + + atom 1 type 1 force = 0.00000000 0.00000000 0.00000000 + atom 2 type 1 force = 0.00000000 0.00000000 -0.00000000 + + Total force = 0.000000 Total SCF correction = 0.000000 + + + Computing stress (Cartesian axis) and pressure + + total stress (Ry/bohr**3) (kbar) P= 0.05 + 0.00000032 -0.00000000 -0.00000000 0.05 -0.00 -0.00 + -0.00000000 0.00000032 0.00000000 -0.00 0.05 0.00 + -0.00000000 0.00000000 0.00000032 -0.00 0.00 0.05 + + + Writing output data file Si.save + + init_run : 0.06s CPU 0.23s WALL ( 1 calls) + electrons : 0.85s CPU 1.01s WALL ( 1 calls) + forces : 0.00s CPU 0.01s WALL ( 1 calls) + stress : 0.02s CPU 0.03s WALL ( 1 calls) + + Called by init_run: + wfcinit : 0.04s CPU 0.11s WALL ( 1 calls) + potinit : 0.00s CPU 0.01s WALL ( 1 calls) + + Called by electrons: + c_bands : 0.73s CPU 0.80s WALL ( 11 calls) + sum_band : 0.11s CPU 0.13s WALL ( 11 calls) + v_of_rho : 0.00s CPU 0.01s WALL ( 11 calls) + mix_rho : 0.00s CPU 0.01s WALL ( 11 calls) + + Called by c_bands: + init_us_2 : 0.01s CPU 0.03s WALL ( 725 calls) + cegterg : 0.69s CPU 0.74s WALL ( 319 calls) + + Called by sum_band: + + Called by *egterg: + h_psi : 0.62s CPU 0.65s WALL ( 980 calls) + g_psi : 0.00s CPU 0.00s WALL ( 632 calls) + cdiaghg : 0.05s CPU 0.10s WALL ( 922 calls) + + Called by h_psi: + h_psi:pot : 0.61s CPU 0.65s WALL ( 980 calls) + h_psi:calbec : 0.03s CPU 0.04s WALL ( 980 calls) + vloc_psi : 0.57s CPU 0.59s WALL ( 980 calls) + add_vuspsi : 0.01s CPU 0.01s WALL ( 980 calls) + + General routines + calbec : 0.03s CPU 0.05s WALL ( 1125 calls) + fft : 0.01s CPU 0.05s WALL ( 50 calls) + fftw : 0.57s CPU 0.64s WALL ( 8656 calls) + davcio : 0.00s CPU 0.06s WALL ( 29 calls) + + Parallel routines + fft_scatter : 0.29s CPU 0.31s WALL ( 8706 calls) + + PWSCF : 1.07s CPU 2.22s WALL + + + This run was terminated on: 19:30: 3 27Sep2017 + +=------------------------------------------------------------------------------= + JOB DONE. +=------------------------------------------------------------------------------= diff --git a/capolanco/__pycache__/ioclusterclass.cpython-39.pyc b/capolanco/__pycache__/ioclusterclass.cpython-39.pyc new file mode 100644 index 00000000..12df40cf Binary files /dev/null and b/capolanco/__pycache__/ioclusterclass.cpython-39.pyc differ diff --git a/capolanco/__pycache__/ioqeclass.cpython-39.pyc b/capolanco/__pycache__/ioqeclass.cpython-39.pyc new file mode 100644 index 00000000..c38ad36a Binary files /dev/null and b/capolanco/__pycache__/ioqeclass.cpython-39.pyc differ diff --git a/capolanco/ioclusterclass.py b/capolanco/ioclusterclass.py new file mode 100644 index 00000000..ea4e0716 --- /dev/null +++ b/capolanco/ioclusterclass.py @@ -0,0 +1,58 @@ +import numpy as np + + +## THINGS TO FIX + +class jobclass: + """This class creates jobs for the cluster""" + + ################### + ## Initialization function for the class + ################### + def __init__(self): + + ## name of the job + self.name='Unset' + ## number of nodes + self.nodes=np.int64(1) + ## number of processors per node + self.ppn=np.int64(1) + ## queue + self.queue='D' + ## walltime (in hours) + self.walltimehours=np.int64(1) + self.walltimeminutes=np.int64(0) + + + ################### + ## Create the job for QE pw.x calculation + ################### + def createjobQEpw(self,jobname,pwinput,pwoutput): + # Inputs + # jobname is the name of the job + # pwinput is the path of the input file + # pwoutput is the path of the output file + + print('') + print(f'#########################') + print(f'## Creating job {jobname}') + + # Open file + f=open(jobname,'w') + + # Write heather of job + f.write(f'#!/bin/bash\n\n') + f.write(f'#PBS -N {self.name}\n') + f.write(f'#PBS -l nodes={self.nodes}\n') + f.write(f'#PBS -l ppn={self.ppn}\n') + f.write(f'#PBS -q {self.queue}\n') + f.write(f'#PBS -j oe\n') + f.write(f'#PBS -l walltime={self.walltimehours:02d}:{self.walltimeminutes:02d}:00\n\n') + + f.write(f'cd $PBS_O_WORKDIR\n') + f.write(f'module load espresso\n') + f.write(f'mpirun -np $PBS_NP pw.x {pwinput} {pwoutput}\n') + + f.close() + + diff --git a/capolanco/ioqeclass.py b/capolanco/ioqeclass.py new file mode 100644 index 00000000..af2c452a --- /dev/null +++ b/capolanco/ioqeclass.py @@ -0,0 +1,132 @@ +import numpy as np + + +## THINGS TO FIX + +class qepwinput: + """This class describes the Quantum Espresso input for a pw.x calculation""" + + ################### + ## Initialization function for the class + ################### + def __init__(self): + + ## k-grid + self.kgrid=np.array([1,1,1],dtype='int64') + + ################### + ## Load pw.x input file + ## This function loads a pw.x input file into + ## the qepwinput class + ################### + def load(self,filename): + # Inputs + # filename is the path to pw.x input file + + print('') + print(f'#########################') + print(f'## Loading pw.x input from file {filename}') + + # Open file + f=open(filename,'r') + + ## Retrieve k-grid + # Loop over pw.x input file up to the kgrid information + for line in f: + x=line.split() + # if line is not empty + if x: + if (x[0]=='K_POINTS'): + break + # Read and save the k-grid information + line=f.readline() + x=line.split() + self.kgrid[0]=np.int64(x[0]) + self.kgrid[1]=np.int64(x[1]) + self.kgrid[2]=np.int64(x[2]) + + f.close() + + + ################### + ## Save pw.x input file + ## This function saves an input file from a template + ## replacing the current parameters of the qepwinput class + ################### + def save(self,template,filename): + # Inputs + # template is the path of the template pw.x input file + # filename is the path to pw.x input file that will be created + + print('') + print(f'#########################') + print(f'## Saving pw.x input to file {filename}') + + # Open template file + template=open(template,'r') + + # Open output file + f=open(filename,'w') + + # Loop over pw.x input template and copy it up to + # the kgrid information + for line in template: + f.write(line) + x=line.split() + # if line is not empty + if x: + if (x[0]=='K_POINTS'): + break + # write the k-grid information + f.write(f' {self.kgrid[0]} {self.kgrid[1]} {self.kgrid[2]} 0 0 0') + + f.close() + template.close() + + + + + + +class qepwoutput: + """This class handle the Quantum Espresso output for a pw.x calculation""" + + ################### + ## Initialization function for the class + ################### + def __init__(self): + + ## energy (eV) + self.energy=np.array([0.0e0],dtype='double') + + ################### + ## Reads Total Energy from pw.x output file + ## This function read the total energy from the output of a + ## pw.x calculation + ################### + def getenergy(self,filename): + # Inputs + # filename is the path to pw.x output file + # Output + # the energy is returned in self.energy in eV + + print('') + print(f'#########################') + print(f'## Reading total energy from pw.x output from file {filename}') + + # Open file + f=open(filename,'r') + + ## Retrieve energy + # Loop over pw.x output file up to the total energy + for line in f: + x=line.split() + # if line is not empty + if x: + if (x[0]=='!'): + self.energy=np.double(x[4]) # (Ry) + break + + # Convert to eV + self.energy=self.energy*13.605693122 # (eV) + f.close() diff --git a/capolanco/job.test.sh b/capolanco/job.test.sh new file mode 100644 index 00000000..ddcc703e --- /dev/null +++ b/capolanco/job.test.sh @@ -0,0 +1,12 @@ +#!/bin/bash + +#PBS -N test +#PBS -l nodes=1 +#PBS -l ppn=8 +#PBS -q OR +#PBS -j oe +#PBS -l walltime=05:03:00 + +cd $PBS_O_WORKDIR +module load espresso +mpirun -np $PBS_NP pw.x test.scf.in test.scf.out diff --git a/capolanco/job.test1.sh b/capolanco/job.test1.sh new file mode 100644 index 00000000..9ce1cf81 --- /dev/null +++ b/capolanco/job.test1.sh @@ -0,0 +1,12 @@ +#!/bin/bash + +#PBS -N test +#PBS -l nodes=1 +#PBS -l ppn=8 +#PBS -q OR +#PBS -j oe +#PBS -l walltime=05:03:00 + +cd $PBS_O_WORKDIR +module load espresso +mpirun -np $PBS_NP pw.x test.scf1.in test.scf1.out diff --git a/capolanco/job.test2.sh b/capolanco/job.test2.sh new file mode 100644 index 00000000..1b628d2c --- /dev/null +++ b/capolanco/job.test2.sh @@ -0,0 +1,12 @@ +#!/bin/bash + +#PBS -N test +#PBS -l nodes=1 +#PBS -l ppn=8 +#PBS -q OR +#PBS -j oe +#PBS -l walltime=05:03:00 + +cd $PBS_O_WORKDIR +module load espresso +mpirun -np $PBS_NP pw.x test.scf2.in test.scf2.out diff --git a/capolanco/job.test3.sh b/capolanco/job.test3.sh new file mode 100644 index 00000000..33c390a3 --- /dev/null +++ b/capolanco/job.test3.sh @@ -0,0 +1,12 @@ +#!/bin/bash + +#PBS -N test +#PBS -l nodes=1 +#PBS -l ppn=8 +#PBS -q OR +#PBS -j oe +#PBS -l walltime=05:03:00 + +cd $PBS_O_WORKDIR +module load espresso +mpirun -np $PBS_NP pw.x test.scf3.in test.scf3.out diff --git a/capolanco/job.test4.sh b/capolanco/job.test4.sh new file mode 100644 index 00000000..26d9d500 --- /dev/null +++ b/capolanco/job.test4.sh @@ -0,0 +1,12 @@ +#!/bin/bash + +#PBS -N test +#PBS -l nodes=1 +#PBS -l ppn=8 +#PBS -q OR +#PBS -j oe +#PBS -l walltime=05:03:00 + +cd $PBS_O_WORKDIR +module load espresso +mpirun -np $PBS_NP pw.x test.scf4.in test.scf4.out diff --git a/capolanco/test.scf.in b/capolanco/test.scf.in new file mode 100644 index 00000000..0203478a --- /dev/null +++ b/capolanco/test.scf.in @@ -0,0 +1,30 @@ + &control + calculation='scf', + outdir = '/global/cscratch1/sd/cpolanco/Si/', + prefix='Si', + pseudo_dir = '/global/homes/c/cpolanco/Materials/pseudo/', + restart_mode='from_scratch', + tprnfor= .true., + tstress= .true., + / + &system + ibrav= 2, + celldm(1)= 10.20777693, + nat= 2, + ntyp= 1, + ecutwfc= 100.0 + / + &electrons + mixing_beta= 0.7 + conv_thr= 1.0d-14 + / + +ATOMIC_SPECIES + Si 28.086 Si.pz-vbc.UPF + +ATOMIC_POSITIONS (alat) + Si 0.00 0.00 0.00 + Si 0.25 0.25 0.25 + +K_POINTS (automatic) + 8 8 8 0 0 0 \ No newline at end of file diff --git a/capolanco/test.scf.out b/capolanco/test.scf.out new file mode 100644 index 00000000..ce3f6334 --- /dev/null +++ b/capolanco/test.scf.out @@ -0,0 +1,437 @@ + + Program PWSCF v.6.1 starts on 27Sep2017 at 19:30: 1 + + This program is part of the open-source Quantum ESPRESSO suite + for quantum simulation of materials; please cite + "P. Giannozzi et al., J. Phys.:Condens. Matter 21 395502 (2009); + URL http://www.quantum-espresso.org", + in publications or presentations arising from this work. More details at + http://www.quantum-espresso.org/quote + + Parallel version (MPI & OpenMP), running on 24 processor cores + Number of MPI processes: 24 + Threads/MPI process: 1 + R & G space division: proc/nbgrp/npool/nimage = 24 + Waiting for input... + Reading input from standard input + + Current dimensions of program PWSCF are: + Max number of different atomic species (ntypx) = 10 + Max number of k-points (npk) = 40000 + Max angular momentum in pseudopotentials (lmaxx) = 3 + + Subspace diagonalization in iterative solution of the eigenvalue problem: + a serial algorithm will be used + + + Parallelization info + -------------------- + sticks: dense smooth PW G-vecs: dense smooth PW + Min 59 59 17 1489 1489 232 + Max 60 60 18 1494 1494 235 + Sum 1417 1417 421 35749 35749 5601 + + + + bravais-lattice index = 2 + lattice parameter (alat) = 10.2078 a.u. + unit-cell volume = 265.9093 (a.u.)^3 + number of atoms/cell = 2 + number of atomic types = 1 + number of electrons = 8.00 + number of Kohn-Sham states= 4 + kinetic-energy cutoff = 100.0000 Ry + charge density cutoff = 400.0000 Ry + convergence threshold = 1.0E-14 + mixing beta = 0.7000 + number of iterations used = 8 plain mixing + Exchange-correlation = SLA PZ NOGX NOGC ( 1 1 0 0 0 0) + + celldm(1)= 10.207777 celldm(2)= 0.000000 celldm(3)= 0.000000 + celldm(4)= 0.000000 celldm(5)= 0.000000 celldm(6)= 0.000000 + + crystal axes: (cart. coord. in units of alat) + a(1) = ( -0.500000 0.000000 0.500000 ) + a(2) = ( 0.000000 0.500000 0.500000 ) + a(3) = ( -0.500000 0.500000 0.000000 ) + + reciprocal axes: (cart. coord. in units 2 pi/alat) + b(1) = ( -1.000000 -1.000000 1.000000 ) + b(2) = ( 1.000000 1.000000 1.000000 ) + b(3) = ( -1.000000 1.000000 -1.000000 ) + + + PseudoPot. # 1 for Si read from file: + /global/homes/c/cpolanco/Materials/pseudo/Si.pz-vbc.UPF + MD5 check sum: 6dfa03ddd5817404712e03e4d12deb78 + Pseudo is Norm-conserving, Zval = 4.0 + Generated by new atomic code, or converted to UPF format + Using radial grid of 431 points, 2 beta functions with: + l(1) = 0 + l(2) = 1 + + atomic species valence mass pseudopotential + Si 4.00 28.08600 Si( 1.00) + + 24 Sym. Ops. (no inversion) found + (note: 24 additional sym.ops. were found but ignored + their fractional translations are incommensurate with FFT grid) + + + Cartesian axes + + site n. atom positions (alat units) + 1 Si tau( 1) = ( 0.0000000 0.0000000 0.0000000 ) + 2 Si tau( 2) = ( 0.2500000 0.2500000 0.2500000 ) + + number of k points= 29 + cart. coord. in units 2pi/alat + k( 1) = ( 0.0000000 0.0000000 0.0000000), wk = 0.0039062 + k( 2) = ( -0.1250000 0.1250000 -0.1250000), wk = 0.0312500 + k( 3) = ( -0.2500000 0.2500000 -0.2500000), wk = 0.0312500 + k( 4) = ( -0.3750000 0.3750000 -0.3750000), wk = 0.0312500 + k( 5) = ( 0.5000000 -0.5000000 0.5000000), wk = 0.0156250 + k( 6) = ( 0.0000000 0.2500000 0.0000000), wk = 0.0234375 + k( 7) = ( -0.1250000 0.3750000 -0.1250000), wk = 0.0937500 + k( 8) = ( -0.2500000 0.5000000 -0.2500000), wk = 0.0937500 + k( 9) = ( 0.6250000 -0.3750000 0.6250000), wk = 0.0937500 + k( 10) = ( 0.5000000 -0.2500000 0.5000000), wk = 0.0937500 + k( 11) = ( 0.3750000 -0.1250000 0.3750000), wk = 0.0937500 + k( 12) = ( 0.2500000 0.0000000 0.2500000), wk = 0.0468750 + k( 13) = ( 0.0000000 0.5000000 0.0000000), wk = 0.0234375 + k( 14) = ( -0.1250000 0.6250000 -0.1250000), wk = 0.0937500 + k( 15) = ( 0.7500000 -0.2500000 0.7500000), wk = 0.0937500 + k( 16) = ( 0.6250000 -0.1250000 0.6250000), wk = 0.0937500 + k( 17) = ( 0.5000000 0.0000000 0.5000000), wk = 0.0468750 + k( 18) = ( 0.0000000 0.7500000 0.0000000), wk = 0.0234375 + k( 19) = ( 0.8750000 -0.1250000 0.8750000), wk = 0.0937500 + k( 20) = ( 0.7500000 0.0000000 0.7500000), wk = 0.0468750 + k( 21) = ( 0.0000000 -1.0000000 0.0000000), wk = 0.0117188 + k( 22) = ( -0.2500000 0.5000000 0.0000000), wk = 0.0937500 + k( 23) = ( 0.6250000 -0.3750000 0.8750000), wk = 0.1875000 + k( 24) = ( 0.5000000 -0.2500000 0.7500000), wk = 0.0937500 + k( 25) = ( 0.7500000 -0.2500000 1.0000000), wk = 0.0937500 + k( 26) = ( 0.6250000 -0.1250000 0.8750000), wk = 0.1875000 + k( 27) = ( 0.5000000 0.0000000 0.7500000), wk = 0.0937500 + k( 28) = ( -0.2500000 -1.0000000 0.0000000), wk = 0.0468750 + k( 29) = ( -0.5000000 -1.0000000 0.0000000), wk = 0.0234375 + + Dense grid: 35749 G-vectors FFT dimensions: ( 45, 45, 45) + + Estimated max dynamical RAM per process > 1.29MB + + Estimated total allocated dynamical RAM > 31.06MB + + Initial potential from superposition of free atoms + + starting charge 7.99901, renormalised to 8.00000 + Starting wfc are 8 randomized atomic wfcs + + total cpu time spent up to now is 0.4 secs + + per-process dynamical memory: 2.9 Mb + + Self-consistent Calculation + + iteration # 1 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-02, avg # of iterations = 2.0 + + Threshold (ethr) on eigenvalues was too large: + Diagonalizing with lowered threshold + + Davidson diagonalization with overlap + ethr = 7.97E-04, avg # of iterations = 1.0 + + total cpu time spent up to now is 0.6 secs + + total energy = -15.84982619 Ry + Harris-Foulkes estimate = -15.87079416 Ry + estimated scf accuracy < 0.06161703 Ry + + iteration # 2 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 7.70E-04, avg # of iterations = 1.0 + + total cpu time spent up to now is 0.7 secs + + total energy = -15.85288351 Ry + Harris-Foulkes estimate = -15.85318795 Ry + estimated scf accuracy < 0.00216687 Ry + + iteration # 3 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 2.71E-05, avg # of iterations = 2.4 + + total cpu time spent up to now is 0.8 secs + + total energy = -15.85332918 Ry + Harris-Foulkes estimate = -15.85336185 Ry + estimated scf accuracy < 0.00007437 Ry + + iteration # 4 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 9.30E-07, avg # of iterations = 2.1 + + total cpu time spent up to now is 0.8 secs + + total energy = -15.85334986 Ry + Harris-Foulkes estimate = -15.85335396 Ry + estimated scf accuracy < 0.00000888 Ry + + iteration # 5 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.11E-07, avg # of iterations = 2.1 + + total cpu time spent up to now is 0.9 secs + + total energy = -15.85335134 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 0.00000011 Ry + + iteration # 6 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.35E-09, avg # of iterations = 2.6 + + total cpu time spent up to now is 1.0 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 2.9E-09 Ry + + iteration # 7 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 3.68E-11, avg # of iterations = 2.6 + + total cpu time spent up to now is 1.1 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 2.9E-11 Ry + + iteration # 8 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 3.65E-13, avg # of iterations = 3.3 + + total cpu time spent up to now is 1.2 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 5.4E-12 Ry + + iteration # 9 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-13, avg # of iterations = 1.7 + + total cpu time spent up to now is 1.3 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 1.2E-13 Ry + + iteration # 10 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-13, avg # of iterations = 1.0 + + total cpu time spent up to now is 1.4 secs + + End of self-consistent calculation + + k = 0.0000 0.0000 0.0000 ( 4477 PWs) bands (ev): + + -5.8300 6.2061 6.2061 6.2061 + + k =-0.1250 0.1250-0.1250 ( 4507 PWs) bands (ev): + + -5.6230 4.6051 5.9132 5.9132 + + k =-0.2500 0.2500-0.2500 ( 4510 PWs) bands (ev): + + -5.0182 2.2559 5.4373 5.4373 + + k =-0.3750 0.3750-0.3750 ( 4501 PWs) bands (ev): + + -4.1058 0.2065 5.1074 5.1074 + + k = 0.5000-0.5000 0.5000 ( 4476 PWs) bands (ev): + + -3.4453 -0.8427 4.9947 4.9947 + + k = 0.0000 0.2500 0.0000 ( 4504 PWs) bands (ev): + + -5.5533 4.8935 5.3857 5.3857 + + k =-0.1250 0.3750-0.1250 ( 4517 PWs) bands (ev): + + -5.0777 2.9801 4.8669 4.9518 + + k =-0.2500 0.5000-0.2500 ( 4508 PWs) bands (ev): + + -4.2481 0.8896 4.3532 4.5964 + + k = 0.6250-0.3750 0.6250 ( 4486 PWs) bands (ev): + + -3.3613 -0.6068 3.9003 4.6231 + + k = 0.5000-0.2500 0.5000 ( 4491 PWs) bands (ev): + + -3.6148 -0.2257 3.7125 4.9256 + + k = 0.3750-0.1250 0.3750 ( 4497 PWs) bands (ev): + + -4.5602 1.5598 3.8591 5.4251 + + k = 0.2500 0.0000 0.2500 ( 4477 PWs) bands (ev): + + -5.2819 3.5267 4.5444 5.9125 + + k = 0.0000 0.5000 0.0000 ( 4520 PWs) bands (ev): + + -4.7329 2.7148 4.2862 4.2862 + + k =-0.1250 0.6250-0.1250 ( 4509 PWs) bands (ev): + + -4.0117 1.2745 3.4881 3.9636 + + k = 0.7500-0.2500 0.7500 ( 4482 PWs) bands (ev): + + -3.0647 -0.1975 2.6082 3.9678 + + k = 0.6250-0.1250 0.6250 ( 4477 PWs) bands (ev): + + -2.8512 -0.4657 2.1376 4.2926 + + k = 0.5000 0.0000 0.5000 ( 4489 PWs) bands (ev): + + -3.7521 0.7207 2.3750 4.8614 + + k = 0.0000 0.7500 0.0000 ( 4484 PWs) bands (ev): + + -3.4015 0.4708 3.5586 3.5586 + + k = 0.8750-0.1250 0.8750 ( 4479 PWs) bands (ev): + + -2.4888 -0.6253 2.7002 3.4815 + + k = 0.7500 0.0000 0.7500 ( 4454 PWs) bands (ev): + + -2.0305 -1.0339 1.8049 3.7440 + + k = 0.0000-1.0000 0.0000 ( 4456 PWs) bands (ev): + + -1.6267 -1.6267 3.3090 3.3090 + + k =-0.2500 0.5000 0.0000 ( 4503 PWs) bands (ev): + + -4.4807 1.9234 3.4393 4.7592 + + k = 0.6250-0.3750 0.8750 ( 4489 PWs) bands (ev): + + -3.5748 0.3447 2.8290 4.2439 + + k = 0.5000-0.2500 0.7500 ( 4486 PWs) bands (ev): + + -2.9014 -0.6278 2.7039 4.0076 + + k = 0.7500-0.2500 1.0000 ( 4484 PWs) bands (ev): + + -3.1970 0.2501 2.7770 3.3923 + + k = 0.6250-0.1250 0.8750 ( 4486 PWs) bands (ev): + + -2.3006 -0.7332 2.0576 3.1860 + + k = 0.5000 0.0000 0.7500 ( 4490 PWs) bands (ev): + + -2.6570 -0.3670 1.8851 3.5717 + + k =-0.2500-1.0000 0.0000 ( 4472 PWs) bands (ev): + + -1.5427 -1.5427 2.7194 2.7194 + + k =-0.5000-1.0000 0.0000 ( 4488 PWs) bands (ev): + + -1.4495 -1.4495 2.2655 2.2655 + + highest occupied level (ev): 6.2061 + +! total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 4.0E-15 Ry + + The total energy is the sum of the following terms: + + one-electron contribution = 4.76680131 Ry + hartree contribution = 1.08149972 Ry + xc contribution = -4.81476914 Ry + ewald contribution = -16.88688327 Ry + + convergence has been achieved in 10 iterations + + Forces acting on atoms (cartesian axes, Ry/au): + + atom 1 type 1 force = 0.00000000 0.00000000 0.00000000 + atom 2 type 1 force = 0.00000000 0.00000000 -0.00000000 + + Total force = 0.000000 Total SCF correction = 0.000000 + + + Computing stress (Cartesian axis) and pressure + + total stress (Ry/bohr**3) (kbar) P= 0.05 + 0.00000032 -0.00000000 -0.00000000 0.05 -0.00 -0.00 + -0.00000000 0.00000032 0.00000000 -0.00 0.05 0.00 + -0.00000000 0.00000000 0.00000032 -0.00 0.00 0.05 + + + Writing output data file Si.save + + init_run : 0.06s CPU 0.23s WALL ( 1 calls) + electrons : 0.85s CPU 1.01s WALL ( 1 calls) + forces : 0.00s CPU 0.01s WALL ( 1 calls) + stress : 0.02s CPU 0.03s WALL ( 1 calls) + + Called by init_run: + wfcinit : 0.04s CPU 0.11s WALL ( 1 calls) + potinit : 0.00s CPU 0.01s WALL ( 1 calls) + + Called by electrons: + c_bands : 0.73s CPU 0.80s WALL ( 11 calls) + sum_band : 0.11s CPU 0.13s WALL ( 11 calls) + v_of_rho : 0.00s CPU 0.01s WALL ( 11 calls) + mix_rho : 0.00s CPU 0.01s WALL ( 11 calls) + + Called by c_bands: + init_us_2 : 0.01s CPU 0.03s WALL ( 725 calls) + cegterg : 0.69s CPU 0.74s WALL ( 319 calls) + + Called by sum_band: + + Called by *egterg: + h_psi : 0.62s CPU 0.65s WALL ( 980 calls) + g_psi : 0.00s CPU 0.00s WALL ( 632 calls) + cdiaghg : 0.05s CPU 0.10s WALL ( 922 calls) + + Called by h_psi: + h_psi:pot : 0.61s CPU 0.65s WALL ( 980 calls) + h_psi:calbec : 0.03s CPU 0.04s WALL ( 980 calls) + vloc_psi : 0.57s CPU 0.59s WALL ( 980 calls) + add_vuspsi : 0.01s CPU 0.01s WALL ( 980 calls) + + General routines + calbec : 0.03s CPU 0.05s WALL ( 1125 calls) + fft : 0.01s CPU 0.05s WALL ( 50 calls) + fftw : 0.57s CPU 0.64s WALL ( 8656 calls) + davcio : 0.00s CPU 0.06s WALL ( 29 calls) + + Parallel routines + fft_scatter : 0.29s CPU 0.31s WALL ( 8706 calls) + + PWSCF : 1.07s CPU 2.22s WALL + + + This run was terminated on: 19:30: 3 27Sep2017 + +=------------------------------------------------------------------------------= + JOB DONE. +=------------------------------------------------------------------------------= diff --git a/capolanco/test.scf1.in b/capolanco/test.scf1.in new file mode 100644 index 00000000..6244684f --- /dev/null +++ b/capolanco/test.scf1.in @@ -0,0 +1,30 @@ + &control + calculation='scf', + outdir = '/global/cscratch1/sd/cpolanco/Si/', + prefix='Si', + pseudo_dir = '/global/homes/c/cpolanco/Materials/pseudo/', + restart_mode='from_scratch', + tprnfor= .true., + tstress= .true., + / + &system + ibrav= 2, + celldm(1)= 10.20777693, + nat= 2, + ntyp= 1, + ecutwfc= 100.0 + / + &electrons + mixing_beta= 0.7 + conv_thr= 1.0d-14 + / + +ATOMIC_SPECIES + Si 28.086 Si.pz-vbc.UPF + +ATOMIC_POSITIONS (alat) + Si 0.00 0.00 0.00 + Si 0.25 0.25 0.25 + +K_POINTS (automatic) + 10 10 10 0 0 0 \ No newline at end of file diff --git a/capolanco/test.scf1.out b/capolanco/test.scf1.out new file mode 100644 index 00000000..92f25c0c --- /dev/null +++ b/capolanco/test.scf1.out @@ -0,0 +1,437 @@ + + Program PWSCF v.6.1 starts on 27Sep2017 at 19:30: 1 + + This program is part of the open-source Quantum ESPRESSO suite + for quantum simulation of materials; please cite + "P. Giannozzi et al., J. Phys.:Condens. Matter 21 395502 (2009); + URL http://www.quantum-espresso.org", + in publications or presentations arising from this work. More details at + http://www.quantum-espresso.org/quote + + Parallel version (MPI & OpenMP), running on 24 processor cores + Number of MPI processes: 24 + Threads/MPI process: 1 + R & G space division: proc/nbgrp/npool/nimage = 24 + Waiting for input... + Reading input from standard input + + Current dimensions of program PWSCF are: + Max number of different atomic species (ntypx) = 10 + Max number of k-points (npk) = 40000 + Max angular momentum in pseudopotentials (lmaxx) = 3 + + Subspace diagonalization in iterative solution of the eigenvalue problem: + a serial algorithm will be used + + + Parallelization info + -------------------- + sticks: dense smooth PW G-vecs: dense smooth PW + Min 59 59 17 1489 1489 232 + Max 60 60 18 1494 1494 235 + Sum 1417 1417 421 35749 35749 5601 + + + + bravais-lattice index = 2 + lattice parameter (alat) = 10.2078 a.u. + unit-cell volume = 265.9093 (a.u.)^3 + number of atoms/cell = 2 + number of atomic types = 1 + number of electrons = 8.00 + number of Kohn-Sham states= 4 + kinetic-energy cutoff = 100.0000 Ry + charge density cutoff = 400.0000 Ry + convergence threshold = 1.0E-14 + mixing beta = 0.7000 + number of iterations used = 8 plain mixing + Exchange-correlation = SLA PZ NOGX NOGC ( 1 1 0 0 0 0) + + celldm(1)= 10.207777 celldm(2)= 0.000000 celldm(3)= 0.000000 + celldm(4)= 0.000000 celldm(5)= 0.000000 celldm(6)= 0.000000 + + crystal axes: (cart. coord. in units of alat) + a(1) = ( -0.500000 0.000000 0.500000 ) + a(2) = ( 0.000000 0.500000 0.500000 ) + a(3) = ( -0.500000 0.500000 0.000000 ) + + reciprocal axes: (cart. coord. in units 2 pi/alat) + b(1) = ( -1.000000 -1.000000 1.000000 ) + b(2) = ( 1.000000 1.000000 1.000000 ) + b(3) = ( -1.000000 1.000000 -1.000000 ) + + + PseudoPot. # 1 for Si read from file: + /global/homes/c/cpolanco/Materials/pseudo/Si.pz-vbc.UPF + MD5 check sum: 6dfa03ddd5817404712e03e4d12deb78 + Pseudo is Norm-conserving, Zval = 4.0 + Generated by new atomic code, or converted to UPF format + Using radial grid of 431 points, 2 beta functions with: + l(1) = 0 + l(2) = 1 + + atomic species valence mass pseudopotential + Si 4.00 28.08600 Si( 1.00) + + 24 Sym. Ops. (no inversion) found + (note: 24 additional sym.ops. were found but ignored + their fractional translations are incommensurate with FFT grid) + + + Cartesian axes + + site n. atom positions (alat units) + 1 Si tau( 1) = ( 0.0000000 0.0000000 0.0000000 ) + 2 Si tau( 2) = ( 0.2500000 0.2500000 0.2500000 ) + + number of k points= 29 + cart. coord. in units 2pi/alat + k( 1) = ( 0.0000000 0.0000000 0.0000000), wk = 0.0039062 + k( 2) = ( -0.1250000 0.1250000 -0.1250000), wk = 0.0312500 + k( 3) = ( -0.2500000 0.2500000 -0.2500000), wk = 0.0312500 + k( 4) = ( -0.3750000 0.3750000 -0.3750000), wk = 0.0312500 + k( 5) = ( 0.5000000 -0.5000000 0.5000000), wk = 0.0156250 + k( 6) = ( 0.0000000 0.2500000 0.0000000), wk = 0.0234375 + k( 7) = ( -0.1250000 0.3750000 -0.1250000), wk = 0.0937500 + k( 8) = ( -0.2500000 0.5000000 -0.2500000), wk = 0.0937500 + k( 9) = ( 0.6250000 -0.3750000 0.6250000), wk = 0.0937500 + k( 10) = ( 0.5000000 -0.2500000 0.5000000), wk = 0.0937500 + k( 11) = ( 0.3750000 -0.1250000 0.3750000), wk = 0.0937500 + k( 12) = ( 0.2500000 0.0000000 0.2500000), wk = 0.0468750 + k( 13) = ( 0.0000000 0.5000000 0.0000000), wk = 0.0234375 + k( 14) = ( -0.1250000 0.6250000 -0.1250000), wk = 0.0937500 + k( 15) = ( 0.7500000 -0.2500000 0.7500000), wk = 0.0937500 + k( 16) = ( 0.6250000 -0.1250000 0.6250000), wk = 0.0937500 + k( 17) = ( 0.5000000 0.0000000 0.5000000), wk = 0.0468750 + k( 18) = ( 0.0000000 0.7500000 0.0000000), wk = 0.0234375 + k( 19) = ( 0.8750000 -0.1250000 0.8750000), wk = 0.0937500 + k( 20) = ( 0.7500000 0.0000000 0.7500000), wk = 0.0468750 + k( 21) = ( 0.0000000 -1.0000000 0.0000000), wk = 0.0117188 + k( 22) = ( -0.2500000 0.5000000 0.0000000), wk = 0.0937500 + k( 23) = ( 0.6250000 -0.3750000 0.8750000), wk = 0.1875000 + k( 24) = ( 0.5000000 -0.2500000 0.7500000), wk = 0.0937500 + k( 25) = ( 0.7500000 -0.2500000 1.0000000), wk = 0.0937500 + k( 26) = ( 0.6250000 -0.1250000 0.8750000), wk = 0.1875000 + k( 27) = ( 0.5000000 0.0000000 0.7500000), wk = 0.0937500 + k( 28) = ( -0.2500000 -1.0000000 0.0000000), wk = 0.0468750 + k( 29) = ( -0.5000000 -1.0000000 0.0000000), wk = 0.0234375 + + Dense grid: 35749 G-vectors FFT dimensions: ( 45, 45, 45) + + Estimated max dynamical RAM per process > 1.29MB + + Estimated total allocated dynamical RAM > 31.06MB + + Initial potential from superposition of free atoms + + starting charge 7.99901, renormalised to 8.00000 + Starting wfc are 8 randomized atomic wfcs + + total cpu time spent up to now is 0.4 secs + + per-process dynamical memory: 2.9 Mb + + Self-consistent Calculation + + iteration # 1 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-02, avg # of iterations = 2.0 + + Threshold (ethr) on eigenvalues was too large: + Diagonalizing with lowered threshold + + Davidson diagonalization with overlap + ethr = 7.97E-04, avg # of iterations = 1.0 + + total cpu time spent up to now is 0.6 secs + + total energy = -15.84982619 Ry + Harris-Foulkes estimate = -15.87079416 Ry + estimated scf accuracy < 0.06161703 Ry + + iteration # 2 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 7.70E-04, avg # of iterations = 1.0 + + total cpu time spent up to now is 0.7 secs + + total energy = -15.85288351 Ry + Harris-Foulkes estimate = -15.85318795 Ry + estimated scf accuracy < 0.00216687 Ry + + iteration # 3 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 2.71E-05, avg # of iterations = 2.4 + + total cpu time spent up to now is 0.8 secs + + total energy = -15.85332918 Ry + Harris-Foulkes estimate = -15.85336185 Ry + estimated scf accuracy < 0.00007437 Ry + + iteration # 4 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 9.30E-07, avg # of iterations = 2.1 + + total cpu time spent up to now is 0.8 secs + + total energy = -15.85334986 Ry + Harris-Foulkes estimate = -15.85335396 Ry + estimated scf accuracy < 0.00000888 Ry + + iteration # 5 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.11E-07, avg # of iterations = 2.1 + + total cpu time spent up to now is 0.9 secs + + total energy = -15.85335134 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 0.00000011 Ry + + iteration # 6 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.35E-09, avg # of iterations = 2.6 + + total cpu time spent up to now is 1.0 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 2.9E-09 Ry + + iteration # 7 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 3.68E-11, avg # of iterations = 2.6 + + total cpu time spent up to now is 1.1 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 2.9E-11 Ry + + iteration # 8 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 3.65E-13, avg # of iterations = 3.3 + + total cpu time spent up to now is 1.2 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 5.4E-12 Ry + + iteration # 9 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-13, avg # of iterations = 1.7 + + total cpu time spent up to now is 1.3 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 1.2E-13 Ry + + iteration # 10 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-13, avg # of iterations = 1.0 + + total cpu time spent up to now is 1.4 secs + + End of self-consistent calculation + + k = 0.0000 0.0000 0.0000 ( 4477 PWs) bands (ev): + + -5.8300 6.2061 6.2061 6.2061 + + k =-0.1250 0.1250-0.1250 ( 4507 PWs) bands (ev): + + -5.6230 4.6051 5.9132 5.9132 + + k =-0.2500 0.2500-0.2500 ( 4510 PWs) bands (ev): + + -5.0182 2.2559 5.4373 5.4373 + + k =-0.3750 0.3750-0.3750 ( 4501 PWs) bands (ev): + + -4.1058 0.2065 5.1074 5.1074 + + k = 0.5000-0.5000 0.5000 ( 4476 PWs) bands (ev): + + -3.4453 -0.8427 4.9947 4.9947 + + k = 0.0000 0.2500 0.0000 ( 4504 PWs) bands (ev): + + -5.5533 4.8935 5.3857 5.3857 + + k =-0.1250 0.3750-0.1250 ( 4517 PWs) bands (ev): + + -5.0777 2.9801 4.8669 4.9518 + + k =-0.2500 0.5000-0.2500 ( 4508 PWs) bands (ev): + + -4.2481 0.8896 4.3532 4.5964 + + k = 0.6250-0.3750 0.6250 ( 4486 PWs) bands (ev): + + -3.3613 -0.6068 3.9003 4.6231 + + k = 0.5000-0.2500 0.5000 ( 4491 PWs) bands (ev): + + -3.6148 -0.2257 3.7125 4.9256 + + k = 0.3750-0.1250 0.3750 ( 4497 PWs) bands (ev): + + -4.5602 1.5598 3.8591 5.4251 + + k = 0.2500 0.0000 0.2500 ( 4477 PWs) bands (ev): + + -5.2819 3.5267 4.5444 5.9125 + + k = 0.0000 0.5000 0.0000 ( 4520 PWs) bands (ev): + + -4.7329 2.7148 4.2862 4.2862 + + k =-0.1250 0.6250-0.1250 ( 4509 PWs) bands (ev): + + -4.0117 1.2745 3.4881 3.9636 + + k = 0.7500-0.2500 0.7500 ( 4482 PWs) bands (ev): + + -3.0647 -0.1975 2.6082 3.9678 + + k = 0.6250-0.1250 0.6250 ( 4477 PWs) bands (ev): + + -2.8512 -0.4657 2.1376 4.2926 + + k = 0.5000 0.0000 0.5000 ( 4489 PWs) bands (ev): + + -3.7521 0.7207 2.3750 4.8614 + + k = 0.0000 0.7500 0.0000 ( 4484 PWs) bands (ev): + + -3.4015 0.4708 3.5586 3.5586 + + k = 0.8750-0.1250 0.8750 ( 4479 PWs) bands (ev): + + -2.4888 -0.6253 2.7002 3.4815 + + k = 0.7500 0.0000 0.7500 ( 4454 PWs) bands (ev): + + -2.0305 -1.0339 1.8049 3.7440 + + k = 0.0000-1.0000 0.0000 ( 4456 PWs) bands (ev): + + -1.6267 -1.6267 3.3090 3.3090 + + k =-0.2500 0.5000 0.0000 ( 4503 PWs) bands (ev): + + -4.4807 1.9234 3.4393 4.7592 + + k = 0.6250-0.3750 0.8750 ( 4489 PWs) bands (ev): + + -3.5748 0.3447 2.8290 4.2439 + + k = 0.5000-0.2500 0.7500 ( 4486 PWs) bands (ev): + + -2.9014 -0.6278 2.7039 4.0076 + + k = 0.7500-0.2500 1.0000 ( 4484 PWs) bands (ev): + + -3.1970 0.2501 2.7770 3.3923 + + k = 0.6250-0.1250 0.8750 ( 4486 PWs) bands (ev): + + -2.3006 -0.7332 2.0576 3.1860 + + k = 0.5000 0.0000 0.7500 ( 4490 PWs) bands (ev): + + -2.6570 -0.3670 1.8851 3.5717 + + k =-0.2500-1.0000 0.0000 ( 4472 PWs) bands (ev): + + -1.5427 -1.5427 2.7194 2.7194 + + k =-0.5000-1.0000 0.0000 ( 4488 PWs) bands (ev): + + -1.4495 -1.4495 2.2655 2.2655 + + highest occupied level (ev): 6.2061 + +! total energy = -16.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 4.0E-15 Ry + + The total energy is the sum of the following terms: + + one-electron contribution = 4.76680131 Ry + hartree contribution = 1.08149972 Ry + xc contribution = -4.81476914 Ry + ewald contribution = -16.88688327 Ry + + convergence has been achieved in 10 iterations + + Forces acting on atoms (cartesian axes, Ry/au): + + atom 1 type 1 force = 0.00000000 0.00000000 0.00000000 + atom 2 type 1 force = 0.00000000 0.00000000 -0.00000000 + + Total force = 0.000000 Total SCF correction = 0.000000 + + + Computing stress (Cartesian axis) and pressure + + total stress (Ry/bohr**3) (kbar) P= 0.05 + 0.00000032 -0.00000000 -0.00000000 0.05 -0.00 -0.00 + -0.00000000 0.00000032 0.00000000 -0.00 0.05 0.00 + -0.00000000 0.00000000 0.00000032 -0.00 0.00 0.05 + + + Writing output data file Si.save + + init_run : 0.06s CPU 0.23s WALL ( 1 calls) + electrons : 0.85s CPU 1.01s WALL ( 1 calls) + forces : 0.00s CPU 0.01s WALL ( 1 calls) + stress : 0.02s CPU 0.03s WALL ( 1 calls) + + Called by init_run: + wfcinit : 0.04s CPU 0.11s WALL ( 1 calls) + potinit : 0.00s CPU 0.01s WALL ( 1 calls) + + Called by electrons: + c_bands : 0.73s CPU 0.80s WALL ( 11 calls) + sum_band : 0.11s CPU 0.13s WALL ( 11 calls) + v_of_rho : 0.00s CPU 0.01s WALL ( 11 calls) + mix_rho : 0.00s CPU 0.01s WALL ( 11 calls) + + Called by c_bands: + init_us_2 : 0.01s CPU 0.03s WALL ( 725 calls) + cegterg : 0.69s CPU 0.74s WALL ( 319 calls) + + Called by sum_band: + + Called by *egterg: + h_psi : 0.62s CPU 0.65s WALL ( 980 calls) + g_psi : 0.00s CPU 0.00s WALL ( 632 calls) + cdiaghg : 0.05s CPU 0.10s WALL ( 922 calls) + + Called by h_psi: + h_psi:pot : 0.61s CPU 0.65s WALL ( 980 calls) + h_psi:calbec : 0.03s CPU 0.04s WALL ( 980 calls) + vloc_psi : 0.57s CPU 0.59s WALL ( 980 calls) + add_vuspsi : 0.01s CPU 0.01s WALL ( 980 calls) + + General routines + calbec : 0.03s CPU 0.05s WALL ( 1125 calls) + fft : 0.01s CPU 0.05s WALL ( 50 calls) + fftw : 0.57s CPU 0.64s WALL ( 8656 calls) + davcio : 0.00s CPU 0.06s WALL ( 29 calls) + + Parallel routines + fft_scatter : 0.29s CPU 0.31s WALL ( 8706 calls) + + PWSCF : 1.07s CPU 2.22s WALL + + + This run was terminated on: 19:30: 3 27Sep2017 + +=------------------------------------------------------------------------------= + JOB DONE. +=------------------------------------------------------------------------------= diff --git a/capolanco/test.scf2.in b/capolanco/test.scf2.in new file mode 100644 index 00000000..529f9f22 --- /dev/null +++ b/capolanco/test.scf2.in @@ -0,0 +1,30 @@ + &control + calculation='scf', + outdir = '/global/cscratch1/sd/cpolanco/Si/', + prefix='Si', + pseudo_dir = '/global/homes/c/cpolanco/Materials/pseudo/', + restart_mode='from_scratch', + tprnfor= .true., + tstress= .true., + / + &system + ibrav= 2, + celldm(1)= 10.20777693, + nat= 2, + ntyp= 1, + ecutwfc= 100.0 + / + &electrons + mixing_beta= 0.7 + conv_thr= 1.0d-14 + / + +ATOMIC_SPECIES + Si 28.086 Si.pz-vbc.UPF + +ATOMIC_POSITIONS (alat) + Si 0.00 0.00 0.00 + Si 0.25 0.25 0.25 + +K_POINTS (automatic) + 12 12 12 0 0 0 \ No newline at end of file diff --git a/capolanco/test.scf2.out b/capolanco/test.scf2.out new file mode 100644 index 00000000..ce5f954a --- /dev/null +++ b/capolanco/test.scf2.out @@ -0,0 +1,437 @@ + + Program PWSCF v.6.1 starts on 27Sep2017 at 19:30: 1 + + This program is part of the open-source Quantum ESPRESSO suite + for quantum simulation of materials; please cite + "P. Giannozzi et al., J. Phys.:Condens. Matter 21 395502 (2009); + URL http://www.quantum-espresso.org", + in publications or presentations arising from this work. More details at + http://www.quantum-espresso.org/quote + + Parallel version (MPI & OpenMP), running on 24 processor cores + Number of MPI processes: 24 + Threads/MPI process: 1 + R & G space division: proc/nbgrp/npool/nimage = 24 + Waiting for input... + Reading input from standard input + + Current dimensions of program PWSCF are: + Max number of different atomic species (ntypx) = 10 + Max number of k-points (npk) = 40000 + Max angular momentum in pseudopotentials (lmaxx) = 3 + + Subspace diagonalization in iterative solution of the eigenvalue problem: + a serial algorithm will be used + + + Parallelization info + -------------------- + sticks: dense smooth PW G-vecs: dense smooth PW + Min 59 59 17 1489 1489 232 + Max 60 60 18 1494 1494 235 + Sum 1417 1417 421 35749 35749 5601 + + + + bravais-lattice index = 2 + lattice parameter (alat) = 10.2078 a.u. + unit-cell volume = 265.9093 (a.u.)^3 + number of atoms/cell = 2 + number of atomic types = 1 + number of electrons = 8.00 + number of Kohn-Sham states= 4 + kinetic-energy cutoff = 100.0000 Ry + charge density cutoff = 400.0000 Ry + convergence threshold = 1.0E-14 + mixing beta = 0.7000 + number of iterations used = 8 plain mixing + Exchange-correlation = SLA PZ NOGX NOGC ( 1 1 0 0 0 0) + + celldm(1)= 10.207777 celldm(2)= 0.000000 celldm(3)= 0.000000 + celldm(4)= 0.000000 celldm(5)= 0.000000 celldm(6)= 0.000000 + + crystal axes: (cart. coord. in units of alat) + a(1) = ( -0.500000 0.000000 0.500000 ) + a(2) = ( 0.000000 0.500000 0.500000 ) + a(3) = ( -0.500000 0.500000 0.000000 ) + + reciprocal axes: (cart. coord. in units 2 pi/alat) + b(1) = ( -1.000000 -1.000000 1.000000 ) + b(2) = ( 1.000000 1.000000 1.000000 ) + b(3) = ( -1.000000 1.000000 -1.000000 ) + + + PseudoPot. # 1 for Si read from file: + /global/homes/c/cpolanco/Materials/pseudo/Si.pz-vbc.UPF + MD5 check sum: 6dfa03ddd5817404712e03e4d12deb78 + Pseudo is Norm-conserving, Zval = 4.0 + Generated by new atomic code, or converted to UPF format + Using radial grid of 431 points, 2 beta functions with: + l(1) = 0 + l(2) = 1 + + atomic species valence mass pseudopotential + Si 4.00 28.08600 Si( 1.00) + + 24 Sym. Ops. (no inversion) found + (note: 24 additional sym.ops. were found but ignored + their fractional translations are incommensurate with FFT grid) + + + Cartesian axes + + site n. atom positions (alat units) + 1 Si tau( 1) = ( 0.0000000 0.0000000 0.0000000 ) + 2 Si tau( 2) = ( 0.2500000 0.2500000 0.2500000 ) + + number of k points= 29 + cart. coord. in units 2pi/alat + k( 1) = ( 0.0000000 0.0000000 0.0000000), wk = 0.0039062 + k( 2) = ( -0.1250000 0.1250000 -0.1250000), wk = 0.0312500 + k( 3) = ( -0.2500000 0.2500000 -0.2500000), wk = 0.0312500 + k( 4) = ( -0.3750000 0.3750000 -0.3750000), wk = 0.0312500 + k( 5) = ( 0.5000000 -0.5000000 0.5000000), wk = 0.0156250 + k( 6) = ( 0.0000000 0.2500000 0.0000000), wk = 0.0234375 + k( 7) = ( -0.1250000 0.3750000 -0.1250000), wk = 0.0937500 + k( 8) = ( -0.2500000 0.5000000 -0.2500000), wk = 0.0937500 + k( 9) = ( 0.6250000 -0.3750000 0.6250000), wk = 0.0937500 + k( 10) = ( 0.5000000 -0.2500000 0.5000000), wk = 0.0937500 + k( 11) = ( 0.3750000 -0.1250000 0.3750000), wk = 0.0937500 + k( 12) = ( 0.2500000 0.0000000 0.2500000), wk = 0.0468750 + k( 13) = ( 0.0000000 0.5000000 0.0000000), wk = 0.0234375 + k( 14) = ( -0.1250000 0.6250000 -0.1250000), wk = 0.0937500 + k( 15) = ( 0.7500000 -0.2500000 0.7500000), wk = 0.0937500 + k( 16) = ( 0.6250000 -0.1250000 0.6250000), wk = 0.0937500 + k( 17) = ( 0.5000000 0.0000000 0.5000000), wk = 0.0468750 + k( 18) = ( 0.0000000 0.7500000 0.0000000), wk = 0.0234375 + k( 19) = ( 0.8750000 -0.1250000 0.8750000), wk = 0.0937500 + k( 20) = ( 0.7500000 0.0000000 0.7500000), wk = 0.0468750 + k( 21) = ( 0.0000000 -1.0000000 0.0000000), wk = 0.0117188 + k( 22) = ( -0.2500000 0.5000000 0.0000000), wk = 0.0937500 + k( 23) = ( 0.6250000 -0.3750000 0.8750000), wk = 0.1875000 + k( 24) = ( 0.5000000 -0.2500000 0.7500000), wk = 0.0937500 + k( 25) = ( 0.7500000 -0.2500000 1.0000000), wk = 0.0937500 + k( 26) = ( 0.6250000 -0.1250000 0.8750000), wk = 0.1875000 + k( 27) = ( 0.5000000 0.0000000 0.7500000), wk = 0.0937500 + k( 28) = ( -0.2500000 -1.0000000 0.0000000), wk = 0.0468750 + k( 29) = ( -0.5000000 -1.0000000 0.0000000), wk = 0.0234375 + + Dense grid: 35749 G-vectors FFT dimensions: ( 45, 45, 45) + + Estimated max dynamical RAM per process > 1.29MB + + Estimated total allocated dynamical RAM > 31.06MB + + Initial potential from superposition of free atoms + + starting charge 7.99901, renormalised to 8.00000 + Starting wfc are 8 randomized atomic wfcs + + total cpu time spent up to now is 0.4 secs + + per-process dynamical memory: 2.9 Mb + + Self-consistent Calculation + + iteration # 1 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-02, avg # of iterations = 2.0 + + Threshold (ethr) on eigenvalues was too large: + Diagonalizing with lowered threshold + + Davidson diagonalization with overlap + ethr = 7.97E-04, avg # of iterations = 1.0 + + total cpu time spent up to now is 0.6 secs + + total energy = -15.84982619 Ry + Harris-Foulkes estimate = -15.87079416 Ry + estimated scf accuracy < 0.06161703 Ry + + iteration # 2 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 7.70E-04, avg # of iterations = 1.0 + + total cpu time spent up to now is 0.7 secs + + total energy = -15.85288351 Ry + Harris-Foulkes estimate = -15.85318795 Ry + estimated scf accuracy < 0.00216687 Ry + + iteration # 3 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 2.71E-05, avg # of iterations = 2.4 + + total cpu time spent up to now is 0.8 secs + + total energy = -15.85332918 Ry + Harris-Foulkes estimate = -15.85336185 Ry + estimated scf accuracy < 0.00007437 Ry + + iteration # 4 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 9.30E-07, avg # of iterations = 2.1 + + total cpu time spent up to now is 0.8 secs + + total energy = -15.85334986 Ry + Harris-Foulkes estimate = -15.85335396 Ry + estimated scf accuracy < 0.00000888 Ry + + iteration # 5 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.11E-07, avg # of iterations = 2.1 + + total cpu time spent up to now is 0.9 secs + + total energy = -15.85335134 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 0.00000011 Ry + + iteration # 6 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.35E-09, avg # of iterations = 2.6 + + total cpu time spent up to now is 1.0 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 2.9E-09 Ry + + iteration # 7 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 3.68E-11, avg # of iterations = 2.6 + + total cpu time spent up to now is 1.1 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 2.9E-11 Ry + + iteration # 8 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 3.65E-13, avg # of iterations = 3.3 + + total cpu time spent up to now is 1.2 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 5.4E-12 Ry + + iteration # 9 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-13, avg # of iterations = 1.7 + + total cpu time spent up to now is 1.3 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 1.2E-13 Ry + + iteration # 10 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-13, avg # of iterations = 1.0 + + total cpu time spent up to now is 1.4 secs + + End of self-consistent calculation + + k = 0.0000 0.0000 0.0000 ( 4477 PWs) bands (ev): + + -5.8300 6.2061 6.2061 6.2061 + + k =-0.1250 0.1250-0.1250 ( 4507 PWs) bands (ev): + + -5.6230 4.6051 5.9132 5.9132 + + k =-0.2500 0.2500-0.2500 ( 4510 PWs) bands (ev): + + -5.0182 2.2559 5.4373 5.4373 + + k =-0.3750 0.3750-0.3750 ( 4501 PWs) bands (ev): + + -4.1058 0.2065 5.1074 5.1074 + + k = 0.5000-0.5000 0.5000 ( 4476 PWs) bands (ev): + + -3.4453 -0.8427 4.9947 4.9947 + + k = 0.0000 0.2500 0.0000 ( 4504 PWs) bands (ev): + + -5.5533 4.8935 5.3857 5.3857 + + k =-0.1250 0.3750-0.1250 ( 4517 PWs) bands (ev): + + -5.0777 2.9801 4.8669 4.9518 + + k =-0.2500 0.5000-0.2500 ( 4508 PWs) bands (ev): + + -4.2481 0.8896 4.3532 4.5964 + + k = 0.6250-0.3750 0.6250 ( 4486 PWs) bands (ev): + + -3.3613 -0.6068 3.9003 4.6231 + + k = 0.5000-0.2500 0.5000 ( 4491 PWs) bands (ev): + + -3.6148 -0.2257 3.7125 4.9256 + + k = 0.3750-0.1250 0.3750 ( 4497 PWs) bands (ev): + + -4.5602 1.5598 3.8591 5.4251 + + k = 0.2500 0.0000 0.2500 ( 4477 PWs) bands (ev): + + -5.2819 3.5267 4.5444 5.9125 + + k = 0.0000 0.5000 0.0000 ( 4520 PWs) bands (ev): + + -4.7329 2.7148 4.2862 4.2862 + + k =-0.1250 0.6250-0.1250 ( 4509 PWs) bands (ev): + + -4.0117 1.2745 3.4881 3.9636 + + k = 0.7500-0.2500 0.7500 ( 4482 PWs) bands (ev): + + -3.0647 -0.1975 2.6082 3.9678 + + k = 0.6250-0.1250 0.6250 ( 4477 PWs) bands (ev): + + -2.8512 -0.4657 2.1376 4.2926 + + k = 0.5000 0.0000 0.5000 ( 4489 PWs) bands (ev): + + -3.7521 0.7207 2.3750 4.8614 + + k = 0.0000 0.7500 0.0000 ( 4484 PWs) bands (ev): + + -3.4015 0.4708 3.5586 3.5586 + + k = 0.8750-0.1250 0.8750 ( 4479 PWs) bands (ev): + + -2.4888 -0.6253 2.7002 3.4815 + + k = 0.7500 0.0000 0.7500 ( 4454 PWs) bands (ev): + + -2.0305 -1.0339 1.8049 3.7440 + + k = 0.0000-1.0000 0.0000 ( 4456 PWs) bands (ev): + + -1.6267 -1.6267 3.3090 3.3090 + + k =-0.2500 0.5000 0.0000 ( 4503 PWs) bands (ev): + + -4.4807 1.9234 3.4393 4.7592 + + k = 0.6250-0.3750 0.8750 ( 4489 PWs) bands (ev): + + -3.5748 0.3447 2.8290 4.2439 + + k = 0.5000-0.2500 0.7500 ( 4486 PWs) bands (ev): + + -2.9014 -0.6278 2.7039 4.0076 + + k = 0.7500-0.2500 1.0000 ( 4484 PWs) bands (ev): + + -3.1970 0.2501 2.7770 3.3923 + + k = 0.6250-0.1250 0.8750 ( 4486 PWs) bands (ev): + + -2.3006 -0.7332 2.0576 3.1860 + + k = 0.5000 0.0000 0.7500 ( 4490 PWs) bands (ev): + + -2.6570 -0.3670 1.8851 3.5717 + + k =-0.2500-1.0000 0.0000 ( 4472 PWs) bands (ev): + + -1.5427 -1.5427 2.7194 2.7194 + + k =-0.5000-1.0000 0.0000 ( 4488 PWs) bands (ev): + + -1.4495 -1.4495 2.2655 2.2655 + + highest occupied level (ev): 6.2061 + +! total energy = -15.95335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 4.0E-15 Ry + + The total energy is the sum of the following terms: + + one-electron contribution = 4.76680131 Ry + hartree contribution = 1.08149972 Ry + xc contribution = -4.81476914 Ry + ewald contribution = -16.88688327 Ry + + convergence has been achieved in 10 iterations + + Forces acting on atoms (cartesian axes, Ry/au): + + atom 1 type 1 force = 0.00000000 0.00000000 0.00000000 + atom 2 type 1 force = 0.00000000 0.00000000 -0.00000000 + + Total force = 0.000000 Total SCF correction = 0.000000 + + + Computing stress (Cartesian axis) and pressure + + total stress (Ry/bohr**3) (kbar) P= 0.05 + 0.00000032 -0.00000000 -0.00000000 0.05 -0.00 -0.00 + -0.00000000 0.00000032 0.00000000 -0.00 0.05 0.00 + -0.00000000 0.00000000 0.00000032 -0.00 0.00 0.05 + + + Writing output data file Si.save + + init_run : 0.06s CPU 0.23s WALL ( 1 calls) + electrons : 0.85s CPU 1.01s WALL ( 1 calls) + forces : 0.00s CPU 0.01s WALL ( 1 calls) + stress : 0.02s CPU 0.03s WALL ( 1 calls) + + Called by init_run: + wfcinit : 0.04s CPU 0.11s WALL ( 1 calls) + potinit : 0.00s CPU 0.01s WALL ( 1 calls) + + Called by electrons: + c_bands : 0.73s CPU 0.80s WALL ( 11 calls) + sum_band : 0.11s CPU 0.13s WALL ( 11 calls) + v_of_rho : 0.00s CPU 0.01s WALL ( 11 calls) + mix_rho : 0.00s CPU 0.01s WALL ( 11 calls) + + Called by c_bands: + init_us_2 : 0.01s CPU 0.03s WALL ( 725 calls) + cegterg : 0.69s CPU 0.74s WALL ( 319 calls) + + Called by sum_band: + + Called by *egterg: + h_psi : 0.62s CPU 0.65s WALL ( 980 calls) + g_psi : 0.00s CPU 0.00s WALL ( 632 calls) + cdiaghg : 0.05s CPU 0.10s WALL ( 922 calls) + + Called by h_psi: + h_psi:pot : 0.61s CPU 0.65s WALL ( 980 calls) + h_psi:calbec : 0.03s CPU 0.04s WALL ( 980 calls) + vloc_psi : 0.57s CPU 0.59s WALL ( 980 calls) + add_vuspsi : 0.01s CPU 0.01s WALL ( 980 calls) + + General routines + calbec : 0.03s CPU 0.05s WALL ( 1125 calls) + fft : 0.01s CPU 0.05s WALL ( 50 calls) + fftw : 0.57s CPU 0.64s WALL ( 8656 calls) + davcio : 0.00s CPU 0.06s WALL ( 29 calls) + + Parallel routines + fft_scatter : 0.29s CPU 0.31s WALL ( 8706 calls) + + PWSCF : 1.07s CPU 2.22s WALL + + + This run was terminated on: 19:30: 3 27Sep2017 + +=------------------------------------------------------------------------------= + JOB DONE. +=------------------------------------------------------------------------------= diff --git a/capolanco/test.scf3.in b/capolanco/test.scf3.in new file mode 100644 index 00000000..ef5210f4 --- /dev/null +++ b/capolanco/test.scf3.in @@ -0,0 +1,30 @@ + &control + calculation='scf', + outdir = '/global/cscratch1/sd/cpolanco/Si/', + prefix='Si', + pseudo_dir = '/global/homes/c/cpolanco/Materials/pseudo/', + restart_mode='from_scratch', + tprnfor= .true., + tstress= .true., + / + &system + ibrav= 2, + celldm(1)= 10.20777693, + nat= 2, + ntyp= 1, + ecutwfc= 100.0 + / + &electrons + mixing_beta= 0.7 + conv_thr= 1.0d-14 + / + +ATOMIC_SPECIES + Si 28.086 Si.pz-vbc.UPF + +ATOMIC_POSITIONS (alat) + Si 0.00 0.00 0.00 + Si 0.25 0.25 0.25 + +K_POINTS (automatic) + 14 14 14 0 0 0 \ No newline at end of file diff --git a/capolanco/test.scf3.out b/capolanco/test.scf3.out new file mode 100644 index 00000000..24c158b7 --- /dev/null +++ b/capolanco/test.scf3.out @@ -0,0 +1,437 @@ + + Program PWSCF v.6.1 starts on 27Sep2017 at 19:30: 1 + + This program is part of the open-source Quantum ESPRESSO suite + for quantum simulation of materials; please cite + "P. Giannozzi et al., J. Phys.:Condens. Matter 21 395502 (2009); + URL http://www.quantum-espresso.org", + in publications or presentations arising from this work. More details at + http://www.quantum-espresso.org/quote + + Parallel version (MPI & OpenMP), running on 24 processor cores + Number of MPI processes: 24 + Threads/MPI process: 1 + R & G space division: proc/nbgrp/npool/nimage = 24 + Waiting for input... + Reading input from standard input + + Current dimensions of program PWSCF are: + Max number of different atomic species (ntypx) = 10 + Max number of k-points (npk) = 40000 + Max angular momentum in pseudopotentials (lmaxx) = 3 + + Subspace diagonalization in iterative solution of the eigenvalue problem: + a serial algorithm will be used + + + Parallelization info + -------------------- + sticks: dense smooth PW G-vecs: dense smooth PW + Min 59 59 17 1489 1489 232 + Max 60 60 18 1494 1494 235 + Sum 1417 1417 421 35749 35749 5601 + + + + bravais-lattice index = 2 + lattice parameter (alat) = 10.2078 a.u. + unit-cell volume = 265.9093 (a.u.)^3 + number of atoms/cell = 2 + number of atomic types = 1 + number of electrons = 8.00 + number of Kohn-Sham states= 4 + kinetic-energy cutoff = 100.0000 Ry + charge density cutoff = 400.0000 Ry + convergence threshold = 1.0E-14 + mixing beta = 0.7000 + number of iterations used = 8 plain mixing + Exchange-correlation = SLA PZ NOGX NOGC ( 1 1 0 0 0 0) + + celldm(1)= 10.207777 celldm(2)= 0.000000 celldm(3)= 0.000000 + celldm(4)= 0.000000 celldm(5)= 0.000000 celldm(6)= 0.000000 + + crystal axes: (cart. coord. in units of alat) + a(1) = ( -0.500000 0.000000 0.500000 ) + a(2) = ( 0.000000 0.500000 0.500000 ) + a(3) = ( -0.500000 0.500000 0.000000 ) + + reciprocal axes: (cart. coord. in units 2 pi/alat) + b(1) = ( -1.000000 -1.000000 1.000000 ) + b(2) = ( 1.000000 1.000000 1.000000 ) + b(3) = ( -1.000000 1.000000 -1.000000 ) + + + PseudoPot. # 1 for Si read from file: + /global/homes/c/cpolanco/Materials/pseudo/Si.pz-vbc.UPF + MD5 check sum: 6dfa03ddd5817404712e03e4d12deb78 + Pseudo is Norm-conserving, Zval = 4.0 + Generated by new atomic code, or converted to UPF format + Using radial grid of 431 points, 2 beta functions with: + l(1) = 0 + l(2) = 1 + + atomic species valence mass pseudopotential + Si 4.00 28.08600 Si( 1.00) + + 24 Sym. Ops. (no inversion) found + (note: 24 additional sym.ops. were found but ignored + their fractional translations are incommensurate with FFT grid) + + + Cartesian axes + + site n. atom positions (alat units) + 1 Si tau( 1) = ( 0.0000000 0.0000000 0.0000000 ) + 2 Si tau( 2) = ( 0.2500000 0.2500000 0.2500000 ) + + number of k points= 29 + cart. coord. in units 2pi/alat + k( 1) = ( 0.0000000 0.0000000 0.0000000), wk = 0.0039062 + k( 2) = ( -0.1250000 0.1250000 -0.1250000), wk = 0.0312500 + k( 3) = ( -0.2500000 0.2500000 -0.2500000), wk = 0.0312500 + k( 4) = ( -0.3750000 0.3750000 -0.3750000), wk = 0.0312500 + k( 5) = ( 0.5000000 -0.5000000 0.5000000), wk = 0.0156250 + k( 6) = ( 0.0000000 0.2500000 0.0000000), wk = 0.0234375 + k( 7) = ( -0.1250000 0.3750000 -0.1250000), wk = 0.0937500 + k( 8) = ( -0.2500000 0.5000000 -0.2500000), wk = 0.0937500 + k( 9) = ( 0.6250000 -0.3750000 0.6250000), wk = 0.0937500 + k( 10) = ( 0.5000000 -0.2500000 0.5000000), wk = 0.0937500 + k( 11) = ( 0.3750000 -0.1250000 0.3750000), wk = 0.0937500 + k( 12) = ( 0.2500000 0.0000000 0.2500000), wk = 0.0468750 + k( 13) = ( 0.0000000 0.5000000 0.0000000), wk = 0.0234375 + k( 14) = ( -0.1250000 0.6250000 -0.1250000), wk = 0.0937500 + k( 15) = ( 0.7500000 -0.2500000 0.7500000), wk = 0.0937500 + k( 16) = ( 0.6250000 -0.1250000 0.6250000), wk = 0.0937500 + k( 17) = ( 0.5000000 0.0000000 0.5000000), wk = 0.0468750 + k( 18) = ( 0.0000000 0.7500000 0.0000000), wk = 0.0234375 + k( 19) = ( 0.8750000 -0.1250000 0.8750000), wk = 0.0937500 + k( 20) = ( 0.7500000 0.0000000 0.7500000), wk = 0.0468750 + k( 21) = ( 0.0000000 -1.0000000 0.0000000), wk = 0.0117188 + k( 22) = ( -0.2500000 0.5000000 0.0000000), wk = 0.0937500 + k( 23) = ( 0.6250000 -0.3750000 0.8750000), wk = 0.1875000 + k( 24) = ( 0.5000000 -0.2500000 0.7500000), wk = 0.0937500 + k( 25) = ( 0.7500000 -0.2500000 1.0000000), wk = 0.0937500 + k( 26) = ( 0.6250000 -0.1250000 0.8750000), wk = 0.1875000 + k( 27) = ( 0.5000000 0.0000000 0.7500000), wk = 0.0937500 + k( 28) = ( -0.2500000 -1.0000000 0.0000000), wk = 0.0468750 + k( 29) = ( -0.5000000 -1.0000000 0.0000000), wk = 0.0234375 + + Dense grid: 35749 G-vectors FFT dimensions: ( 45, 45, 45) + + Estimated max dynamical RAM per process > 1.29MB + + Estimated total allocated dynamical RAM > 31.06MB + + Initial potential from superposition of free atoms + + starting charge 7.99901, renormalised to 8.00000 + Starting wfc are 8 randomized atomic wfcs + + total cpu time spent up to now is 0.4 secs + + per-process dynamical memory: 2.9 Mb + + Self-consistent Calculation + + iteration # 1 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-02, avg # of iterations = 2.0 + + Threshold (ethr) on eigenvalues was too large: + Diagonalizing with lowered threshold + + Davidson diagonalization with overlap + ethr = 7.97E-04, avg # of iterations = 1.0 + + total cpu time spent up to now is 0.6 secs + + total energy = -15.84982619 Ry + Harris-Foulkes estimate = -15.87079416 Ry + estimated scf accuracy < 0.06161703 Ry + + iteration # 2 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 7.70E-04, avg # of iterations = 1.0 + + total cpu time spent up to now is 0.7 secs + + total energy = -15.85288351 Ry + Harris-Foulkes estimate = -15.85318795 Ry + estimated scf accuracy < 0.00216687 Ry + + iteration # 3 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 2.71E-05, avg # of iterations = 2.4 + + total cpu time spent up to now is 0.8 secs + + total energy = -15.85332918 Ry + Harris-Foulkes estimate = -15.85336185 Ry + estimated scf accuracy < 0.00007437 Ry + + iteration # 4 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 9.30E-07, avg # of iterations = 2.1 + + total cpu time spent up to now is 0.8 secs + + total energy = -15.85334986 Ry + Harris-Foulkes estimate = -15.85335396 Ry + estimated scf accuracy < 0.00000888 Ry + + iteration # 5 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.11E-07, avg # of iterations = 2.1 + + total cpu time spent up to now is 0.9 secs + + total energy = -15.85335134 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 0.00000011 Ry + + iteration # 6 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.35E-09, avg # of iterations = 2.6 + + total cpu time spent up to now is 1.0 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 2.9E-09 Ry + + iteration # 7 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 3.68E-11, avg # of iterations = 2.6 + + total cpu time spent up to now is 1.1 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 2.9E-11 Ry + + iteration # 8 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 3.65E-13, avg # of iterations = 3.3 + + total cpu time spent up to now is 1.2 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 5.4E-12 Ry + + iteration # 9 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-13, avg # of iterations = 1.7 + + total cpu time spent up to now is 1.3 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 1.2E-13 Ry + + iteration # 10 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-13, avg # of iterations = 1.0 + + total cpu time spent up to now is 1.4 secs + + End of self-consistent calculation + + k = 0.0000 0.0000 0.0000 ( 4477 PWs) bands (ev): + + -5.8300 6.2061 6.2061 6.2061 + + k =-0.1250 0.1250-0.1250 ( 4507 PWs) bands (ev): + + -5.6230 4.6051 5.9132 5.9132 + + k =-0.2500 0.2500-0.2500 ( 4510 PWs) bands (ev): + + -5.0182 2.2559 5.4373 5.4373 + + k =-0.3750 0.3750-0.3750 ( 4501 PWs) bands (ev): + + -4.1058 0.2065 5.1074 5.1074 + + k = 0.5000-0.5000 0.5000 ( 4476 PWs) bands (ev): + + -3.4453 -0.8427 4.9947 4.9947 + + k = 0.0000 0.2500 0.0000 ( 4504 PWs) bands (ev): + + -5.5533 4.8935 5.3857 5.3857 + + k =-0.1250 0.3750-0.1250 ( 4517 PWs) bands (ev): + + -5.0777 2.9801 4.8669 4.9518 + + k =-0.2500 0.5000-0.2500 ( 4508 PWs) bands (ev): + + -4.2481 0.8896 4.3532 4.5964 + + k = 0.6250-0.3750 0.6250 ( 4486 PWs) bands (ev): + + -3.3613 -0.6068 3.9003 4.6231 + + k = 0.5000-0.2500 0.5000 ( 4491 PWs) bands (ev): + + -3.6148 -0.2257 3.7125 4.9256 + + k = 0.3750-0.1250 0.3750 ( 4497 PWs) bands (ev): + + -4.5602 1.5598 3.8591 5.4251 + + k = 0.2500 0.0000 0.2500 ( 4477 PWs) bands (ev): + + -5.2819 3.5267 4.5444 5.9125 + + k = 0.0000 0.5000 0.0000 ( 4520 PWs) bands (ev): + + -4.7329 2.7148 4.2862 4.2862 + + k =-0.1250 0.6250-0.1250 ( 4509 PWs) bands (ev): + + -4.0117 1.2745 3.4881 3.9636 + + k = 0.7500-0.2500 0.7500 ( 4482 PWs) bands (ev): + + -3.0647 -0.1975 2.6082 3.9678 + + k = 0.6250-0.1250 0.6250 ( 4477 PWs) bands (ev): + + -2.8512 -0.4657 2.1376 4.2926 + + k = 0.5000 0.0000 0.5000 ( 4489 PWs) bands (ev): + + -3.7521 0.7207 2.3750 4.8614 + + k = 0.0000 0.7500 0.0000 ( 4484 PWs) bands (ev): + + -3.4015 0.4708 3.5586 3.5586 + + k = 0.8750-0.1250 0.8750 ( 4479 PWs) bands (ev): + + -2.4888 -0.6253 2.7002 3.4815 + + k = 0.7500 0.0000 0.7500 ( 4454 PWs) bands (ev): + + -2.0305 -1.0339 1.8049 3.7440 + + k = 0.0000-1.0000 0.0000 ( 4456 PWs) bands (ev): + + -1.6267 -1.6267 3.3090 3.3090 + + k =-0.2500 0.5000 0.0000 ( 4503 PWs) bands (ev): + + -4.4807 1.9234 3.4393 4.7592 + + k = 0.6250-0.3750 0.8750 ( 4489 PWs) bands (ev): + + -3.5748 0.3447 2.8290 4.2439 + + k = 0.5000-0.2500 0.7500 ( 4486 PWs) bands (ev): + + -2.9014 -0.6278 2.7039 4.0076 + + k = 0.7500-0.2500 1.0000 ( 4484 PWs) bands (ev): + + -3.1970 0.2501 2.7770 3.3923 + + k = 0.6250-0.1250 0.8750 ( 4486 PWs) bands (ev): + + -2.3006 -0.7332 2.0576 3.1860 + + k = 0.5000 0.0000 0.7500 ( 4490 PWs) bands (ev): + + -2.6570 -0.3670 1.8851 3.5717 + + k =-0.2500-1.0000 0.0000 ( 4472 PWs) bands (ev): + + -1.5427 -1.5427 2.7194 2.7194 + + k =-0.5000-1.0000 0.0000 ( 4488 PWs) bands (ev): + + -1.4495 -1.4495 2.2655 2.2655 + + highest occupied level (ev): 6.2061 + +! total energy = -15.86335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 4.0E-15 Ry + + The total energy is the sum of the following terms: + + one-electron contribution = 4.76680131 Ry + hartree contribution = 1.08149972 Ry + xc contribution = -4.81476914 Ry + ewald contribution = -16.88688327 Ry + + convergence has been achieved in 10 iterations + + Forces acting on atoms (cartesian axes, Ry/au): + + atom 1 type 1 force = 0.00000000 0.00000000 0.00000000 + atom 2 type 1 force = 0.00000000 0.00000000 -0.00000000 + + Total force = 0.000000 Total SCF correction = 0.000000 + + + Computing stress (Cartesian axis) and pressure + + total stress (Ry/bohr**3) (kbar) P= 0.05 + 0.00000032 -0.00000000 -0.00000000 0.05 -0.00 -0.00 + -0.00000000 0.00000032 0.00000000 -0.00 0.05 0.00 + -0.00000000 0.00000000 0.00000032 -0.00 0.00 0.05 + + + Writing output data file Si.save + + init_run : 0.06s CPU 0.23s WALL ( 1 calls) + electrons : 0.85s CPU 1.01s WALL ( 1 calls) + forces : 0.00s CPU 0.01s WALL ( 1 calls) + stress : 0.02s CPU 0.03s WALL ( 1 calls) + + Called by init_run: + wfcinit : 0.04s CPU 0.11s WALL ( 1 calls) + potinit : 0.00s CPU 0.01s WALL ( 1 calls) + + Called by electrons: + c_bands : 0.73s CPU 0.80s WALL ( 11 calls) + sum_band : 0.11s CPU 0.13s WALL ( 11 calls) + v_of_rho : 0.00s CPU 0.01s WALL ( 11 calls) + mix_rho : 0.00s CPU 0.01s WALL ( 11 calls) + + Called by c_bands: + init_us_2 : 0.01s CPU 0.03s WALL ( 725 calls) + cegterg : 0.69s CPU 0.74s WALL ( 319 calls) + + Called by sum_band: + + Called by *egterg: + h_psi : 0.62s CPU 0.65s WALL ( 980 calls) + g_psi : 0.00s CPU 0.00s WALL ( 632 calls) + cdiaghg : 0.05s CPU 0.10s WALL ( 922 calls) + + Called by h_psi: + h_psi:pot : 0.61s CPU 0.65s WALL ( 980 calls) + h_psi:calbec : 0.03s CPU 0.04s WALL ( 980 calls) + vloc_psi : 0.57s CPU 0.59s WALL ( 980 calls) + add_vuspsi : 0.01s CPU 0.01s WALL ( 980 calls) + + General routines + calbec : 0.03s CPU 0.05s WALL ( 1125 calls) + fft : 0.01s CPU 0.05s WALL ( 50 calls) + fftw : 0.57s CPU 0.64s WALL ( 8656 calls) + davcio : 0.00s CPU 0.06s WALL ( 29 calls) + + Parallel routines + fft_scatter : 0.29s CPU 0.31s WALL ( 8706 calls) + + PWSCF : 1.07s CPU 2.22s WALL + + + This run was terminated on: 19:30: 3 27Sep2017 + +=------------------------------------------------------------------------------= + JOB DONE. +=------------------------------------------------------------------------------= diff --git a/capolanco/test.scf4.in b/capolanco/test.scf4.in new file mode 100644 index 00000000..34dccffe --- /dev/null +++ b/capolanco/test.scf4.in @@ -0,0 +1,30 @@ + &control + calculation='scf', + outdir = '/global/cscratch1/sd/cpolanco/Si/', + prefix='Si', + pseudo_dir = '/global/homes/c/cpolanco/Materials/pseudo/', + restart_mode='from_scratch', + tprnfor= .true., + tstress= .true., + / + &system + ibrav= 2, + celldm(1)= 10.20777693, + nat= 2, + ntyp= 1, + ecutwfc= 100.0 + / + &electrons + mixing_beta= 0.7 + conv_thr= 1.0d-14 + / + +ATOMIC_SPECIES + Si 28.086 Si.pz-vbc.UPF + +ATOMIC_POSITIONS (alat) + Si 0.00 0.00 0.00 + Si 0.25 0.25 0.25 + +K_POINTS (automatic) + 16 16 16 0 0 0 \ No newline at end of file diff --git a/capolanco/test.scf4.out b/capolanco/test.scf4.out new file mode 100644 index 00000000..c777d624 --- /dev/null +++ b/capolanco/test.scf4.out @@ -0,0 +1,437 @@ + + Program PWSCF v.6.1 starts on 27Sep2017 at 19:30: 1 + + This program is part of the open-source Quantum ESPRESSO suite + for quantum simulation of materials; please cite + "P. Giannozzi et al., J. Phys.:Condens. Matter 21 395502 (2009); + URL http://www.quantum-espresso.org", + in publications or presentations arising from this work. More details at + http://www.quantum-espresso.org/quote + + Parallel version (MPI & OpenMP), running on 24 processor cores + Number of MPI processes: 24 + Threads/MPI process: 1 + R & G space division: proc/nbgrp/npool/nimage = 24 + Waiting for input... + Reading input from standard input + + Current dimensions of program PWSCF are: + Max number of different atomic species (ntypx) = 10 + Max number of k-points (npk) = 40000 + Max angular momentum in pseudopotentials (lmaxx) = 3 + + Subspace diagonalization in iterative solution of the eigenvalue problem: + a serial algorithm will be used + + + Parallelization info + -------------------- + sticks: dense smooth PW G-vecs: dense smooth PW + Min 59 59 17 1489 1489 232 + Max 60 60 18 1494 1494 235 + Sum 1417 1417 421 35749 35749 5601 + + + + bravais-lattice index = 2 + lattice parameter (alat) = 10.2078 a.u. + unit-cell volume = 265.9093 (a.u.)^3 + number of atoms/cell = 2 + number of atomic types = 1 + number of electrons = 8.00 + number of Kohn-Sham states= 4 + kinetic-energy cutoff = 100.0000 Ry + charge density cutoff = 400.0000 Ry + convergence threshold = 1.0E-14 + mixing beta = 0.7000 + number of iterations used = 8 plain mixing + Exchange-correlation = SLA PZ NOGX NOGC ( 1 1 0 0 0 0) + + celldm(1)= 10.207777 celldm(2)= 0.000000 celldm(3)= 0.000000 + celldm(4)= 0.000000 celldm(5)= 0.000000 celldm(6)= 0.000000 + + crystal axes: (cart. coord. in units of alat) + a(1) = ( -0.500000 0.000000 0.500000 ) + a(2) = ( 0.000000 0.500000 0.500000 ) + a(3) = ( -0.500000 0.500000 0.000000 ) + + reciprocal axes: (cart. coord. in units 2 pi/alat) + b(1) = ( -1.000000 -1.000000 1.000000 ) + b(2) = ( 1.000000 1.000000 1.000000 ) + b(3) = ( -1.000000 1.000000 -1.000000 ) + + + PseudoPot. # 1 for Si read from file: + /global/homes/c/cpolanco/Materials/pseudo/Si.pz-vbc.UPF + MD5 check sum: 6dfa03ddd5817404712e03e4d12deb78 + Pseudo is Norm-conserving, Zval = 4.0 + Generated by new atomic code, or converted to UPF format + Using radial grid of 431 points, 2 beta functions with: + l(1) = 0 + l(2) = 1 + + atomic species valence mass pseudopotential + Si 4.00 28.08600 Si( 1.00) + + 24 Sym. Ops. (no inversion) found + (note: 24 additional sym.ops. were found but ignored + their fractional translations are incommensurate with FFT grid) + + + Cartesian axes + + site n. atom positions (alat units) + 1 Si tau( 1) = ( 0.0000000 0.0000000 0.0000000 ) + 2 Si tau( 2) = ( 0.2500000 0.2500000 0.2500000 ) + + number of k points= 29 + cart. coord. in units 2pi/alat + k( 1) = ( 0.0000000 0.0000000 0.0000000), wk = 0.0039062 + k( 2) = ( -0.1250000 0.1250000 -0.1250000), wk = 0.0312500 + k( 3) = ( -0.2500000 0.2500000 -0.2500000), wk = 0.0312500 + k( 4) = ( -0.3750000 0.3750000 -0.3750000), wk = 0.0312500 + k( 5) = ( 0.5000000 -0.5000000 0.5000000), wk = 0.0156250 + k( 6) = ( 0.0000000 0.2500000 0.0000000), wk = 0.0234375 + k( 7) = ( -0.1250000 0.3750000 -0.1250000), wk = 0.0937500 + k( 8) = ( -0.2500000 0.5000000 -0.2500000), wk = 0.0937500 + k( 9) = ( 0.6250000 -0.3750000 0.6250000), wk = 0.0937500 + k( 10) = ( 0.5000000 -0.2500000 0.5000000), wk = 0.0937500 + k( 11) = ( 0.3750000 -0.1250000 0.3750000), wk = 0.0937500 + k( 12) = ( 0.2500000 0.0000000 0.2500000), wk = 0.0468750 + k( 13) = ( 0.0000000 0.5000000 0.0000000), wk = 0.0234375 + k( 14) = ( -0.1250000 0.6250000 -0.1250000), wk = 0.0937500 + k( 15) = ( 0.7500000 -0.2500000 0.7500000), wk = 0.0937500 + k( 16) = ( 0.6250000 -0.1250000 0.6250000), wk = 0.0937500 + k( 17) = ( 0.5000000 0.0000000 0.5000000), wk = 0.0468750 + k( 18) = ( 0.0000000 0.7500000 0.0000000), wk = 0.0234375 + k( 19) = ( 0.8750000 -0.1250000 0.8750000), wk = 0.0937500 + k( 20) = ( 0.7500000 0.0000000 0.7500000), wk = 0.0468750 + k( 21) = ( 0.0000000 -1.0000000 0.0000000), wk = 0.0117188 + k( 22) = ( -0.2500000 0.5000000 0.0000000), wk = 0.0937500 + k( 23) = ( 0.6250000 -0.3750000 0.8750000), wk = 0.1875000 + k( 24) = ( 0.5000000 -0.2500000 0.7500000), wk = 0.0937500 + k( 25) = ( 0.7500000 -0.2500000 1.0000000), wk = 0.0937500 + k( 26) = ( 0.6250000 -0.1250000 0.8750000), wk = 0.1875000 + k( 27) = ( 0.5000000 0.0000000 0.7500000), wk = 0.0937500 + k( 28) = ( -0.2500000 -1.0000000 0.0000000), wk = 0.0468750 + k( 29) = ( -0.5000000 -1.0000000 0.0000000), wk = 0.0234375 + + Dense grid: 35749 G-vectors FFT dimensions: ( 45, 45, 45) + + Estimated max dynamical RAM per process > 1.29MB + + Estimated total allocated dynamical RAM > 31.06MB + + Initial potential from superposition of free atoms + + starting charge 7.99901, renormalised to 8.00000 + Starting wfc are 8 randomized atomic wfcs + + total cpu time spent up to now is 0.4 secs + + per-process dynamical memory: 2.9 Mb + + Self-consistent Calculation + + iteration # 1 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-02, avg # of iterations = 2.0 + + Threshold (ethr) on eigenvalues was too large: + Diagonalizing with lowered threshold + + Davidson diagonalization with overlap + ethr = 7.97E-04, avg # of iterations = 1.0 + + total cpu time spent up to now is 0.6 secs + + total energy = -15.84982619 Ry + Harris-Foulkes estimate = -15.87079416 Ry + estimated scf accuracy < 0.06161703 Ry + + iteration # 2 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 7.70E-04, avg # of iterations = 1.0 + + total cpu time spent up to now is 0.7 secs + + total energy = -15.85288351 Ry + Harris-Foulkes estimate = -15.85318795 Ry + estimated scf accuracy < 0.00216687 Ry + + iteration # 3 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 2.71E-05, avg # of iterations = 2.4 + + total cpu time spent up to now is 0.8 secs + + total energy = -15.85332918 Ry + Harris-Foulkes estimate = -15.85336185 Ry + estimated scf accuracy < 0.00007437 Ry + + iteration # 4 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 9.30E-07, avg # of iterations = 2.1 + + total cpu time spent up to now is 0.8 secs + + total energy = -15.85334986 Ry + Harris-Foulkes estimate = -15.85335396 Ry + estimated scf accuracy < 0.00000888 Ry + + iteration # 5 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.11E-07, avg # of iterations = 2.1 + + total cpu time spent up to now is 0.9 secs + + total energy = -15.85335134 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 0.00000011 Ry + + iteration # 6 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.35E-09, avg # of iterations = 2.6 + + total cpu time spent up to now is 1.0 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 2.9E-09 Ry + + iteration # 7 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 3.68E-11, avg # of iterations = 2.6 + + total cpu time spent up to now is 1.1 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 2.9E-11 Ry + + iteration # 8 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 3.65E-13, avg # of iterations = 3.3 + + total cpu time spent up to now is 1.2 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 5.4E-12 Ry + + iteration # 9 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-13, avg # of iterations = 1.7 + + total cpu time spent up to now is 1.3 secs + + total energy = -15.85335138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 1.2E-13 Ry + + iteration # 10 ecut= 100.00 Ry beta= 0.70 + Davidson diagonalization with overlap + ethr = 1.00E-13, avg # of iterations = 1.0 + + total cpu time spent up to now is 1.4 secs + + End of self-consistent calculation + + k = 0.0000 0.0000 0.0000 ( 4477 PWs) bands (ev): + + -5.8300 6.2061 6.2061 6.2061 + + k =-0.1250 0.1250-0.1250 ( 4507 PWs) bands (ev): + + -5.6230 4.6051 5.9132 5.9132 + + k =-0.2500 0.2500-0.2500 ( 4510 PWs) bands (ev): + + -5.0182 2.2559 5.4373 5.4373 + + k =-0.3750 0.3750-0.3750 ( 4501 PWs) bands (ev): + + -4.1058 0.2065 5.1074 5.1074 + + k = 0.5000-0.5000 0.5000 ( 4476 PWs) bands (ev): + + -3.4453 -0.8427 4.9947 4.9947 + + k = 0.0000 0.2500 0.0000 ( 4504 PWs) bands (ev): + + -5.5533 4.8935 5.3857 5.3857 + + k =-0.1250 0.3750-0.1250 ( 4517 PWs) bands (ev): + + -5.0777 2.9801 4.8669 4.9518 + + k =-0.2500 0.5000-0.2500 ( 4508 PWs) bands (ev): + + -4.2481 0.8896 4.3532 4.5964 + + k = 0.6250-0.3750 0.6250 ( 4486 PWs) bands (ev): + + -3.3613 -0.6068 3.9003 4.6231 + + k = 0.5000-0.2500 0.5000 ( 4491 PWs) bands (ev): + + -3.6148 -0.2257 3.7125 4.9256 + + k = 0.3750-0.1250 0.3750 ( 4497 PWs) bands (ev): + + -4.5602 1.5598 3.8591 5.4251 + + k = 0.2500 0.0000 0.2500 ( 4477 PWs) bands (ev): + + -5.2819 3.5267 4.5444 5.9125 + + k = 0.0000 0.5000 0.0000 ( 4520 PWs) bands (ev): + + -4.7329 2.7148 4.2862 4.2862 + + k =-0.1250 0.6250-0.1250 ( 4509 PWs) bands (ev): + + -4.0117 1.2745 3.4881 3.9636 + + k = 0.7500-0.2500 0.7500 ( 4482 PWs) bands (ev): + + -3.0647 -0.1975 2.6082 3.9678 + + k = 0.6250-0.1250 0.6250 ( 4477 PWs) bands (ev): + + -2.8512 -0.4657 2.1376 4.2926 + + k = 0.5000 0.0000 0.5000 ( 4489 PWs) bands (ev): + + -3.7521 0.7207 2.3750 4.8614 + + k = 0.0000 0.7500 0.0000 ( 4484 PWs) bands (ev): + + -3.4015 0.4708 3.5586 3.5586 + + k = 0.8750-0.1250 0.8750 ( 4479 PWs) bands (ev): + + -2.4888 -0.6253 2.7002 3.4815 + + k = 0.7500 0.0000 0.7500 ( 4454 PWs) bands (ev): + + -2.0305 -1.0339 1.8049 3.7440 + + k = 0.0000-1.0000 0.0000 ( 4456 PWs) bands (ev): + + -1.6267 -1.6267 3.3090 3.3090 + + k =-0.2500 0.5000 0.0000 ( 4503 PWs) bands (ev): + + -4.4807 1.9234 3.4393 4.7592 + + k = 0.6250-0.3750 0.8750 ( 4489 PWs) bands (ev): + + -3.5748 0.3447 2.8290 4.2439 + + k = 0.5000-0.2500 0.7500 ( 4486 PWs) bands (ev): + + -2.9014 -0.6278 2.7039 4.0076 + + k = 0.7500-0.2500 1.0000 ( 4484 PWs) bands (ev): + + -3.1970 0.2501 2.7770 3.3923 + + k = 0.6250-0.1250 0.8750 ( 4486 PWs) bands (ev): + + -2.3006 -0.7332 2.0576 3.1860 + + k = 0.5000 0.0000 0.7500 ( 4490 PWs) bands (ev): + + -2.6570 -0.3670 1.8851 3.5717 + + k =-0.2500-1.0000 0.0000 ( 4472 PWs) bands (ev): + + -1.5427 -1.5427 2.7194 2.7194 + + k =-0.5000-1.0000 0.0000 ( 4488 PWs) bands (ev): + + -1.4495 -1.4495 2.2655 2.2655 + + highest occupied level (ev): 6.2061 + +! total energy = -15.85435138 Ry + Harris-Foulkes estimate = -15.85335138 Ry + estimated scf accuracy < 4.0E-15 Ry + + The total energy is the sum of the following terms: + + one-electron contribution = 4.76680131 Ry + hartree contribution = 1.08149972 Ry + xc contribution = -4.81476914 Ry + ewald contribution = -16.88688327 Ry + + convergence has been achieved in 10 iterations + + Forces acting on atoms (cartesian axes, Ry/au): + + atom 1 type 1 force = 0.00000000 0.00000000 0.00000000 + atom 2 type 1 force = 0.00000000 0.00000000 -0.00000000 + + Total force = 0.000000 Total SCF correction = 0.000000 + + + Computing stress (Cartesian axis) and pressure + + total stress (Ry/bohr**3) (kbar) P= 0.05 + 0.00000032 -0.00000000 -0.00000000 0.05 -0.00 -0.00 + -0.00000000 0.00000032 0.00000000 -0.00 0.05 0.00 + -0.00000000 0.00000000 0.00000032 -0.00 0.00 0.05 + + + Writing output data file Si.save + + init_run : 0.06s CPU 0.23s WALL ( 1 calls) + electrons : 0.85s CPU 1.01s WALL ( 1 calls) + forces : 0.00s CPU 0.01s WALL ( 1 calls) + stress : 0.02s CPU 0.03s WALL ( 1 calls) + + Called by init_run: + wfcinit : 0.04s CPU 0.11s WALL ( 1 calls) + potinit : 0.00s CPU 0.01s WALL ( 1 calls) + + Called by electrons: + c_bands : 0.73s CPU 0.80s WALL ( 11 calls) + sum_band : 0.11s CPU 0.13s WALL ( 11 calls) + v_of_rho : 0.00s CPU 0.01s WALL ( 11 calls) + mix_rho : 0.00s CPU 0.01s WALL ( 11 calls) + + Called by c_bands: + init_us_2 : 0.01s CPU 0.03s WALL ( 725 calls) + cegterg : 0.69s CPU 0.74s WALL ( 319 calls) + + Called by sum_band: + + Called by *egterg: + h_psi : 0.62s CPU 0.65s WALL ( 980 calls) + g_psi : 0.00s CPU 0.00s WALL ( 632 calls) + cdiaghg : 0.05s CPU 0.10s WALL ( 922 calls) + + Called by h_psi: + h_psi:pot : 0.61s CPU 0.65s WALL ( 980 calls) + h_psi:calbec : 0.03s CPU 0.04s WALL ( 980 calls) + vloc_psi : 0.57s CPU 0.59s WALL ( 980 calls) + add_vuspsi : 0.01s CPU 0.01s WALL ( 980 calls) + + General routines + calbec : 0.03s CPU 0.05s WALL ( 1125 calls) + fft : 0.01s CPU 0.05s WALL ( 50 calls) + fftw : 0.57s CPU 0.64s WALL ( 8656 calls) + davcio : 0.00s CPU 0.06s WALL ( 29 calls) + + Parallel routines + fft_scatter : 0.29s CPU 0.31s WALL ( 8706 calls) + + PWSCF : 1.07s CPU 2.22s WALL + + + This run was terminated on: 19:30: 3 27Sep2017 + +=------------------------------------------------------------------------------= + JOB DONE. +=------------------------------------------------------------------------------=