[Wien] x optic error

Peter Blaha pblaha at theochem.tuwien.ac.at
Wed Jun 6 08:56:18 CEST 2012


Here is the modified opticpara_lapw.


Am 05.06.2012 19:36, schrieb soumyajyoti haldar:
> Dear Prof. Blaha,
>
> How can we get the modified file? Will you update the file in the download section of the site after the modification?
>
> On Tue, Jun 5, 2012 at 3:56 PM, Peter Blaha <pblaha at theochem.tuwien.ac.at <mailto:pblaha at theochem.tuwien.ac.at>> wrote:
>
>     You are absolutely right. $SCRATCH is not used consistently in x_lapw and opticpara
>
>     I'll add ${scratch} in front of all $case.symmat_$i$updn lines (and similar for other files)
>     in opticpara_lapw.

-- 

                                       P.Blaha
--------------------------------------------------------------------------
Peter BLAHA, Inst.f. Materials Chemistry, TU Vienna, A-1060 Vienna
Phone: +43-1-58801-165300             FAX: +43-1-58801-165982
Email: blaha at theochem.tuwien.ac.at    WWW: http://info.tuwien.ac.at/theochem/
--------------------------------------------------------------------------
-------------- next part --------------
#!/bin/csh -f
#
# opticpara: run optic in parallel mode
#
# $Author: M.Lee $
#

# scratch file names for this invocation, keyed on the shell's process id
set tmp  = /tmp/opticpara.$$
set tmp2 = ${tmp}_2

# Remove lock files left in the working directory. The bare ".lock_" is
# created first so that the .lock_* pattern below always has a match.
touch .lock_
foreach stale (.lock_*)
    rm $stale
end

onintr exit

# split the invocation path: directory part -> bin, last component -> name
set name = $0
set bin  = $name:h       #default directory for WIEN-executables
if (! -d $bin) set bin = .
set name = $name:t

# drop any alias on rm so the plain command is used from here on
unalias rm

# testinput FILE LABEL : goto LABEL when FILE does not exist or has zero size
alias testinput 'if (! -e \!:1 ||  -z \!:1) goto \!:2'
# testerror NAME : goto error unless the zero-size test on NAME.error succeeds
alias testerror 'if (! -z \!:1.error) goto error'

# --- fixed settings -------------------------------------------------------
set t       = time
set log     = :parallel
set remote  = ssh
set defmach = `hostname`
set init    = init:
set res     = residue:

# --- switches, empty until the matching command line flag is seen ---------
set cmplx
set updn			# spinpolarization switch
set dnup    = 'dn'		# spinpolarization switch
set sc				# semicore-switch
set hf				# hybrid-switch
set so				# spinorbit-switch

# --- cpu pinning ----------------------------------------------------------
set taskset = 'no'
set taskset0

# --- scratch prefix -------------------------------------------------------
# Empty by default. When the variable SCRATCH is set it is used instead:
# one trailing slash is stripped and exactly one is appended again, because
# computing centers differ in how they write the setting.
set scratch =
if ( $?SCRATCH ) then
  set scratch = `echo $SCRATCH  | sed -e 's/\/$//'`/
endif


############################################################################
# User-adjustable switches: 0 turns an option off, 1 turns it on; where a
# number is expected, choose a value

set useremote   = 1             # using remote shell to launch processes
set delay       = 1             # delay launching of processes by n seconds
set debug       = 0             # set verbosity of debugging output

############################################################################
# Overrides of the defaults, applied in this order:
#   1. the file parallel_options in the script's directory, if present
#   2. the variables TASKSET and USE_REMOTE, if they are set
if (-e $bin/parallel_options) source $bin/parallel_options

# These two must stay block-form: csh expands the command part of a one-line
# "if" even when the test is false, which fails on an unset variable.
if ( $?TASKSET ) then
        set taskset = "$TASKSET"
endif
if ( $?USE_REMOTE ) then
        set useremote = $USE_REMOTE
endif
############################################################################

# Command line handling.
#   -h | -H   print the usage line and stop
#   -c        use the complex executable (cmplx = c)
#   -up | -dn select the spin direction (updn) and its opposite (dnup)
#   -hf -so   set the hf / so name components
#   -sc       set the semicore switch
#   other     taken as the def file; its extension is stripped into $def
if ($#argv < 1) then
	echo "usage: $0 [-c] [-up|-dn] [-hf] [-so] [-sc] deffile"
	exit
endif

while ($#argv)
  switch ($1)
  case -h:
  case -H: 
    set help
    shift; breaksw
  case -c:
    set cmplx = c
    shift; breaksw
  case -up:
    set updn = 'up'
    set dnup = 'dn'
    shift; breaksw
  case -dn:
    set updn = 'dn'
    set dnup = 'up'
    shift; breaksw
  case -hf:
    set hf = 'hf'
    shift; breaksw
  case -so:
    set so = 'so'
    shift; breaksw
  case -sc:
    set sc = 's'
    shift; breaksw
  default:
    set def = $1:r
    shift; breaksw
  endsw
end

# A help request only prints the usage line.
if ($?help) then
	echo "usage: $0 [-c] [-up|-dn] [-hf] [-so] [-sc] deffile"
	exit 0
endif

# Everything below reads $def; stop with a clear message instead of an
# "Undefined variable" abort when only flags were given.
if (! $?def) then
	echo "$0 : no def file given"
	echo "usage: $0 [-c] [-up|-dn] [-hf] [-so] [-sc] deffile"
	exit 1
endif

# Name of the optic executable. Only the bare program name is kept, so the
# command is resolved through the search path wherever it is started (the
# $bin-qualified value that used to be assigned first was always
# overwritten by this one).
set exe = optic$cmplx

#are we running parallel?
# (.processes missing or empty -> continue at the "single" label)
testinput .processes single
echo "running OPTIC in parallel mode"
echo "RUNNING" >.opticpara

#before we start, we wipe away all parallel error files
# The guard also looks at the error file of the current def name, so that
# runs whose def file is not plain "optic" get their stale files wiped too.
# -f keeps rm quiet when a file is matched by both patterns.
if ( -e ${def}_1.error || -e optic_1.error ) rm -f ${def}_*.error *optic_*.error
if ( -e .timeop_1) rm .timeop_*

if (-e .machines.help) rm .machines.help

# $tmp2 holds the lines of .processes that contain a ':' but neither the
# init: nor the residue: tag; there is one such line per parallel job.
grep -v $init .processes|grep : | grep -v $res >$tmp2
set mist     = `wc $tmp2 `
set maxproc  = $mist[1]                # first number printed by wc: line count
# machine of every job: second ':'-separated field of each selected line
set machine  = `cut -f2 -d: $tmp2 | xargs`

# lock file suffix of every job: first word of that field plus the line number
set lockfile = `cut -f2 -d: $tmp2 | awk '{print $1 NR}'|xargs`
set residue  = `grep $res .processes|cut -f2 -d:`
# quoted so that an empty or multi-word value cannot break the expression
if ("$residue" == "") unset residue

if ($debug > 0) echo machines: $machine

# the error file carries this message until the run has finished
echo "** " Error in Parallel OPTIC >$def.error

#bounding cpus
# p_cpu_bound gets one number per entry of $machine: a counter that starts
# at 0 and goes up by one for each consecutive repetition of the same
# machine name, and falls back to 0 whenever the name changes.
set p_cpu_bound = ()
set slot        = 0
set prevhost    = old
foreach host ($machine)
  if ($prevhost != $host) set slot = 0
  set prevhost    = $host
  set p_cpu_bound = ($p_cpu_bound $slot)
  @ slot ++
end

#get name of case
# PWD is set from the shell's own $cwd. The last component of that path is
# the case name; its extension, if any, is removed further down.
setenv PWD $cwd
set case = $cwd:t
if ($case == "") then
  echo "ERROR: cannot detect working directory $cwd -> exit"
  exit 1
endif
set case = $case:r           #head of file-names
if ($debug > 0) then
  echo Setting up case $case for parallel execution
  echo of OPTIC
  echo "  "
endif
#

#creating  def files
# For every parallel job i (1..maxproc) a private copy "$def"_$i.def of
# $def.def is written in which the file names listed below carry the
# suffix _$i.
if ($debug > 0) echo " "
if ($debug > 0) echo -n "creating "$def"_*.def:  "
set i = 1
while ($i <= $maxproc)
  if ($debug > 0) echo -n "$i "
  cp $def.def .tmp
  #substituting in files:
  # The here-document delimiter is unquoted, so the shell fills in $hf, $so,
  # $dnup, $updn and $i before sed reads the script. Each command appends
  # _$i to the matched name; the w flag writes every changed line to .mist.
  cat <<theend >.script
s/vector$hf$so$dnup/&_$i/w .mist
s/vector$hf$so$updn/&_$i/w .mist
s/outputop/&_$i/w .mist
s/symmat/&_$i/w .mist
s/mommat2/&_$i/w .mist
s/mat_diag/&_$i/w .mist
s/mme/&_$i/w .mist
s/symop/&_$i/w .mist

theend

  # Apply the script, then repair names that were suffixed twice, e.g. when
  # the plain "vector" pattern (empty $updn) also hit a name that had
  # already been turned into vectordn_$i. The result alternates between
  # .tmp1 and .tmp2; the last step writes the final def file.
  # NOTE(review): the two patterns containing \& look like they target a
  # literal '&' left in the name - confirm which input produces that.
  sed -f .script .tmp > .tmp1
  sed "s/vector_${i}_$i\&dn/vectordn_$i/" .tmp1>.tmp2 
  sed "s/vector_${i}_$i\&up/vectorup_$i/" .tmp2>.tmp1
  sed "s/vector_${i}dn_$i/vectordn_$i/" .tmp1>.tmp2
  sed "s/vector_${i}_$i/vector_$i/" .tmp2>.tmp1
  sed "s/vectorhf_${i}dn_$i/vectorhfdn_$i/" .tmp1> "$def"_$i.def
#similar fix for SO necessary

  @ i ++
end
if ($debug > 0) echo " "


#starting processes
# Starts one optic job per def file ("$def"_1.def .. "$def"_$maxproc.def).
# The machine slots are polled in a loop; a slot takes the next job only
# while its lock file .lock_$lockfile[$p] does not exist. The lock file is
# created right before the job is started in the background and removed by
# the job's own command line once optic has returned.
if ($debug > 0) echo " "
if ($debug > 0) echo "starting process:  "

echo "->  "starting parallel optic at `date` >>$log

# loop    : number of jobs started so far
# runmach : machine of every started job, in start order
# NOTE(review): endloop is not referenced again in the visible script.
set loop    = 0
set endloop = 0
set runmach = ""
echo "files:$maxproc" >.processes2
# change working dir because of problems with automounted directories
#   cd $cwd
while ($loop < $maxproc)
  set p = 1
  # NOTE(review): resok is not set anywhere in the visible script, so p
  # starts at 1 unless parallel_options defines it - confirm.
  if ($?residue && $?resok) set p = 2
  while ($p <= $#machine)
    if ($loop < $maxproc) then
	if !(-e .lock_$lockfile[$p]) then
	    @ loop ++
	    # .processes2 is rewritten for every started job: first the line
	    # "job:total : cpu index", then the machines used so far
	    echo "${loop}:${maxproc} : $p_cpu_bound[$p]" >.processes2
	    if ($debug > 0) echo prepare $loop on $machine[$p]
	    set runmach = ($runmach $machine[$p])
	    echo $runmach >>.processes2
	    if ($debug > 1) echo "   >  $exe ${def}_${loop}.def on $machine[$p]"
	    if ($debug > 1) echo "   >  $exe ${def}_${loop}.def on $machine[$p]">>$log
	    if ($useremote == 1) then
	    if ($debug > 1) echo use remote
		touch .lock_$lockfile[$p]
		# .timeop_N starts with the machine name; the output of the
		# job is appended behind it
		echo -n "$runmach[$loop] ">.timeop_$loop
		# when taskset is not 'no', its value plus the cpu index of
		# this slot is put in front of the executable
                if($taskset != 'no') set taskset0="$taskset $p_cpu_bound[$p]"
		($remote $machine[$p] "cd $PWD;$t $taskset0 $exe ${def}_${loop}.def;rm -f .lock_$lockfile[$p]") >>.timeop_$loop  &
	 else
		# local start in a subshell; taskset0 is not used on this path
		if ($debug > 1) echo not using remote shell
		touch .lock_$lockfile[$p]
		echo -n "$runmach[$loop] " >.timeop_$loop
		(cd $PWD;$t $exe ${def}_${loop}.def;rm -f .lock_$lockfile[$p]) >>.timeop_$loop  &
	    endif
	endif
    # executed on every visit of a slot while jobs are still to be started,
    # whether or not a job was launched on this visit
    if ($debug > 1) echo sleeping for $delay seconds
    sleep $delay
            jobs -l >.optic${cmplx}para.$$.`hostname`
    endif
    @ p ++
  end
end

#wait for execution to be completed
if ($debug > 0) then
  echo " "
  echo "waiting for processes:  "
endif
wait

# Check the error file of every job; the first one that fails the
# zero-size test sends the script to the error label.
set i = 1
while ($i <= $maxproc)
  if (! -z "$def"_$i.error) goto error
  @ i ++
end

#cpu summary:
# Every timing file is passed through bashtime2csh.pl_lapw (fix for bash
# timing), replaced by the converted text, and then appended to the log as
# one line.
set i = 1
while ($i <= $maxproc)
    set tfile = .timeop_$i
    bashtime2csh.pl_lapw $tfile > .time_tmp
    mv .time_tmp $tfile
    echo "      "`cat $tfile` >>$log
    @ i ++
end

# postanalysis
# Writes one summary line per started job's machine: the user time and the
# wallclock time (minutes*60 + seconds) summed over all timing lines of
# that machine. Consecutive identical lines are collapsed by uniq before
# the summary is shown and appended to the log.
echo "   Summary of opticpara:" >$tmp
set p = 1
while ($p <= $#machine)
    set m = $runmach[$p]
    # Select the timing lines by comparing their first field with the machine
    # name exactly. Filtering with "grep $m" would treat the name as an
    # unanchored regular expression, so that e.g. node1 would also collect
    # the timings of node10.
    cat .timeop_* | tr "():" " " | \
	    awk -v host="$m" '$1 == host {u += $2; cl += 60*$4+$5} END {print "   " host "\t user=" u "\t wallclock=" cl}' >>$tmp
    @ p ++
end

uniq < $tmp |tee -a $log

echo "<-  "done at `date` >>$log

# concatenating the case.symmat files and case.mommat files
#
# Result files: case.symop in the working directory, and mme, symmat,
# mommat2 and mat_diag (each with the spin suffix) under the scratch prefix.

# start every result file from scratch: remove an old one, create an empty one
if (-e $case.symop)  rm $case.symop
foreach kind (mme symmat mommat2 mat_diag)
    if (-e ${scratch}$case.$kind$updn) rm ${scratch}$case.$kind$updn
    touch ${scratch}$case.$kind$updn
end

# symop: the file of job 1 becomes the result, the others are dropped
mv $case.symop_1 $case.symop
rm $case.symop_*

# symmat, mat_diag, mme: the file of job 1 is taken whole, those of the
# other jobs without their first line; every part is deleted once appended.
# No mommat2 parts are merged, so that result file stays empty.
set i = 1
while ($i <= $maxproc)
    foreach kind (symmat mat_diag mme)
        set part  = ${scratch}$case.${kind}_$i$updn
        set whole = ${scratch}$case.$kind$updn
        if ( $i == 1 ) then
            cat $part >> $whole
        else
            tail -n +2 $part >> $whole
        endif
        rm $part
    end
    @ i ++
end

echo "<-  "done at `date` >>$log
echo "-----------------------------------------------------------------">>$log

# success: leave an empty error file behind
rm $def.error
touch $def.error

# remove the scratch files and the job list of this invocation
rm $tmp* >&/dev/null
rm .optic${cmplx}para.$$.`hostname` >&/dev/null
echo "DONE" >.opticpara
exit 0

single:
# Reached through "testinput .processes single", i.e. when .processes does
# not exist or is empty: optic is run once on the unsplit def file.
echo "running in single mode"
$exe $def.def
# The $tmp files are only created on the parallel path, so the pattern may
# match nothing here; all output of the two rm calls is discarded.
rm $tmp* >&/dev/null
rm .optic${cmplx}para.$$.`hostname` >&/dev/null
exit 0

scratchwarning:
# Help text for the case that a per-job symmat file is not where the
# concatenation step looks for it (under the scratch prefix). The text uses
# ${scratch}, which is always set, rather than $SCRATCH, which aborts the
# script when it is undefined. The loop index in the example commands is
# printed literally as $i.
# NOTE(review): no goto in the visible script targets this label; the
# testinput call that used it is commented out.
echo "Could not find ${scratch}$case.symmat_$i$updn , which is probably because you used a scratch directory ${scratch}"
echo "Copy these files  from the remote machines and concatenate them yourself"
echo "with commands like (for all your parallel calculations i):"
echo " cat $case.symmat_"'$i'"$updn >> $case.symmat$updn           when "'$i'" = 1"
echo " tail -n +2  $case.symmat_"'$i'"$updn >> $case.symmat$updn   else"
exit 1

error:
# Target of the testerror alias: reports the crash on the terminal and in
# the log, appends the error message to $def.error, removes the scratch
# files of this invocation, marks .opticpara with ERROR and exits with
# status 1.
echo "** " OPTIC crashed!
echo "** " OPTIC crashed at `date`>>$log
echo "** " check ERROR FILES! >>$log
echo "-----------------------------------------------------------------">>$log
echo "** " Error in Parallel OPTIC >>$def.error
rm $tmp* >&/dev/null
rm .optic${cmplx}para.$$.`hostname` >&/dev/null
echo "ERROR" >.opticpara
exit 1


More information about the Wien mailing list