makefile substitution now based on regexp match.
condensed makefile syntax. can now use a system-defined LAPACK instead of ACML (required for OS X...). fixed bug that 'ULTRA' was not using -O3 for most of the compiling...
This commit is contained in:
parent
d96c64373c
commit
739c524848
168
code/makefile
168
code/makefile
|
@ -3,20 +3,25 @@
|
||||||
########################################################################################
|
########################################################################################
|
||||||
# Be sure to remove all files compiled with different options by using "make clean"
|
# Be sure to remove all files compiled with different options by using "make clean"
|
||||||
#
|
#
|
||||||
# Uses OpenMP to parallelise the material subroutines (set number of cores with "export DAMASK_NUM_THREADS=n" to n)
|
# Uses OpenMP to parallelize the material subroutines (set number of threads with "export DAMASK_NUM_THREADS=n" to n)
|
||||||
# Uses linux threads to parallelise fftw3
|
|
||||||
# Besides the f90 files written at MPIE, the two fftw3 library files "libfftw3_threads.a" and "libfftw3.a" are also needed
|
|
||||||
# Install fftw3 (v3.3 is tested):
|
|
||||||
# -Apply the following patch to api/f77funcs.h, line 92 in the FFTW source:
|
|
||||||
#
|
#
|
||||||
|
# Install fftw3 (v3.3 is tested):
|
||||||
|
# + patch api/f77funcs.h, line 92 in the FFTW source with:
|
||||||
# FFTW_VOIDFUNC F77(set_timelimit,SET_TIMELIMIT)(double *t)
|
# FFTW_VOIDFUNC F77(set_timelimit,SET_TIMELIMIT)(double *t)
|
||||||
# {
|
# {
|
||||||
# X(set_timelimit)(*t);
|
# X(set_timelimit)(*t);
|
||||||
# }
|
# }
|
||||||
# -Do "./configure --enable-threads --enable-sse2 --enable-shared" and "make"; "make install" is not needed
|
# + run
|
||||||
# as long as the two library files "libfftw3_threads.a" "libfftw3.a" are copied to the /../lib directory.
|
# ./configure --enable-threads --enable-sse2 --enable-shared [--enable-float]
|
||||||
# for single precision also use --enable-float
|
# make
|
||||||
# Need the AMD Core Math Library to be installed (v 4.4 is tested)
|
# make install
|
||||||
|
# + specify in the "pathinfo:FFTW" where FFTW was installed.
|
||||||
|
# We essentially look for two library files "lib/libfftw3_threads.a" and "lib/libfftw3.a", so you can copy those, for instance,
|
||||||
|
# into DAMASK_ROOT/lib/fftw/lib/ and specify "./fftw/" as pathinfo:FFTW
|
||||||
|
# Use --enable-float in above configure for single precision...
|
||||||
|
# Uses linux threads to parallelize fftw3
|
||||||
|
#
|
||||||
|
# Instead of the AMD Core Math Library a standard "liblapack.a/dylib/etc." can be used by leaving pathinfo:ACML blank
|
||||||
########################################################################################
|
########################################################################################
|
||||||
# OPTIONS = standard (alternative): meaning
|
# OPTIONS = standard (alternative): meaning
|
||||||
#-------------------------------------------------------------
|
#-------------------------------------------------------------
|
||||||
|
@ -25,19 +30,16 @@
|
||||||
# PORTABLE = TRUE (FALSE): decision, if executable is optimized for the machine on which it was built.
|
# PORTABLE = TRUE (FALSE): whether the executable stays portable (TRUE) or is optimized for the machine on which it was built (FALSE).
|
||||||
# OPTIMIZATION = DEFENSIVE (OFF,AGGRESSIVE,ULTRA): Optimization mode: O2, O0, O3 + further options for most files, O3 + further options for all files
|
# OPTIMIZATION = DEFENSIVE (OFF,AGGRESSIVE,ULTRA): Optimization mode: O2, O0, O3 + further options for most files, O3 + further options for all files
|
||||||
# OPENMP = TRUE (FALSE): OpenMP multiprocessor support
|
# OPENMP = ON (OFF): OpenMP multiprocessor support
|
||||||
# FFTWPATH =TAKE_FFTW_PATH, will be adjusted by setup_code.py
|
# FFTWROOT = pathinfo:FFTW (will be adjusted by setup_code.py)
|
||||||
# ACMLROOT =TAKE_ACLM_ROOT, will be adjusted by setup_code.py
|
# ACMLROOT = pathinfo:ACML (will be adjusted by setup_code.py)
|
||||||
# ACMLPATH =$(ACMLROOT)/"compilerdir"/lib (...) Path to ACML Library, choose according to your system
|
# ACMLPATH =$(ACMLROOT)/"compilerdir"/lib (...) Path to ACML, choose according to your system
|
||||||
# ACMLPATH =$(ACMLROOT)/"compilerdir"_mp/lib (...) Path to ACML Library with multicore support, choose according to your system
|
# ACMLPATH =$(ACMLROOT)/"compilerdir"_mp/lib (...) Path to ACML with multicore support, choose according to your system
|
||||||
# "compilerdir" is "intel64" for ifort
|
# "compilerdir" is "intel64" for ifort
|
||||||
# FFTWOPTIONS =$(FFTWPATH)/libfftw3.a $(FFTWPATH)/libfftw3_threads.a -lpthread (...) Path to FFTW library files with Linux threads (multicore) support
|
|
||||||
# FFTWOPTIONS =$(FFTWPATH)/libfftw3.a (...) Path to FFTW library files without Linux threads (multicore) support
|
|
||||||
# FFTWOPTIONS is different for single and double precision. Choose the options to use OpenMP instead of pthreads support or change the directory
|
|
||||||
# PREFIX: specify an arbitrary prefix
|
# PREFIX: specify an arbitrary prefix
|
||||||
# SUFFIX: specify an arbitrary suffix
|
# SUFFIX: specify an arbitrary suffix
|
||||||
# COMPILERNAME = overwrite name of Compiler, e.g. using mpich-g90 instead of ifort
|
# COMPILERNAME = overwrite name of Compiler, e.g. using mpich-g90 instead of ifort
|
||||||
########################################################################################
|
########################################################################################
|
||||||
# Here are some useful debugging switches. Switch on by uncommenting the #SUFFIX line at the end of this section:
|
# Here are some useful debugging switches. Switch on by uncommenting the #SUFFIX line at the end of this section:
|
||||||
# information on http://software.intel.com/en-us/articles/determining-root-cause-of-sigsegv-or-sigbus-errors/
|
# information on http://software.intel.com/en-us/articles/determining-root-cause-of-sigsegv-or-sigbus-errors/
|
||||||
# check if an array index is too small (<1) or too large!
|
# check if an array index is too small (<1) or too large!
|
||||||
DEBUG1 =-check bounds -g
|
DEBUG1 =-check bounds -g
|
||||||
|
@ -57,98 +59,95 @@ DEBUG5 =-stand std03/std95
|
||||||
#SUFFIX =$(DEBUG1) $(DEBUG2) $(DEBUG3)
|
#SUFFIX =$(DEBUG1) $(DEBUG2) $(DEBUG3)
|
||||||
########################################################################################
|
########################################################################################
|
||||||
|
|
||||||
#default values below will be set by setup_code.py
|
#auto values will be set by setup_code.py
|
||||||
#FFTWPATH =../lib
|
FFTWROOT := auto
|
||||||
#ACMLROOT =/opt/acml4.4.0
|
ACMLROOT := auto
|
||||||
|
|
||||||
FFTWPATH =/nethome/m.diehl/DAMASK/lib
|
F90 ?= ifort
|
||||||
ACMLROOT =/opt/acml4.4.0
|
|
||||||
|
|
||||||
ifndef F90
|
COMPILERNAME ?= $(F90)
|
||||||
F90 =ifort
|
|
||||||
|
OPENMP ?= ON
|
||||||
|
|
||||||
|
OPTIMIZATION ?= DEFENSIVE
|
||||||
|
|
||||||
|
ifeq "$(OPTIMIZATION)" "OFF"
|
||||||
|
OPTI := OFF
|
||||||
|
MAXOPTI := OFF
|
||||||
|
endif
|
||||||
|
ifeq "$(OPTIMIZATION)" "DEFENSIVE"
|
||||||
|
OPTI := DEFENSIVE
|
||||||
|
MAXOPTI := DEFENSIVE
|
||||||
|
endif
|
||||||
|
ifeq "$(OPTIMIZATION)" "AGGRESSIVE"
|
||||||
|
OPTI := AGGRESSIVE
|
||||||
|
MAXOPTI := DEFENSIVE
|
||||||
|
endif
|
||||||
|
ifeq "$(OPTIMIZATION)" "ULTRA"
|
||||||
|
OPTI := AGGRESSIVE
|
||||||
|
MAXOPTI := AGGRESSIVE
|
||||||
endif
|
endif
|
||||||
|
|
||||||
ifndef OPTIMIZATION
|
ifndef OPTI
|
||||||
OPTIMIZATION =DEFENSIVE
|
OPTI := DEFENSIVE
|
||||||
endif
|
MAXOPTI := DEFENSIVE
|
||||||
MAXOPTI =$(OPTIMIZATION)
|
|
||||||
|
|
||||||
ifeq ($(OPTIMIZATION),AGGRESSIVE)
|
|
||||||
MAXOPTI=DEFENSIVE
|
|
||||||
endif
|
endif
|
||||||
|
|
||||||
ifeq ($(OPTIMIZATION),ULTRA)
|
ifeq "$(PORTABLE)" "FALSE"
|
||||||
MAXOPTI=AGGRESSIVE
|
|
||||||
OPTIMIZATION=AGGRESSIVE
|
|
||||||
endif
|
|
||||||
|
|
||||||
ifeq ($(PORTABLE),FALSE)
|
|
||||||
PORTABLE_SWITCH = -msse3
|
PORTABLE_SWITCH = -msse3
|
||||||
endif
|
endif
|
||||||
|
|
||||||
ifndef OPENMP
|
ifeq "$(PRECISION)" "single"
|
||||||
OPENMP=ON
|
FFTWPREC = f
|
||||||
|
else
|
||||||
|
FFTWPREC =
|
||||||
endif
|
endif
|
||||||
|
|
||||||
# setting defaults in case of multicore support
|
|
||||||
ifeq ($(OPENMP),ON)
|
# settings for multicore support
|
||||||
|
ifeq "$(OPENMP)" "ON"
|
||||||
OPENMP_FLAG_ifort = -openmp -openmp-report0 -parallel
|
OPENMP_FLAG_ifort = -openmp -openmp-report0 -parallel
|
||||||
OPENMP_FLAG_gfortran = -fopenmp
|
OPENMP_FLAG_gfortran = -fopenmp
|
||||||
ifndef ACMLPATH
|
ACML_ARCH =_mp
|
||||||
ACMLPATH =$(ACMLROOT)/$(F90)64_mp/lib
|
LIBRARIES += -lfftw3$(FFTWPREC)_threads -lpthread
|
||||||
endif
|
endif
|
||||||
ifndef FFTWOPTIONS
|
|
||||||
ifeq ($(PRECISION),single)
|
LIBRARIES += -lfftw3$(FFTWPREC)
|
||||||
FFTWOPTIONS =$(FFTWPATH)/libfftw3f_threads.a $(FFTWPATH)/libfftw3f.a -lpthread
|
LIB_DIRS += -L$(FFTWROOT)/lib
|
||||||
|
|
||||||
|
ifdef ACMLROOT
|
||||||
|
LIB_DIRS += -L$(ACMLROOT)/$(F90)64$(ACML_ARCH)/lib
|
||||||
|
LIBRARIES += -lacml$(ACML_ARCH)
|
||||||
else
|
else
|
||||||
FFTWOPTIONS =$(FFTWPATH)/libfftw3_threads.a $(FFTWPATH)/libfftw3.a -lpthread
|
LIBRARIES += -llapack
|
||||||
endif
|
|
||||||
endif
|
|
||||||
BLAS=$(ACMLPATH)/libacml_mp.a
|
|
||||||
|
|
||||||
#setting defaults in case of single core compilation
|
|
||||||
else
|
|
||||||
ifndef ACMLPATH
|
|
||||||
ACMLPATH=$(ACMLROOT)/$(F90)64/lib
|
|
||||||
endif
|
|
||||||
ifndef FFTWOPTIONS
|
|
||||||
ifeq ($(PRECISION),single)
|
|
||||||
FFTWOPTIONS =$(FFTWPATH)/libfftw3f.a
|
|
||||||
else
|
|
||||||
FFTWOPTIONS =$(FFTWPATH)/libfftw3.a
|
|
||||||
endif
|
|
||||||
endif
|
|
||||||
BLAS=$(ACMLPATH)/libacml.a
|
|
||||||
endif
|
endif
|
||||||
|
|
||||||
|
|
||||||
OPTIMIZATION_OFF_ifort =-O0
|
OPTIMIZATION_OFF_ifort :=-O0
|
||||||
OPTIMIZATION_OFF_gfortran =-O0
|
OPTIMIZATION_OFF_gfortran :=-O0
|
||||||
OPTIMIZATION_DEFENSIVE_ifort =-O2
|
OPTIMIZATION_DEFENSIVE_ifort :=-O2
|
||||||
OPTIMIZATION_DEFENSIVE_gfortran =-O2
|
OPTIMIZATION_DEFENSIVE_gfortran :=-O2
|
||||||
OPTIMIZATION_AGGRESSIVE_ifort =-O3 $(PORTABLE_SWITCH) -ip -static -fp-model fast=2 -no-prec-div
|
OPTIMIZATION_AGGRESSIVE_ifort :=-O3 $(PORTABLE_SWITCH) -ip -static -fp-model fast=2 -no-prec-div
|
||||||
OPTIMIZATION_AGGRESSIVE_gfortran =-O3 $(PORTABLE_SWITCH) -march=opteron -ffast-math -funroll-loops -ftree-vectorize -ftree-loop-linear
|
OPTIMIZATION_AGGRESSIVE_gfortran :=-O3 $(PORTABLE_SWITCH) -ffast-math -funroll-loops -ftree-vectorize
|
||||||
|
|
||||||
COMPILE_OPTIONS_ifort =-fpp -diag-disable 8291,8290
|
|
||||||
COMPILE_OPTIONS_gfortran =-xf95-cpp-input -fno-range-check
|
|
||||||
|
|
||||||
COMPILE =${OPENMP_FLAG_${F90}} ${COMPILE_OPTIONS_${F90}} ${OPTIMIZATION_${OPTIMIZATION}_${F90}} -c
|
COMPILE_OPTIONS_ifort := -fpp -diag-disable 8291,8290
|
||||||
COMPILE_MAXOPTI =${OPENMP_FLAG_${F90}} ${COMPILE_OPTIONS_${F90}} ${OPTIMIZATION_${MAXOPTI}_${F90}} -c
|
COMPILE_OPTIONS_gfortran := -xf95-cpp-input -fno-range-check
|
||||||
|
|
||||||
ifndef COMPILERNAME
|
COMPILE = $(OPENMP_FLAG_$(F90)) $(COMPILE_OPTIONS_$(F90)) $(OPTIMIZATION_$(OPTI)_$(F90)) -c
|
||||||
COMPILERNAME=$(F90)
|
COMPILE_MAXOPTI = $(OPENMP_FLAG_$(F90)) $(COMPILE_OPTIONS_$(F90)) $(OPTIMIZATION_$(MAXOPTI)_$(F90)) -c
|
||||||
endif
|
|
||||||
|
|
||||||
ifeq ($(PRECISION),single)
|
|
||||||
|
ifeq "$(PRECISION)" "single"
|
||||||
DAMASK_spectral_single.exe: DAMASK_spectral_single.o CPFEM.a
|
DAMASK_spectral_single.exe: DAMASK_spectral_single.o CPFEM.a
|
||||||
$(PREFIX) $(COMPILERNAME) $(OPENMP_FLAG_$(F90)) -o DAMASK_spectral_single.exe DAMASK_spectral_single.o CPFEM.a $(FFTWOPTIONS)\
|
$(PREFIX) $(COMPILERNAME) $(OPENMP_FLAG_$(F90)) -o DAMASK_spectral_single.exe DAMASK_spectral_single.o CPFEM.a \
|
||||||
constitutive.a advanced.a basics.a $(BLAS)
|
constitutive.a advanced.a basics.a $(LIB_DIRS) $(LIBRARIES)
|
||||||
DAMASK_spectral_single.o: DAMASK_spectral_single.f90 CPFEM.o
|
DAMASK_spectral_single.o: DAMASK_spectral_single.f90 CPFEM.o
|
||||||
$(PREFIX) $(COMPILERNAME) $(COMPILE_MAXOPTI) DAMASK_spectral_single.f90 $(SUFFIX)
|
$(PREFIX) $(COMPILERNAME) $(COMPILE_MAXOPTI) DAMASK_spectral_single.f90 $(SUFFIX)
|
||||||
else
|
else
|
||||||
DAMASK_spectral.exe: DAMASK_spectral.o CPFEM.a
|
DAMASK_spectral.exe: DAMASK_spectral.o CPFEM.a
|
||||||
$(PREFIX) $(COMPILERNAME) ${OPENMP_FLAG_${F90}} -o DAMASK_spectral.exe DAMASK_spectral.o CPFEM.a $(FFTWOPTIONS)\
|
$(PREFIX) $(COMPILERNAME) ${OPENMP_FLAG_${F90}} -o DAMASK_spectral.exe DAMASK_spectral.o CPFEM.a \
|
||||||
constitutive.a advanced.a basics.a $(BLAS)
|
constitutive.a advanced.a basics.a $(LIB_DIRS) $(LIBRARIES)
|
||||||
DAMASK_spectral.o: DAMASK_spectral.f90 CPFEM.o
|
DAMASK_spectral.o: DAMASK_spectral.f90 CPFEM.o
|
||||||
$(PREFIX) $(COMPILERNAME) $(COMPILE_MAXOPTI) DAMASK_spectral.f90 $(SUFFIX)
|
$(PREFIX) $(COMPILERNAME) $(COMPILE_MAXOPTI) DAMASK_spectral.f90 $(SUFFIX)
|
||||||
endif
|
endif
|
||||||
|
@ -205,7 +204,7 @@ mesh.o: mesh.f90 FEsolving.o
|
||||||
FEsolving.o: FEsolving.f90 basics.a
|
FEsolving.o: FEsolving.f90 basics.a
|
||||||
$(PREFIX) $(COMPILERNAME) $(COMPILE) FEsolving.f90 $(SUFFIX)
|
$(PREFIX) $(COMPILERNAME) $(COMPILE) FEsolving.f90 $(SUFFIX)
|
||||||
|
|
||||||
ifeq ($(PRECISION),single)
|
ifeq "$(PRECISION)" "single"
|
||||||
basics.a: debug.o math.o
|
basics.a: debug.o math.o
|
||||||
ar rc basics.a debug.o math.o numerics.o IO.o DAMASK_spectral_interface.o prec_single.o
|
ar rc basics.a debug.o math.o numerics.o IO.o DAMASK_spectral_interface.o prec_single.o
|
||||||
else
|
else
|
||||||
|
@ -222,7 +221,7 @@ numerics.o: numerics.f90 IO.o
|
||||||
IO.o: IO.f90 DAMASK_spectral_interface.o
|
IO.o: IO.f90 DAMASK_spectral_interface.o
|
||||||
$(PREFIX) $(COMPILERNAME) $(COMPILE) IO.f90 $(SUFFIX)
|
$(PREFIX) $(COMPILERNAME) $(COMPILE) IO.f90 $(SUFFIX)
|
||||||
|
|
||||||
ifeq ($(PRECISION),single)
|
ifeq "$(PRECISION)" "single"
|
||||||
DAMASK_spectral_interface.o: DAMASK_spectral_interface.f90 prec_single.o
|
DAMASK_spectral_interface.o: DAMASK_spectral_interface.f90 prec_single.o
|
||||||
$(PREFIX) $(COMPILERNAME) $(COMPILE) DAMASK_spectral_interface.f90 $(SUFFIX)
|
$(PREFIX) $(COMPILERNAME) $(COMPILE) DAMASK_spectral_interface.f90 $(SUFFIX)
|
||||||
prec_single.o: prec_single.f90
|
prec_single.o: prec_single.f90
|
||||||
|
@ -240,3 +239,4 @@ clean:
|
||||||
rm -rf *.mod
|
rm -rf *.mod
|
||||||
rm -rf *.a
|
rm -rf *.a
|
||||||
rm -rf *.exe
|
rm -rf *.exe
|
||||||
|
|
||||||
|
|
|
@ -1,7 +1,7 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
# $Id$
|
# $Id$
|
||||||
# Writes version specific files for different MARC releases
|
# Writes version specific files for different MARC releases
|
||||||
import os,sys,string,damask
|
import os,sys,string,re,damask
|
||||||
|
|
||||||
architectures = {
|
architectures = {
|
||||||
'marc': {
|
'marc': {
|
||||||
|
@ -43,12 +43,8 @@ content = makefile.readlines()
|
||||||
makefile.close()
|
makefile.close()
|
||||||
makefile = open(os.path.join(baseDir,'makefile'),'w')
|
makefile = open(os.path.join(baseDir,'makefile'),'w')
|
||||||
for line in content:
|
for line in content:
|
||||||
if line.startswith('FFTWPATH'):
|
m = re.match(r'(FFTW|ACML)ROOT\s*:?=',line)
|
||||||
line='FFTWPATH =%s\n'%(damaskEnv.pathInfo['fftw'])
|
if m: line = '%sROOT := %s\n'%(m.group(1),damaskEnv.pathInfo[m.group(1).lower()])
|
||||||
print line
|
|
||||||
if line.startswith('ACMLROOT'):
|
|
||||||
line='ACMLROOT =%s\n'%(damaskEnv.pathInfo['acml'])
|
|
||||||
print line
|
|
||||||
makefile.writelines(line)
|
makefile.writelines(line)
|
||||||
makefile.close()
|
makefile.close()
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue