# Makefile to compile the Material subroutine for BVP solution using spectral method # # use switch on make to determine PRECISION, e.g make PRECISION=single # default is PRECISION=double # be sure to remove all librarys with different PRECISION (make clean) # # Uses openmp to parallelise the material subroutines (set number of cores with "export DAMASK_NUM_THREADS=n" to n) # Uses linux threads to parallelise fftw3 (should also be possible with openmp) # Besides of the f90 files written at MPIE, the two library files of fftw3 "libfftw3_threads.a" "libfftw3.a" are also needed # Install fftw3 (v3.3 is tested) with "./configure --enable-threads --enable-sse2" and "make"; "make install" is not needed # as long as the two library files "libfftw3_threads.a" "libfftw3.a" are copied to the code/include directory. # OPTIONS = standard (alternative): meaning #------------------------------------------------------------- # PRECISION = double (single): floating point precision # F90 = ifort (gfortran): compiler, choose Intel or GNU # PORTABLE = TRUE (FALSE): decision, if executable is optimized for the machine on which it was built. Until now only for ifort # OPTIMIZATION = DEFENSIVE (OFF,AGGRESSIVE,ULTRA): Optimization mode, O0, O2, O3 # OPENMP = TRUE (FALSE): OpenMP multiprocessor support # PREFIX: specifie an arbitrary prefix # SUFFIX: specife an arbitrary suffix, e.g # COMPILERNAME = overwrite name of Compiler, e.g. using mpich-g90 instead of ifort # Here are some usefull debugging switches. Switch on by uncommenting last line: #-------------------------------------------------------------------------------- # information on http://software.intel.com/en-us/articles/determining-root-cause-of-sigsegv-or-sigbus-errors/ # check if an array index is too small (<1) or too large! DEBUG1 =-check bounds -g #will cause a lot of warnings because we create a bunch of temporary arrays DEBUG2 =-check arg_temp_created #check from time to time DEBUG3 =-fp-stack-check -g -traceback -gen-interfaces -warn interfaces #should not be done for OpenMP, but set "ulimit -s unlimited" on shell. Problably it helps also to unlimit other limits DEBUG4 =-heap-arrays #checks for standard DEBUG5 =stand std03/std95 #SUFFIX =$(DEBUG1) $(DEBUG2) $(DEBUG3) #BLAS for OPENMP=OFF BLAS_ifort =-L /opt/acml4.4.0/ifort64/lib -lacml BLAS_gfortran = ifeq ($(F90), ) F90 =ifort endif ifeq ($(OPTIMIZATION), ) OPTIMIZATION =DEFENSIVE endif MAXOPTI =$(OPTIMIZATION) ifeq ($(OPTIMIZATION),ULTRA) MAXOPTI=AGGRESSIVE endif ifeq ($(OPTIMIZATION),AGGRESSIVE) MAXOPTI=DEFENSIVE endif ifeq ($(PORTABLE),FALSE) PORTABLE_SWITCH =-msse3 endif ifneq ($(OPENMP), OFF) OPENMP_FLAG_ifort =-openmp -openmp-report0 -parallel OPENMP_FLAG_gfortran =-fopenmp BLAS_ifort =-L /opt/acml4.4.0/ifort64_mp/lib -lacml_mp BLAS_gfortran = OPENMP =ON endif OPTIMIZATION_OFF_ifort =-O0 OPTIMIZATION_OFF_gfortran =-O0 OPTIMIZATION_DEFENSIVE_ifort =-O2 OPTIMIZATION_DEFENSIVE_gfortran =-O2 OPTIMIZATION_AGGRESSIVE_ifort =-O3 $(PORTABLE_SWITCH) -ip -static -fp-model fast=2 -no-prec-div OPTIMIZATION_ULTRA_ifort =-O3 $(PORTABLE_SWITCH) -ip -static -fp-model fast=2 -no-prec-div OPTIMIZATION_AGGRESSIVE_gfortran =-O3 -march=opteron -ffast-math -funroll-loops -ftree-vectorize -ftree-loop-linear $(PORTABLE_SWITCH) COMPILE_OPTIONS_ifort =-fpp -diag-disable 8291,8290 COMPILE_OPTIONS_gfortran =-xf95-cpp-input -ffree-line-length-none COMPILE =${OPENMP_FLAG_${F90}} ${COMPILE_OPTIONS_${F90}} ${OPTIMIZATION_${OPTIMIZATION}_${F90}} -c COMPILE_MAXOPTI =${OPENMP_FLAG_${F90}} ${COMPILE_OPTIONS_${F90}} ${OPTIMIZATION_${MAXOPTI}_${F90}} -c ifndef COMPILERNAME COMPILERNAME=$(F90) endif ifeq ($(PRECISION),single) DAMASK_spectral_single.exe: DAMASK_spectral_single.o CPFEM.a $(PREFIX) $(COMPILERNAME) ${OPENMP_FLAG_${F90}} -o DAMASK_spectral_single.exe DAMASK_spectral_single.o CPFEM.a include/libfftw3f_threads.a include/libfftw3f.a\ constitutive.a advanced.a basics.a -lpthread ${BLAS_${F90}} DAMASK_spectral_single.o: DAMASK_spectral_single.f90 CPFEM.o $(PREFIX) $(COMPILERNAME) $(COMPILE_MAXOPTI) DAMASK_spectral_single.f90 $(SUFFIX) else DAMASK_spectral.exe: DAMASK_spectral.o CPFEM.a $(PREFIX) $(COMPILERNAME) ${OPENMP_FLAG_${F90}} -o DAMASK_spectral.exe DAMASK_spectral.o CPFEM.a include/libfftw3_threads.a include/libfftw3.a\ constitutive.a advanced.a basics.a -lpthread ${BLAS_${F90}} DAMASK_spectral.o: DAMASK_spectral.f90 CPFEM.o $(PREFIX) $(COMPILERNAME) $(COMPILE_MAXOPTI) DAMASK_spectral.f90 $(SUFFIX) endif CPFEM.a: CPFEM.o ar rc CPFEM.a homogenization.o homogenization_RGC.o homogenization_isostrain.o crystallite.o CPFEM.o constitutive.o CPFEM.o: CPFEM.f90 homogenization.o $(PREFIX) $(COMPILERNAME) $(COMPILE) CPFEM.f90 $(SUFFIX) homogenization.o: homogenization.f90 homogenization_isostrain.o homogenization_RGC.o crystallite.o $(PREFIX) $(COMPILERNAME) $(COMPILE) homogenization.f90 $(SUFFIX) homogenization_RGC.o: homogenization_RGC.f90 constitutive.a $(PREFIX) $(COMPILERNAME) $(COMPILE) homogenization_RGC.f90 $(SUFFIX) homogenization_isostrain.o: homogenization_isostrain.f90 basics.a advanced.a $(PREFIX) $(COMPILERNAME) $(COMPILE) homogenization_isostrain.f90 $(SUFFIX) crystallite.o: crystallite.f90 constitutive.a $(PREFIX) $(COMPILERNAME) $(COMPILE) crystallite.f90 $(SUFFIX) constitutive.a: constitutive.o ar rc constitutive.a constitutive.o constitutive_titanmod.o constitutive_nonlocal.o constitutive_dislotwin.o constitutive_j2.o constitutive_phenopowerlaw.o basics.a advanced.a constitutive.o: constitutive.f90 constitutive_titanmod.o constitutive_nonlocal.o constitutive_dislotwin.o constitutive_j2.o constitutive_phenopowerlaw.o $(PREFIX) $(COMPILERNAME) $(COMPILE) constitutive.f90 $(SUFFIX) constitutive_titanmod.o: constitutive_titanmod.f90 basics.a advanced.a $(PREFIX) $(COMPILERNAME) $(COMPILE) constitutive_titanmod.f90 $(SUFFIX) constitutive_nonlocal.o: constitutive_nonlocal.f90 basics.a advanced.a $(PREFIX) $(COMPILERNAME) $(COMPILE) constitutive_nonlocal.f90 $(SUFFIX) constitutive_dislotwin.o: constitutive_dislotwin.f90 basics.a advanced.a $(PREFIX) $(COMPILERNAME) $(COMPILE) constitutive_dislotwin.f90 $(SUFFIX) constitutive_j2.o: constitutive_j2.f90 basics.a advanced.a $(PREFIX) $(COMPILERNAME) $(COMPILE) constitutive_j2.f90 $(SUFFIX) constitutive_phenopowerlaw.o: constitutive_phenopowerlaw.f90 basics.a advanced.a $(PREFIX) $(COMPILERNAME) $(COMPILE) constitutive_phenopowerlaw.f90 $(SUFFIX) advanced.a: lattice.o ar rc advanced.a FEsolving.o mesh.o material.o lattice.o lattice.o: lattice.f90 material.o $(PREFIX) $(COMPILERNAME) $(COMPILE) lattice.f90 $(SUFFIX) material.o: material.f90 mesh.o $(PREFIX) $(COMPILERNAME) $(COMPILE) material.f90 $(SUFFIX) mesh.o: mesh.f90 FEsolving.o $(PREFIX) $(COMPILERNAME) $(COMPILE) mesh.f90 $(SUFFIX) FEsolving.o: FEsolving.f90 basics.a $(PREFIX) $(COMPILERNAME) $(COMPILE) FEsolving.f90 $(SUFFIX) ifeq ($(PRECISION),single) basics.a: debug.o math.o ar rc basics.a debug.o math.o numerics.o IO.o DAMASK_spectral_interface.o prec_single.o else basics.a: debug.o math.o ar rc basics.a debug.o math.o numerics.o IO.o DAMASK_spectral_interface.o prec.o endif debug.o: debug.f90 numerics.o $(PREFIX) $(COMPILERNAME) $(COMPILE) debug.f90 $(SUFFIX) math.o: math.f90 numerics.o $(PREFIX) $(COMPILERNAME) $(COMPILE) math.f90 $(SUFFIX) numerics.o: numerics.f90 IO.o $(PREFIX) $(COMPILERNAME) $(COMPILE) numerics.f90 $(SUFFIX) IO.o: IO.f90 DAMASK_spectral_interface.o $(PREFIX) $(COMPILERNAME) $(COMPILE) IO.f90 $(SUFFIX) ifeq ($(PRECISION),single) DAMASK_spectral_interface.o: DAMASK_spectral_interface.f90 prec_single.o $(PREFIX) $(COMPILERNAME) $(COMPILE) DAMASK_spectral_interface.f90 $(SUFFIX) prec_single.o: prec_single.f90 $(PREFIX) $(COMPILERNAME) $(COMPILE) prec_single.f90 $(SUFFIX) else DAMASK_spectral_interface.o: DAMASK_spectral_interface.f90 prec.o $(PREFIX) $(COMPILERNAME) $(COMPILE) DAMASK_spectral_interface.f90 $(SUFFIX) prec.o: prec.f90 @echo $(OPTIMIZATION) @echo $(MAXOPTI) $(PREFIX) $(COMPILERNAME) $(COMPILE) prec.f90 $(SUFFIX) endif clean: rm -rf *.o rm -rf *.mod rm -rf *.a