438 lines
21 KiB
Makefile
438 lines
21 KiB
Makefile
# Run all recipes with the POSIX shell, independent of the user's login shell.
SHELL := /bin/sh
|
|
########################################################################################
|
|
# Makefile to compile the Material subroutine for BVP solution using spectral method
|
|
########################################################################################
|
|
# Be sure to remove all files compiled with different options by using "make clean"
|
|
#
|
|
# Uses OpenMP to parallelize the material subroutines
|
|
# (set number of threads with "export DAMASK_NUM_THREADS=n" to n)
|
|
#
|
|
# Install fftw3 (v3.3 is tested):
|
|
# + execute
|
|
# ./configure --enable-threads --enable-sse2 --enable-shared
|
|
# make
|
|
# make install
|
|
# + specify in the "pathinfo:FFTW" where FFTW was installed.
|
|
# We essentially look for two library files "lib/libfftw3_threads" and "lib/libfftw3",
|
|
# so you can copy those, for instance,
|
|
# into DAMASK_ROOT/lib/fftw/lib/ and specify "./fftw/" as pathinfo:FFTW
|
|
# Uses linux threads to parallelize fftw3
|
|
#
|
|
# Instead of the AMD Core Math Library or the Intel Math Kernel Library
|
|
# a standard "lib(64)/liblapack.a/dylib/etc." can be used.
|
|
# leave pathinfo:ACML and pathinfo:IMKL blank, but specify as pathinfo:LAPACK where the library folder is located
|
|
########################################################################################
|
|
# OPTIONS = standard (alternative): meaning
|
|
#-------------------------------------------------------------
|
|
# F90 = ifort (gfortran): compiler, choose Intel or GNU
|
|
# COMPILERNAME = overwrite name of Compiler, e.g. using mpich-g90 instead of ifort
|
|
# PORTABLE = TRUE (FALSE): decision, if executable is optimized for the machine on which it was built.
|
|
# OPTIMIZATION = DEFENSIVE (OFF,AGGRESSIVE,ULTRA): Optimization mode: O2, O0, O3 + further options for most files, O3 + further options for all files
|
|
# OPENMP = ON (OFF): OpenMP multiprocessor support
|
|
# FFTWROOT = pathinfo:FFTW (will be adjusted by setup_code.py - required in pathinfo)
|
|
# IMKLROOT = pathinfo:IMKL (will be adjusted by setup_code.py if present in pathinfo)
|
|
# ACMLROOT = pathinfo:ACML (will be adjusted by setup_code.py if present in pathinfo)
|
|
# LAPACKROOT = pathinfo:LAPACK (will be adjusted by setup_code.py if present in pathinfo)
|
|
# PREFIX = arbitrary prefix
|
|
# SUFFIX = arbitrary suffix
|
|
# STANDARD_CHECK = checking for Fortran 2008, compiler dependent
|
|
########################################################################################
|
|
|
|
# Library roots; any values will be overwritten by setup_code.py.
# "?=" only assigns when the variable has not been set already.
FFTWROOT   ?= auto
IMKLROOT   ?= auto
ACMLROOT   ?= auto
LAPACKROOT ?= auto

# Compiler family; selects the *_ifort / *_gfortran flag sets below.
F90 ?= ifort

# Executable that is actually invoked; defaults to the compiler family name.
COMPILERNAME ?= $(F90)

INCLUDE_DIRS += -I$(DAMASK_ROOT)/lib
|
|
|
|
# FASTBUILD=YES forces OpenMP and optimisation off; otherwise both default to
# ON / DEFENSIVE unless they were set beforehand.
ifneq "$(FASTBUILD)" "YES"
OPENMP       ?= ON
OPTIMIZATION ?= DEFENSIVE
else
OPENMP       := OFF
OPTIMIZATION := OFF
endif

# Map OPTIMIZATION onto the two levels consumed further down:
#   OPTI    -> $(COMPILE)
#   MAXOPTI -> $(COMPILE_MAXOPTI) and the link step
ifeq "$(OPTIMIZATION)" "OFF"
OPTI    := OFF
MAXOPTI := OFF
else ifeq "$(OPTIMIZATION)" "DEFENSIVE"
OPTI    := DEFENSIVE
MAXOPTI := DEFENSIVE
else ifeq "$(OPTIMIZATION)" "AGGRESSIVE"
OPTI    := AGGRESSIVE
MAXOPTI := DEFENSIVE
else ifeq "$(OPTIMIZATION)" "ULTRA"
OPTI    := AGGRESSIVE
MAXOPTI := AGGRESSIVE
endif

# Unrecognised OPTIMIZATION value: fall back to the defensive level.
ifndef OPTI
OPTI    := DEFENSIVE
MAXOPTI := DEFENSIVE
endif
|
|
|
|
# PORTABLE=FALSE adds -msse3 to the AGGRESSIVE optimisation flag sets.
ifeq "$(PORTABLE)" "FALSE"
PORTABLE_SWITCH = -msse3
endif

# Linear algebra backend: ACML if its root is set, otherwise plain LAPACK.
# $(ACML_ARCH) is assigned further down, so these must stay deferred ("+=" on
# a not-yet-defined variable creates a recursively expanded one).
ifdef ACMLROOT
LIB_DIRS  += -L$(ACMLROOT)/$(F90)64$(ACML_ARCH)/lib
LIBRARIES += -lacml$(ACML_ARCH)
else ifdef LAPACKROOT
LIB_DIRS  += -L$(LAPACKROOT)/lib64 -L$(LAPACKROOT)/lib
LIBRARIES += -llapack
endif

# With ifort and an MKL root, MKL replaces (":=") whatever was selected above.
COMPILE_OPTIONS_ifort :=
ifeq "$(F90)" "ifort"
ifdef IMKLROOT
COMPILE_OPTIONS_ifort += -I$(IMKLROOT)/include -mkl=sequential
LIBRARIES := -lmkl_intel_lp64 -lmkl_sequential -lmkl_core -lm
LIB_DIRS  := -L$(IMKLROOT)/lib/intel64
endif
endif
|
|
|
|
# Multicore support: per-compiler OpenMP flags, the "_mp" suffix that is
# inserted into the ACML directory/library names, and the threaded FFTW library.
ifeq "$(OPENMP)" "ON"
OPENMP_FLAG_ifort    = -openmp -openmp-report0 -parallel
OPENMP_FLAG_gfortran = -fopenmp
ACML_ARCH            = _mp
LIBRARIES           += -lfftw3_threads -lpthread
endif

# FFTW itself is always linked.
LIBRARIES += -lfftw3
LIB_DIRS  += -L$(FFTWROOT)/lib
|
|
|
|
|
|
# Optional PETSc support: pull in PETSc's own make variables and define the
# PETSc preprocessor symbol for the Fortran sources.
ifdef PETSC_DIR
include $(PETSC_DIR)/conf/variables
INCLUDE_DIRS += $(PETSC_FC_INCLUDES) -DPETSc
LIBRARIES    += $(PETSC_WITH_EXTERNAL_LIB)
endif
|
|
|
|
# A user-supplied STANDARD_CHECK is used verbatim for both compilers.
ifdef STANDARD_CHECK
STANDARD_CHECK_ifort    = $(STANDARD_CHECK)
STANDARD_CHECK_gfortran = $(STANDARD_CHECK)
endif

# Otherwise enforce Fortran 2008, except when FASTBUILD=YES.
ifneq "$(FASTBUILD)" "YES"
STANDARD_CHECK_ifort    ?= -stand f08 -standard-semantics -warn stderrors
STANDARD_CHECK_gfortran ?= -std=f2008 -Wintrinsics-std
endif
|
|
#-std=f2008ts: for newer gfortran
|
|
#-Wintrinsics-std: only standard intrinsics are available, e.g. "call flush(6)" will cause an error
|
|
|
|
# Optimisation flag table, looked up as OPTIMIZATION_<level>_<compiler>.
OPTIMIZATION_OFF_ifort            := -O0 -no-ip
OPTIMIZATION_OFF_gfortran         := -O0

OPTIMIZATION_DEFENSIVE_ifort      := -O2
OPTIMIZATION_DEFENSIVE_gfortran   := -O2

OPTIMIZATION_AGGRESSIVE_ifort     := -O3 $(PORTABLE_SWITCH) -no-prec-div -fp-model fast=2 -ipo #-static causes trouble at the moment
OPTIMIZATION_AGGRESSIVE_gfortran  := -O3 $(PORTABLE_SWITCH) -ffast-math -funroll-loops -ftree-vectorize
|
|
|
|
|
|
# Flags that are always passed to ifort (see the COMPILE SWITCHES notes below).
COMPILE_OPTIONS_ifort += -fpp \
                         -ftz \
                         -assume byterecl

# Extra compile-time diagnostics, skipped when FASTBUILD=YES.
# Only the new flags are listed: "+=" already keeps the current value, so
# naming $(COMPILE_OPTIONS_ifort) on the right-hand side again would pass every
# earlier flag twice (and would be a fatal self-reference if the variable were
# ever turned into a recursively expanded one).
ifneq "$(FASTBUILD)" "YES"
COMPILE_OPTIONS_ifort += -implicitnone \
                         -diag-enable sc3 \
                         -diag-disable 5268 \
                         -warn declarations \
                         -warn general \
                         -warn usage \
                         -warn interfaces \
                         -warn ignore_loc \
                         -warn alignments \
                         -warn unused \
                         -warn errors
endif
|
|
###################################################################################################
|
|
#COMPILE SWITCHES
|
|
#-fpp: preprocessor
|
|
#-ftz: flush underflow to zero, automatically set if O<0,1,2,3> >0
|
|
#-implicitnone: assume "implicit-none" even if not present in source
|
|
#-diag-disable: disables warnings, where
|
|
# warning ID 5268: the text exceeds right hand column allowed on the line (we have only comments there)
|
|
#-warn: enables warnings, where
|
|
# declarations: any undeclared names
|
|
# general: warning messages and informational messages are issued by the compiler
|
|
# usage: questionable programming practices
|
|
# interfaces: checks the interfaces of all SUBROUTINEs called and FUNCTIONs invoked in your compilation against an external set of interface blocks
|
|
# ignore_loc: %LOC is stripped from an actual argument
|
|
# alignments: data that is not naturally aligned
|
|
# unused: declared variables that are never used
|
|
# errors: warnings are changed to errors
|
|
# stderrors: warnings about Fortran standard violations are changed to errors (STANDARD_CHECK)
|
|
#
|
|
###################################################################################################
|
|
#MORE OPTIONS FOR DEBUGGING DURING COMPILATION
|
|
#-warn: enables warnings, where
|
|
# truncated_source: Determines whether warnings occur when source exceeds the maximum column width in fixed-format files. (too many warnings because we have comments beyond character 132)
|
|
# uncalled: Determines whether warnings occur when a statement function is never called
|
|
# all:
|
|
|
|
# ifort flags added when DEBUG=ON (explained in the notes that follow).
DEBUG_OPTIONS_ifort := -g -traceback -gen-interfaces -fp-stack-check -check bounds,format,output_conversion,pointers,uninit
|
|
###################################################################################################
|
|
#COMPILE SWITCHES FOR RUNTIME DEBUGGING
|
|
#-g: Generate symbolic debugging information in the object file
|
|
#-traceback: Generate extra information in the object file to provide source file traceback information when a severe error occurs at run time.
|
|
#-gen-interfaces: Generate an interface block for each routine. http://software.intel.com/en-us/blogs/2012/01/05/doctor-fortran-gets-explicit-again/
|
|
#-fp-stack-check: Generate extra code after every function call to ensure that the floating-point (FP) stack is in the expected state.
|
|
#-check: checks at runtime, where
|
|
# bounds: check if an array index is too small (<1) or too large!
|
|
# format: Checking for the data type of an item being formatted for output.
|
|
# output_conversion: Checking for the fit of data items within a designated format descriptor field.
|
|
# pointers: Checking for certain disassociated or uninitialized pointers or unallocated allocatable objects.
|
|
# uninit: Checking for uninitialized variables.
|
|
#-fpe-all0 capture all floating-point exceptions, sets -ftz automatically
|
|
# information on http://software.intel.com/en-us/articles/determining-root-cause-of-sigsegv-or-sigbus-errors/
|
|
###################################################################################################
|
|
#MORE OPTIONS FOR RUNTIME DEBUGGING
|
|
#-heap-arrays: should not be done for OpenMP, but set "ulimit -s unlimited" on shell. Probably it helps also to unlimit other limits
|
|
#-check: checks at runtime, where
|
|
# arg_temp_created: will cause a lot of warnings because we create a bunch of temporary arrays (performance?)
|
|
|
|
|
|
# Flag that is always passed to gfortran: run the preprocessor.
COMPILE_OPTIONS_gfortran := -xf95-cpp-input

# Extra compile-time diagnostics, skipped when FASTBUILD=YES.
# Only the new flags are listed: "+=" already keeps the current value, so
# naming $(COMPILE_OPTIONS_gfortran) on the right-hand side again would pass
# -xf95-cpp-input twice.
ifneq "$(FASTBUILD)" "YES"
COMPILE_OPTIONS_gfortran += -ffree-line-length-132 \
                            -fimplicit-none \
                            -pedantic \
                            -Warray-bounds \
                            -Wampersand \
                            -Wno-tabs \
                            -Wcharacter-truncation \
                            -Wintrinsic-shadow \
                            -Waliasing \
                            -Wconversion \
                            -Wsurprising \
                            -Wunderflow \
                            -Wswitch \
                            -Wstrict-overflow \
                            -Wattributes \
                            -Wunsafe-loop-optimizations \
                            -Wunused \
                            -Wall \
                            -Wextra \
                            -Wsuggest-attribute=const \
                            -Wsuggest-attribute=pure \
                            -Wsuggest-attribute=noreturn \
                            -Wreal-q-constant \
                            -pedantic-errors
endif
|
|
###################################################################################################
|
|
#COMPILE SWITCHES
|
|
#-xf95-cpp-input: preprocessor
|
|
#-ffree-line-length-132: restrict line length to the standard 132 characters
|
|
#-fno-range-check: disables checking if result can be represented by variable. Needs to be set to enable DAMASK_NaN
|
|
#-fimplicit-none: assume "implicit-none" even if not present in source
|
|
#-pedantic: more strict on standard, enables some of the warnings below
|
|
#-Warray-bounds: checks if array reference is out of bounds at compile time. use -fcheck-bounds to also check during runtime
|
|
#-Wampersand: checks if a character expression is continued properly by an ampersand at the end of the line and at the beginning of the new line
|
|
#-Wno-tabs: do not allow tabs in source
|
|
#-Wcharacter-truncation: warn if character expressions (strings) are truncated
|
|
#-Wintrinsic-shadow: warn if a user-defined procedure or module procedure has the same name as an intrinsic
|
|
#-Waliasing: warn about possible aliasing of dummy arguments. Specifically, it warns if the same actual argument is associated with a dummy argument with "INTENT(IN)" and a dummy argument with "INTENT(OUT)" in a call with an explicit interface.
|
|
#-Wconversion: warn about implicit conversions between different type
|
|
#-Wsurprising: warn when "suspicious" code constructs are encountered. While technically legal these usually indicate that an error has been made.
|
|
#-Wunderflow: produce a warning when numerical constant expressions are encountered, which yield an UNDERFLOW during compilation
|
|
#-Wswitch: warn whenever a "switch" statement has an index of enumerated type and lacks a "case" for one or more of the named codes of that enumeration. (The presence of a "default" label prevents this warning.) "case" labels outside the enumeration range also provoke warnings when this option is used (even if there is a "default" label)
|
|
#-Wstrict-overflow:
|
|
#-Wattributes: warn about inappropriate attribute usage
|
|
#-Wunsafe-loop-optimizations: warn if the loop cannot be optimized due to nontrivial assumptions.
|
|
#-Wunused:
|
|
# -value:
|
|
# -parameter: find unused variables with "parameter" attribute
|
|
#-Wextra:
|
|
#-Wsuggest-attribute=const:
|
|
#-Wsuggest-attribute=noreturn:
|
|
#-Wsuggest-attribute=pure:
|
|
#-Wreal-q-constant: warn about real-literal-constants with 'q' exponent-letter
|
|
#-pedantic-errors:
|
|
###################################################################################################
|
|
#MORE OPTIONS FOR RUNTIME DEBUGGING
|
|
#-Wline-truncation: too many warnings because we have comments beyond character 132
|
|
#-Warray-temporaries: too many warnings because we have many temporary arrays (performance issue?)
|
|
#-Wimplicit-interface:
|
|
#-fmodule-private:
|
|
|
|
# gfortran flags added when DEBUG=ON (explained in the notes that follow).
DEBUG_OPTIONS_gfortran := -g -fbacktrace -fbounds-check -ffpe-trap=invalid,zero,overflow
|
|
###################################################################################################
|
|
#COMPILE SWITCHES FOR RUNTIME DEBUGGING
|
|
#-fbounds-check: check if an array index is too small (<1) or too large!
|
|
#-ffpe-trap=invalid,\ stop execution if floating point exception is detected (NaN is silent)
|
|
# zero,\
|
|
# overflow,\
|
|
# underflow
|
|
###################################################################################################
|
|
#COMPILE SWITCHES FOR RUNTIME DEBUGGING
|
|
#-fbounds-check: check if an array index is too small (<1) or too large!
|
|
#-ffpe-trap=precision,\
|
|
# denormal, \
|
|
# underflow
|
|
|
|
# DEBUG=ON: extend the selected compiler's options with its debug flag set.
ifeq "$(DEBUG)" "ON"
COMPILE_OPTIONS_$(F90) += $(DEBUG_OPTIONS_$(F90))
endif
|
|
|
|
# Default kinds per compiler; -DFLOAT / -DINT hand the same sizes to the preprocessor.
#
# ifort:
#   -real-size 32:    set precision to one of those 32/64/128 (= 4/8/16 bytes) for standard real (=8 for pReal)
#   -integer-size 16: set precision to one of those 16/32/64 (= 2/4/8 bytes) for standard integer (=4 for pInt)
PRECISION_ifort    := -real-size 64 -integer-size 32 -DFLOAT=8 -DINT=4

# gfortran (flags explained in the notes that follow):
PRECISION_gfortran := -fdefault-real-8 -fdefault-double-8 -DFLOAT=8 -DINT=4
|
|
#-fdefault-real-8: set precision to 8 bytes for standard real (=8 for pReal). Will set size of double to 16 bytes as long as -fdefault-double-8 is not set
|
|
#-fdefault-double-8: set precision to 8 bytes for double real, would be 16 bytes because -fdefault-real-8 is used
|
|
#-fdefault-integer-8: Use it to set precision to 8 bytes for integer, don't use it for the standard case of pInt=4 (there is no -fdefault-integer-4)
|
|
|
|
###################################################################################################
|
|
# Complete compiler argument lists. Both are recursively expanded ("=") so
# they pick up the final values of every variable they reference.
# COMPILE uses the OPTI level, COMPILE_MAXOPTI the MAXOPTI level.
COMPILE         = $(OPENMP_FLAG_$(F90)) \
                  $(COMPILE_OPTIONS_$(F90)) \
                  $(STANDARD_CHECK_$(F90)) \
                  $(OPTIMIZATION_$(OPTI)_$(F90)) \
                  $(INCLUDE_DIRS) \
                  $(PRECISION_$(F90)) \
                  -DSpectral

COMPILE_MAXOPTI = $(OPENMP_FLAG_$(F90)) \
                  $(COMPILE_OPTIONS_$(F90)) \
                  $(STANDARD_CHECK_$(F90)) \
                  $(OPTIMIZATION_$(MAXOPTI)_$(F90)) \
                  $(INCLUDE_DIRS) \
                  $(PRECISION_$(F90)) \
                  -DSpectral
|
|
###################################################################################################
|
|
# Object files handed to the linker in addition to the driver object.
COMPILED_FILES  = prec.o DAMASK_spectral_interface.o IO.o numerics.o debug.o math.o
COMPILED_FILES += FEsolving.o mesh.o material.o lattice.o
COMPILED_FILES += constitutive_dislotwin.o constitutive_j2.o constitutive_phenopowerlaw.o
COMPILED_FILES += constitutive_titanmod.o constitutive_nonlocal.o constitutive_none.o constitutive.o crystallite.o
COMPILED_FILES += homogenization_RGC.o homogenization_isostrain.o homogenization.o CPFEM.o
COMPILED_FILES += DAMASK_spectral_utilities.o DAMASK_spectral_solverBasic.o

# The PETSc-based solvers are only built when PETSC_DIR is set.
ifdef PETSC_DIR
PETSC_FILES     = DAMASK_spectral_solverAL.o DAMASK_spectral_solverBasicPETSc.o
COMPILED_FILES += $(PETSC_FILES)
endif
|
|
|
|
|
|
# Link the executable. Only the driver object is a direct prerequisite; the
# objects in $(COMPILED_FILES) are reached through the driver's dependency chain.
DAMASK_spectral.exe: DAMASK_spectral_driver.o
	$(PREFIX) $(COMPILERNAME) $(OPENMP_FLAG_$(F90)) $(OPTIMIZATION_$(MAXOPTI)_$(F90)) $(STANDARD_CHECK_$(F90)) \
	    -o $@ $< \
	    $(COMPILED_FILES) $(LIB_DIRS) $(LIBRARIES) $(SUFFIX)

# The driver is compiled with the MAXOPTI flag set.
DAMASK_spectral_driver.o: DAMASK_spectral_driver.f90 DAMASK_spectral_solverBasic.o $(PETSC_FILES)
	$(PREFIX) $(COMPILERNAME) $(COMPILE_MAXOPTI) -c $< $(SUFFIX)
|
|
|
|
# Prerequisite-only rules; the recipe comes from the "%.o : %.f90" pattern rule.
DAMASK_spectral_solverAL.o:         DAMASK_spectral_solverAL.f90         DAMASK_spectral_utilities.o

DAMASK_spectral_solverBasic.o:      DAMASK_spectral_solverBasic.f90      DAMASK_spectral_utilities.o

DAMASK_spectral_solverBasicPETSc.o: DAMASK_spectral_solverBasicPETSc.f90 DAMASK_spectral_utilities.o

DAMASK_spectral_utilities.o:        DAMASK_spectral_utilities.f90        CPFEM.o

CPFEM.o:                            CPFEM.f90                            homogenization.o
|
|
|
|
# Prerequisite-only rules; the recipe comes from the "%.o : %.f90" pattern rule.
homogenization.o: homogenization.f90 homogenization_RGC.o homogenization_isostrain.o

homogenization_RGC.o: homogenization_RGC.f90 crystallite.o

homogenization_isostrain.o: homogenization_isostrain.f90 crystallite.o

crystallite.o: crystallite.f90 constitutive.o

constitutive.o: constitutive.f90 \
                constitutive_nonlocal.o constitutive_titanmod.o constitutive_dislotwin.o \
                constitutive_phenopowerlaw.o constitutive_j2.o constitutive_none.o
|
|
|
|
# Every constitutive model needs lattice.o; recipes come from the pattern rule.
constitutive_nonlocal.o:      constitutive_nonlocal.f90      lattice.o

constitutive_titanmod.o:      constitutive_titanmod.f90      lattice.o

constitutive_dislotwin.o:     constitutive_dislotwin.f90     lattice.o

constitutive_phenopowerlaw.o: constitutive_phenopowerlaw.f90 lattice.o

constitutive_j2.o:            constitutive_j2.f90            lattice.o

constitutive_none.o:          constitutive_none.f90          lattice.o
|
|
|
|
# Low-level module chain; recipes come from the "%.o : %.f90" pattern rule.
lattice.o:   lattice.f90   material.o

material.o:  material.f90  mesh.o

mesh.o:      mesh.f90      FEsolving.o math.o

FEsolving.o: FEsolving.f90 debug.o

math.o:      math.f90      debug.o

debug.o:     debug.f90     numerics.o

numerics.o:  numerics.f90  IO.o

IO.o:        IO.f90        DAMASK_spectral_interface.o
|
|
# prec and the spectral interface need extra switches under gfortran.
ifeq "$(F90)" "gfortran"
#-fall-intrinsics: all intrinsic procedures (including the GNU-specific extensions) are accepted. -Wintrinsics-std will be ignored
#                  and no user-defined procedure with the same name as any intrinsic will be called except when it is explicitly declared external
#                  --> allows the use of 'getcwd'
DAMASK_spectral_interface.o: DAMASK_spectral_interface.f90 prec.o
	$(PREFIX) $(COMPILERNAME) $(COMPILE) -c -fall-intrinsics $< $(SUFFIX)

#-fno-range-check: Disable range checking on results of simplification of constant expressions during compilation
#                  --> allows the definition of DAMASK_NaN
prec.o: prec.f90
	$(PREFIX) $(COMPILERNAME) $(COMPILE) -c -fno-range-check $< $(SUFFIX)
else
# No recipe here: the interface object is built by the pattern rule below.
DAMASK_spectral_interface.o: DAMASK_spectral_interface.f90 prec.o

prec.o: prec.f90
	$(PREFIX) $(COMPILERNAME) $(COMPILE) -c $< $(SUFFIX)
endif

# Generic rule: compile any Fortran source with the standard flag set.
%.o: %.f90
	$(PREFIX) $(COMPILERNAME) $(COMPILE) -c $< $(SUFFIX)
|
|
|
|
# tidy and clean are commands, not files: declare them phony so that a file or
# directory with one of these names can never make the target look up to date.
.PHONY: tidy clean

# Remove intermediate build products (objects and Fortran module files).
tidy:
	@rm -rf *.o
	@rm -rf *.mod

# Remove everything tidy removes, plus the linked executables.
clean: tidy
	@rm -rf *.exe
|