Simplified algorithm of crystallite_integrateStress while preserving (almost) same functionality.

Removed "leapfrogging" (increase of step for next guess, when last guess was ok); Replaced Armijo rule testing for step size by simple check if the residuum got better, since the former virtually did not have any effect; consistently using the 2-norm of the residuum rather than infinity-norm for the convergence check throughout the function
This commit is contained in:
Christoph Kords 2012-11-06 12:35:45 +00:00
parent 1583ae74c3
commit bb033c5fe7
2 changed files with 36 additions and 113 deletions

View File

@ -2731,8 +2731,7 @@ use debug, only: debug_level, &
debug_g, & debug_g, &
debug_cumLpCalls, & debug_cumLpCalls, &
debug_cumLpTicks, & debug_cumLpTicks, &
debug_StressLoopDistribution, & debug_StressLoopDistribution
debug_LeapfrogBreakDistribution
use constitutive, only: constitutive_LpAndItsTangent, & use constitutive, only: constitutive_LpAndItsTangent, &
constitutive_TandItsTangent, & constitutive_TandItsTangent, &
constitutive_homogenizedC constitutive_homogenizedC
@ -2779,7 +2778,6 @@ real(pReal), dimension(3,3):: Fg_new, &
residuum, & ! current residuum of plastic velocity gradient residuum, & ! current residuum of plastic velocity gradient
residuum_old, & ! last residuum of plastic velocity gradient residuum_old, & ! last residuum of plastic velocity gradient
deltaLp, & ! direction of next guess deltaLp, & ! direction of next guess
gradientR, & ! derivative of the residuum norm
Tstar,& ! 2nd Piola-Kirchhoff Stress Tstar,& ! 2nd Piola-Kirchhoff Stress
A,& A,&
B, & B, &
@ -2796,10 +2794,8 @@ real(pReal), dimension(3,3,3,3):: dT_dFe3333, &
dFe_dLp3333 ! partial derivative of elastic deformation gradient dFe_dLp3333 ! partial derivative of elastic deformation gradient
real(pReal) p_hydro, & ! volumetric part of 2nd Piola-Kirchhoff Stress real(pReal) p_hydro, & ! volumetric part of 2nd Piola-Kirchhoff Stress
det, & ! determinant det, & ! determinant
expectedImprovement, &
steplength0, & steplength0, &
steplength, & steplength, &
steplength_max, &
dt, & ! time increment dt, & ! time increment
aTol aTol
logical error ! flag indicating an error logical error ! flag indicating an error
@ -2854,14 +2850,11 @@ invFp_current = math_inv33(Fp_current)
if (all(invFp_current == 0.0_pReal)) then ! ... failed? if (all(invFp_current == 0.0_pReal)) then ! ... failed?
#ifndef _OPENMP #ifndef _OPENMP
if (iand(debug_level(debug_crystallite), debug_levelBasic) /= 0_pInt) then if (iand(debug_level(debug_crystallite), debug_levelBasic) /= 0_pInt) then
write(6,'(a,i8,1x,i2,1x,i3)') '<< CRYST >> integrateStress failed on invFp_current inversion at el ip g ',e,i,g write(6,'(a,i8,1x,i2,1x,i3)') '<< CRYST >> integrateStress failed on inversion of Fp_current at el ip g ',e,i,g
! QUESTION: all FP_current == 0.0, why reporting FP_new ?? if (iand(debug_level(debug_crystallite), debug_levelExtensive) > 0_pInt) then
! if (iand(debug_level(debug_crystallite), debug_levelSelective) > 0_pInt & write(6,*)
! .and. ((e == debug_e .and. i == debug_i .and. g == debug_g) & write(6,'(a,/,3(12x,3(f12.7,1x)/))') '<< CRYST >> Fp_current',math_transpose33(Fp_current(1:3,1:3))
! .or. .not. iand(debug_level(debug_crystallite), debug_levelSelective) /= 0_pInt)) then endif
! write(6,*)
! write(6,'(a,/,3(12x,3(f12.7,1x)/))') '<< CRYST >> invFp_new',math_transpose33(invFp_new(1:3,1:3))
! endif
endif endif
#endif #endif
return return
@ -2874,8 +2867,8 @@ A = math_mul33x33(Fg_new,invFp_current) ! int
NiterationStress = 0_pInt NiterationStress = 0_pInt
jacoCounter = 0_pInt jacoCounter = 0_pInt
steplength0 = 1.0_pReal steplength0 = 1.0_pReal
steplength_max = 16.0_pReal
steplength = steplength0 steplength = steplength0
residuum_old = huge(1.0_pReal)
LpLoop: do LpLoop: do
NiterationStress = NiterationStress + 1_pInt NiterationStress = NiterationStress + 1_pInt
@ -2935,15 +2928,11 @@ LpLoop: do
!* update current residuum and check for convergence of loop !* update current residuum and check for convergence of loop
aTol = max(rTol_crystalliteStress * max(math_norm33(Lpguess),math_norm33(Lp_constitutive)), & ! absolute tolerance from largest acceptable relative error
aTol_crystalliteStress) ! minimum lower cutoff
residuum = Lpguess - Lp_constitutive residuum = Lpguess - Lp_constitutive
aTol = max(rTol_crystalliteStress * maxval(max(abs(Lpguess),abs(Lp_constitutive))), & ! absolute tolerance from largest acceptable relative error
aTol_crystalliteStress) ! minimum lower cutoff
if (.not. any(residuum /= residuum) & ! no convergence if NaN in residuum
.and. maxval(abs(residuum)) < aTol ) exit LpLoop ! converged if all below absolute tolerance...
!* NaN occurred at regular speed -> return if (any(residuum /= residuum)) then ! NaN in residuum...
if (steplength <= steplength0 .and. any(residuum /= residuum)) then
#ifndef _OPENMP #ifndef _OPENMP
if (iand(debug_level(debug_crystallite), debug_levelBasic) /= 0_pInt) then if (iand(debug_level(debug_crystallite), debug_levelBasic) /= 0_pInt) then
write(6,'(a,i8,1x,i2,1x,i3,a,i3,a)') '<< CRYST >> integrateStress encountered NaN at el ip g ',e,i,g,& write(6,'(a,i8,1x,i2,1x,i3,a,i3,a)') '<< CRYST >> integrateStress encountered NaN at el ip g ',e,i,g,&
@ -2951,68 +2940,21 @@ LpLoop: do
' >> returning..!' ' >> returning..!'
endif endif
#endif #endif
return ! me = .false. to inform integrator about problem return ! ...me = .false. to inform integrator about problem
elseif (math_norm33(residuum) < aTol) then ! converged if below absolute tolerance
exit LpLoop ! ...leave iteration loop
elseif (math_norm33(residuum) > math_norm33(residuum_old)) then ! not converged and worse residuum...
steplength = 0.5_pReal * steplength ! ...try with smaller step length in same direction
Lpguess = Lpguess_old + steplength * deltaLp
cycle LpLoop
else ! not converged, but improved norm of residuum...
residuum_old = residuum ! ...remember old values and...
Lpguess_old = Lpguess
steplength = steplength0 ! ...proceed with normal step length (calculate new search direction)
endif endif
if (NiterationStress > 1_pInt) then !* calculate Jacobian for correction term
!* not at regular speed
if (steplength <= steplength0) then
!* Armijo rule is fullfilled (norm of residuum was reduced by at least 0.01 of what was expected)
if (math_norm33(residuum) <= math_norm33(residuum_old) + 0.01_pReal * steplength * expectedImprovement) then
if (steplength < steplength0) then
steplength = steplength0 ! return to normal step length
elseif (sum(residuum * residuum_old) >= 0.0_pReal) then
steplength = min(steplength_max,steplength + 1.0_pReal) ! no change in sign of residuum -> accelerate up to maximum speed
endif
!* Armijo rule not fullfilled -> try smaller step size in same direction
else
steplength = 0.5_pReal * steplength
Lpguess = Lpguess_old + steplength * deltaLp
cycle LpLoop
endif
!* at high-speed
else
!* no NaN, Armijo rule fullfilled, and sign of residuum did not change -> accelerate if not yet at maximum speed
if (.not. any(residuum /= residuum) &
.and. math_norm33(residuum) <= math_norm33(residuum_old) + 0.01_pReal * steplength * expectedImprovement &
.and. sum(residuum * residuum_old) >= 0.0_pReal) then
steplength = min(steplength_max,steplength + 1.0_pReal) ! accelerate up to maximum speed
!* something went wrong at accelerated speed? -> return to regular speed and try again
else
#ifndef _OPENMP
if (iand(debug_level(debug_crystallite), debug_levelExtensive) /= 0_pInt) then
write(6,'(a,i8,1x,i2,1x,i3,1x,a,i3)') '<< CRYST >> integrateStress encountered high-speed crash at el ip g ',e,i,g,&
'; iteration ', NiterationStress
endif
#endif
if (iand(debug_level(debug_crystallite), debug_levelBasic) /= 0_pInt) then
!$OMP CRITICAL (distributionLeapfrogBreak)
debug_LeapfrogBreakDistribution(NiterationStress,numerics_integrationMode) = &
debug_LeapfrogBreakDistribution(NiterationStress,numerics_integrationMode) + 1_pInt
!$OMP END CRITICAL (distributionLeapfrogBreak)
endif
!* NaN occured -> use old guess and residuum
if (any(residuum /= residuum)) then
Lpguess = Lpguess_old
residuum = residuum_old
endif
steplength_max = max(steplength - 1.0_pReal, 1.0_pReal) ! limit acceleration
steplength = steplength0 ! grinding halt
jacoCounter = 0_pInt ! reset counter for Jacobian update (we want to do an update next time!)
endif
endif
endif
!* calculate Jacobian for correction term and remember current residuum and Lpguess
if (mod(jacoCounter, iJacoLpresiduum) == 0_pInt) then if (mod(jacoCounter, iJacoLpresiduum) == 0_pInt) then
dFe_dLp3333 = 0.0_pReal dFe_dLp3333 = 0.0_pReal
@ -3024,12 +2966,12 @@ LpLoop: do
dT_dFe_constitutive = math_Plain3333to99(dT_dFe3333) dT_dFe_constitutive = math_Plain3333to99(dT_dFe3333)
dR_dLp = math_identity2nd(9_pInt) - & dR_dLp = math_identity2nd(9_pInt) - &
math_mul99x99(dLp_dT_constitutive, math_mul99x99(dT_dFe_constitutive , dFe_dLp)) math_mul99x99(dLp_dT_constitutive, math_mul99x99(dT_dFe_constitutive , dFe_dLp))
dR_dLp2 = dR_dLp ! will be overwritten in first call to LAPACK routine dR_dLp2 = dR_dLp ! will be overwritten in first call to LAPACK routine
work = math_plain33to9(residuum) work = math_plain33to9(residuum)
#if(FLOAT==8) #if(FLOAT==8)
call dgesv(9,1,dR_dLp2,9,ipiv,work,9,ierr) ! solve dR/dLp * delta Lp = -res for dR/dLp call dgesv(9,1,dR_dLp2,9,ipiv,work,9,ierr) ! solve dR/dLp * delta Lp = -res for dR/dLp
#elif(FLOAT==4) #elif(FLOAT==4)
call sgesv(9,1,dR_dLp2,9,ipiv,work,9,ierr) ! solve dR/dLp * delta Lp = -res for dR/dLp call sgesv(9,1,dR_dLp2,9,ipiv,work,9,ierr) ! solve dR/dLp * delta Lp = -res for dR/dLp
#endif #endif
if (ierr /= 0_pInt) then if (ierr /= 0_pInt) then
#ifndef _OPENMP #ifndef _OPENMP
@ -3052,19 +2994,10 @@ LpLoop: do
#endif #endif
return return
endif endif
deltaLp = - math_plain9to33(work) deltaLp = - math_plain9to33(work)
gradientR = 0.0_pReal
do k=1_pInt,3_pInt; do l=1_pInt,3_pInt; do m=1_pInt,3_pInt; do n=1_pInt,3_pInt
gradientR(k,l) = gradientR(k,l) + dR_dLp(3*(k-1)+l,3_pInt*(m-1_pInt)+n) * residuum(m,n)
enddo; enddo; enddo; enddo
gradientR = gradientR / math_norm33(gradientR)
expectedImprovement = math_mul33xx33(deltaLp, gradientR)
endif endif
jacoCounter = jacoCounter + 1_pInt ! increase counter for jaco update jacoCounter = jacoCounter + 1_pInt ! increase counter for jaco update
residuum_old = residuum
Lpguess_old = Lpguess
Lpguess = Lpguess + steplength * deltaLp Lpguess = Lpguess + steplength * deltaLp
enddo LpLoop enddo LpLoop

View File

@ -92,7 +92,6 @@ module debug
integer(pInt), dimension(:,:), allocatable, public :: & integer(pInt), dimension(:,:), allocatable, public :: &
debug_StressLoopDistribution, & ! distribution of stress iterations until convergence debug_StressLoopDistribution, & ! distribution of stress iterations until convergence
debug_LeapfrogBreakDistribution, & ! distribution of iterations where leapfrog breaks occurred
debug_StateLoopDistribution ! distribution of state iterations until convergence debug_StateLoopDistribution ! distribution of state iterations until convergence
real(pReal), public :: & real(pReal), public :: &
@ -151,10 +150,6 @@ subroutine debug_init
deallocate(debug_StressLoopDistribution) deallocate(debug_StressLoopDistribution)
allocate(debug_StressLoopDistribution(nStress+1,2)) allocate(debug_StressLoopDistribution(nStress+1,2))
debug_StressLoopDistribution = 0_pInt debug_StressLoopDistribution = 0_pInt
if (allocated(debug_LeapfrogBreakDistribution)) &
deallocate(debug_LeapfrogBreakDistribution)
allocate(debug_LeapfrogBreakDistribution(nStress+1,2))
debug_LeapfrogBreakDistribution = 0_pInt
if (allocated(debug_StateLoopDistribution)) & if (allocated(debug_StateLoopDistribution)) &
deallocate(debug_StateLoopDistribution) deallocate(debug_StateLoopDistribution)
allocate(debug_StateLoopDistribution(nState+1,2)) allocate(debug_StateLoopDistribution(nState+1,2))
@ -326,7 +321,6 @@ subroutine debug_reset
implicit none implicit none
debug_StressLoopDistribution = 0_pInt ! initialize debugging data debug_StressLoopDistribution = 0_pInt ! initialize debugging data
debug_LeapfrogBreakDistribution = 0_pInt
debug_StateLoopDistribution = 0_pInt debug_StateLoopDistribution = 0_pInt
debug_CrystalliteLoopDistribution = 0_pInt debug_CrystalliteLoopDistribution = 0_pInt
debug_MaterialpointStateLoopDistribution = 0_pInt debug_MaterialpointStateLoopDistribution = 0_pInt
@ -411,21 +405,18 @@ subroutine debug_info
integral = 0_pInt integral = 0_pInt
write(6,*) write(6,*)
write(6,*) write(6,*)
write(6,*) 'distribution_StressLoop : stress frogbreak stiffness frogbreak' write(6,*) 'distribution_StressLoop : stress stiffness'
do i=1_pInt,nStress+1_pInt do i=1_pInt,nStress+1_pInt
if (any(debug_StressLoopDistribution(i,:) /= 0_pInt ) .or. & if (any(debug_StressLoopDistribution(i,:) /= 0_pInt )) then
any(debug_LeapfrogBreakDistribution(i,:) /= 0_pInt ) ) then
integral = integral + i*(debug_StressLoopDistribution(i,1) + debug_StressLoopDistribution(i,2)) integral = integral + i*(debug_StressLoopDistribution(i,1) + debug_StressLoopDistribution(i,2))
exceed = ' ' exceed = ' '
if (i > nStress) exceed = '+' ! last entry gets "+" if (i > nStress) exceed = '+' ! last entry gets "+"
write(6,'(i25,a1,i10,1x,i10,1x,i10,1x,i10)') min(nStress,i),exceed, & write(6,'(i25,a1,i10,1x,i10)') min(nStress,i),exceed,debug_StressLoopDistribution(i,1),&
debug_StressLoopDistribution(i,1),debug_LeapfrogBreakDistribution(i,1), & debug_StressLoopDistribution(i,2)
debug_StressLoopDistribution(i,2),debug_LeapfrogBreakDistribution(i,2)
endif endif
enddo enddo
write(6,'(a15,i10,1x,i10,12x,i10)') ' total',integral,& write(6,'(a15,i10,2(1x,i10))') ' total',integral,sum(debug_StressLoopDistribution(:,1)), &
sum(debug_StressLoopDistribution(:,1)), & sum(debug_StressLoopDistribution(:,2))
sum(debug_StressLoopDistribution(:,2))
integral = 0_pInt integral = 0_pInt
write(6,*) write(6,*)
@ -435,13 +426,12 @@ subroutine debug_info
integral = integral + i*(debug_StateLoopDistribution(i,1) + debug_StateLoopDistribution(i,2)) integral = integral + i*(debug_StateLoopDistribution(i,1) + debug_StateLoopDistribution(i,2))
exceed = ' ' exceed = ' '
if (i > nState) exceed = '+' ! last entry gets "+" if (i > nState) exceed = '+' ! last entry gets "+"
write(6,'(i25,a1,i10,12x,i10)') min(nState,i),exceed, & write(6,'(i25,a1,i10,1x,i10)') min(nState,i),exceed,debug_StateLoopDistribution(i,1),&
debug_StateLoopDistribution(i,1),debug_StateLoopDistribution(i,2) debug_StateLoopDistribution(i,2)
endif endif
enddo enddo
write(6,'(a15,i10,1x,i10,12x,i10)') ' total',integral,& write(6,'(a15,i10,2(1x,i10))') ' total',integral,sum(debug_StateLoopDistribution(:,1)), &
sum(debug_StateLoopDistribution(:,1)), & sum(debug_StateLoopDistribution(:,2))
sum(debug_StateLoopDistribution(:,2))
integral = 0_pInt integral = 0_pInt
write(6,*) write(6,*)