Working multi-precision simulations

Simulations of the pure gauge theory with the groups SU(2) and SU(3)
now work properly.
This commit is contained in:
Alberto Ramos 2021-09-20 18:21:16 +02:00
parent 1416efdbee
commit 09a09153b9
8 changed files with 188 additions and 283 deletions

View file

@ -9,7 +9,7 @@
### created: Thu Jul 15 11:27:28 2021
###
function gauge_action(U, lp::SpaceParm, gp::GaugeParm, ymws::YMworkspace)
function gauge_action(U, lp::SpaceParm, gp::GaugeParm{T}, ymws::YMworkspace{T}) where T <: AbstractFloat
CUDA.@sync begin
CUDA.@cuda threads=lp.bsz blocks=lp.rsz krnl_plaq!(ymws.cm, U, lp)
@ -32,7 +32,7 @@ function plaquette(U, lp::SpaceParm, gp::GaugeParm, ymws::YMworkspace)
end
function hamiltonian(mom, U, lp, gp, ymws)
K = norm_field(mom)/2.0
K = CUDA.mapreduce(norm2, +, mom)/2
V = gauge_action(U, lp, gp, ymws)
println("K: ", K, " V: ", V)
return K+V
@ -42,7 +42,7 @@ function HMC!(U, eps, ns, lp::SpaceParm, gp::GaugeParm, ymws::YMworkspace; noacc
ymws.U1 .= U
randomn!(ymws.mom, lp)
randomize!(ymws.mom, lp, ymws)
hini = hamiltonian(ymws.mom, U, lp, gp, ymws)
OMF4!(ymws.mom, U, eps, ns, lp, gp, ymws)
@ -78,14 +78,14 @@ function krnl_updt!(mom, frc1, frc2, eps1, U, eps2, lp::SpaceParm)
return nothing
end
function OMF4!(mom, U, eps, ns, lp::SpaceParm, gp::GaugeParm, ymws::YMworkspace)
function OMF4!(mom, U, eps, ns, lp::SpaceParm, gp::GaugeParm{T}, ymws::YMworkspace{T}) where T <: AbstractFloat
r1::Float64 = 0.08398315262876693
r2::Float64 = 0.2539785108410595
r3::Float64 = 0.6822365335719091
r4::Float64 = -0.03230286765269967
r5::Float64 = 0.5-r1-r3
r6::Float64 = 1.0-2.0*(r2+r4)
r1::T = 0.08398315262876693
r2::T = 0.2539785108410595
r3::T = 0.6822365335719091
r4::T = -0.03230286765269967
r5::T = 0.5-r1-r3
r6::T = 1.0-2.0*(r2+r4)
# ee = eps*gp.beta/gp.ng
# @device_code_warntype force0_wilson!(ymws.frc1,ymws.frc2, U, lp, gp)
@ -129,36 +129,35 @@ function OMF4!(mom, U, eps, ns, lp::SpaceParm, gp::GaugeParm, ymws::YMworkspace)
# end
ee = eps*gp.beta/gp.ng
force0_wilson!(ymws.frc1, U, lp)
zero!(ymws.frc2, lp)
force0_wilson_pln!(ymws.frc1, ymws.frc2, U, lp)
for i in 1:ns
# STEP 1
mom .= mom .+ (r1*ee) .* (ymws.frc1 .+ ymws.frc2)
mom .= mom .+ (r1*ee) .* ymws.frc1
U .= expm.(U, mom, eps*r2)
# STEP 2
force0_wilson!(ymws.frc1, U, lp)
mom .= mom .+ (r3*ee) .* (ymws.frc1 .+ ymws.frc2)
force0_wilson_pln!(ymws.frc1, ymws.frc2, U, lp)
mom .= mom .+ (r3*ee) .* ymws.frc1
U .= expm.(U, mom, eps*r4)
# STEP 3
force0_wilson!(ymws.frc1, U, lp)
mom .= mom .+ (r5*ee) .* (ymws.frc1 .+ ymws.frc2)
force0_wilson_pln!(ymws.frc1, ymws.frc2, U, lp)
mom .= mom .+ (r5*ee) .* ymws.frc1
U .= expm.(U, mom, eps*r6)
# STEP 4
force0_wilson!(ymws.frc1, U, lp)
mom .= mom .+ (r5*ee) .* (ymws.frc1 .+ ymws.frc2)
force0_wilson_pln!(ymws.frc1, ymws.frc2, U, lp)
mom .= mom .+ (r5*ee) .* ymws.frc1
U .= expm.(U, mom, eps*r4)
# STEP 5
force0_wilson!(ymws.frc1, U, lp)
mom .= mom .+ (r3*ee) .* (ymws.frc1 .+ ymws.frc2)
force0_wilson_pln!(ymws.frc1, ymws.frc2, U, lp)
mom .= mom .+ (r3*ee) .* ymws.frc1
U .= expm.(U, mom, eps*r2)
# STEP 6
force0_wilson!(ymws.frc1, U, lp)
mom .= mom .+ (r1*ee) .* (ymws.frc1 .+ ymws.frc2)
force0_wilson_pln!(ymws.frc1, ymws.frc2, U, lp)
mom .= mom .+ (r1*ee) .* ymws.frc1
end
return nothing