mirror of
https://igit.ific.uv.es/alramos/latticegpu.jl.git
synced 2025-05-15 11:43:42 +02:00
Bugs corrected
This commit is contained in:
parent
b347d33dbf
commit
e8493693b0
6 changed files with 35 additions and 21 deletions
|
@ -102,4 +102,7 @@ export krnl_plaq!, force0_wilson!
|
|||
include("YMhmc.jl")
|
||||
export gauge_action, hamiltonian, plaquette, HMC!, OMF4!
|
||||
|
||||
include("YMflow.jl")
|
||||
export wfl_euler, wfl_rk3
|
||||
|
||||
end
|
||||
|
|
|
@ -9,7 +9,7 @@
|
|||
### created: Mon Jul 12 18:31:19 2021
|
||||
###
|
||||
|
||||
function krnl_plaq!(plx, U, lp::SpaceParm{N,M,D}) where {T,N,M,D}
|
||||
function krnl_plaq!(plx, U::AbstractArray{T}, lp::SpaceParm{N,M,D}) where {T,N,M,D}
|
||||
|
||||
b, r = CUDA.threadIdx().x, CUDA.blockIdx().x
|
||||
|
||||
|
@ -17,25 +17,29 @@ function krnl_plaq!(plx, U, lp::SpaceParm{N,M,D}) where {T,N,M,D}
|
|||
|
||||
plx[b,r] = zero(plx[b,r])
|
||||
for id1 in 1:N-1
|
||||
if ru2 == r
|
||||
gt2 = Ush[bu2,1]
|
||||
else
|
||||
gt2 = U[bu2,id1,ru2]
|
||||
end
|
||||
bu1, ru1 = up((b, r), id1, lp)
|
||||
Ush[b,1] = U[b,id1,r]
|
||||
|
||||
for id2 = id1+1:N
|
||||
bu2, ru2 = up((b, r), id2, lp)
|
||||
Ush[b,2] = U[b,id2,r]
|
||||
sync_threads()
|
||||
|
||||
if ru1 == r
|
||||
gt1 = Ush[bu1,2]
|
||||
else
|
||||
gt1 = U[bu1,id2,ru1]
|
||||
end
|
||||
sync_threads()
|
||||
|
||||
bu1, ru1 = up((b, r), id1, lp)
|
||||
bu2, ru2 = up((b, r), id2, lp)
|
||||
if ru2 == r
|
||||
gt2 = Ush[bu2,1]
|
||||
else
|
||||
gt2 = U[bu2,id1,ru2]
|
||||
end
|
||||
|
||||
plx[b,r] += tr(Ush[b,1]*gt1 / (Ush[b,2]*gt2))
|
||||
end
|
||||
end
|
||||
|
||||
|
||||
return nothing
|
||||
end
|
||||
|
||||
|
|
|
@ -13,7 +13,7 @@ function wfl_euler(U, ns, eps, lp::SpaceParm, ymws::YMworkspace)
|
|||
|
||||
for i in 1:ns
|
||||
force_wilson(ymws, U, lp)
|
||||
U .= expm(U, ymws.frc1, 2*eps)
|
||||
U .= expm.(U, ymws.frc1, 2*eps)
|
||||
end
|
||||
|
||||
return nothing
|
||||
|
@ -25,18 +25,18 @@ function wfl_rk3(U, ns, eps, lp::SpaceParm, ymws::YMworkspace)
|
|||
c0 = eps/2
|
||||
force_wilson(ymws, U, lp)
|
||||
ymws.mom .= ymws.frc1
|
||||
U .= expm(U, ymws.mom, c0)
|
||||
U .= expm.(U, ymws.mom, c0)
|
||||
|
||||
c0 = -34*eps/36
|
||||
c1 = 16*eps/9
|
||||
force_wilson(ymws, U, lp)
|
||||
ymws.mom .= c0.*ymws.mom .+ c1.*ymws.frc1
|
||||
U .= expm(U, ymws.mom)
|
||||
U .= expm.(U, ymws.mom)
|
||||
|
||||
c1 = 6*eps/4
|
||||
force_wilson(ymws, U, lp)
|
||||
ymws.mom .= c1.*ymws.frc1 .- ymws.mom
|
||||
U .= expm(U, ymws.mom)
|
||||
U .= expm.(U, ymws.mom)
|
||||
end
|
||||
|
||||
return nothing
|
||||
|
|
|
@ -15,7 +15,7 @@
|
|||
|
||||
Returns the value of the Wilson plaquette action for the configuration U.
|
||||
"""
|
||||
function gauge_action(U, lp::SpaceParm, gp::GaugeParm{T}, ymws::YMworkspace{T}) where T <: A
|
||||
function gauge_action(U, lp::SpaceParm, gp::GaugeParm{T}, ymws::YMworkspace{T}) where T <: AbstractFloat
|
||||
|
||||
CUDA.@sync begin
|
||||
CUDA.@cuda threads=lp.bsz blocks=lp.rsz krnl_plaq!(ymws.cm, U, lp)
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue