Skip to content

Commit 7517e60

Browse files
authored
Merge pull request #33 from JuliaSIMD/intializefor32bit
Tests pass locally on 32 bit
2 parents 2f7177e + c287e36 commit 7517e60

File tree

5 files changed

+53
-43
lines changed

5 files changed

+53
-43
lines changed

src/ThreadingUtilities.jl

+14-1
Original file line numberDiff line numberDiff line change
@@ -37,17 +37,30 @@ function initialize_task(tid)
3737
# set to tid, we have tasks 2...nthread, from 1-based ind perspective
3838
ccall(:jl_set_task_tid, Cvoid, (Any, Cint), t, tid % Cint)
3939
TASKS[tid] = t
40+
return nothing
4041
end
4142

43+
if Sys.WORD_SIZE == 32
44+
retnothing(::Ptr{UInt}) = nothing
45+
end
4246
function __init__()
4347
_print_exclusivity_warning()
4448
nt = min(Threads.nthreads(), (Sys.CPU_THREADS)::Int) - 1
4549
resize!(THREADPOOL, (THREADBUFFERSIZE ÷ sizeof(UInt)) * nt + (LINESPACING ÷ sizeof(UInt)) - 1)
4650
copyto!(THREADPOOL, zero(UInt))
4751
# align to LINESPACING boundary, and then subtract THREADBUFFERSIZE to make the pointer 1-indexed
48-
THREADPOOLPTR[] = reinterpret(Ptr{UInt}, (reinterpret(UInt, (pointer(THREADPOOL)))+LINESPACING-1) & (-LINESPACING)) - THREADBUFFERSIZE
52+
THREADPOOLPTR[] = reinterpret(Ptr{UInt}, (reinterpret(UInt, pointer(THREADPOOL))+LINESPACING-1) & (-LINESPACING)) - THREADBUFFERSIZE
4953
resize!(TASKS, nt)
5054
foreach(initialize_task, 1:nt)
55+
@static if Sys.WORD_SIZE == 32
56+
if nt > 0
57+
fptr = @cfunction(retnothing, Cvoid, (Ptr{UInt},))
58+
store!(taskpointer(1), fptr, sizeof(UInt))
59+
_atomic_xchg!(taskpointer(1), TASK)
60+
wake_thread!(1)
61+
wait(1)
62+
end
63+
end
5164
end
5265

5366
end # module

src/threadtasks.jl

+1
Original file line numberDiff line numberDiff line change
@@ -56,6 +56,7 @@ end
5656
if istaskfailed(t)
5757
display(t)
5858
dump(t)
59+
println()
5960
initialize_task(tid)
6061
return true
6162
end

test/aqua.jl

+1
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,4 @@
1+
import Aqua
12
@testset "Aqua.jl" begin
23
@time Aqua.test_all(ThreadingUtilities)
34
end

test/testsetup.jl

-1
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,5 @@ using ThreadingUtilities
22
using Test
33
using VectorizationBase
44

5-
import Aqua
65
import InteractiveUtils
76

test/threadingutilities.jl

+37-41
Original file line numberDiff line numberDiff line change
@@ -1,54 +1,50 @@
11
struct Copy{P} end
22
function (::Copy{P})(p::Ptr{UInt}) where {P}
3-
_, (ptry,ptrx,N) = ThreadingUtilities.load(p, P, 2*sizeof(UInt))
4-
N > 0 || throw("This function throws if N == 0 for testing purposes.")
5-
@simd ivdep for n 1:N
6-
vstore!(ptry, vload(ptrx, (n,)), (n,))
7-
end
3+
_, (ptry,ptrx,N) = ThreadingUtilities.load(p, P, 2*sizeof(UInt))
4+
N > 0 || throw("This function throws if N == 0 for testing purposes.")
5+
@simd ivdep for n 1:N
6+
vstore!(ptry, vload(ptrx, (n,)), (n,))
7+
end
88
end
99
@generated function copy_ptr(::A, ::B) where {A,B}
10-
c = Copy{Tuple{A,B,Int}}()
11-
quote
12-
@cfunction($c, Cvoid, (Ptr{UInt},))
13-
end
10+
c = Copy{Tuple{A,B,Int}}()
11+
quote
12+
@cfunction($c, Cvoid, (Ptr{UInt},))
13+
end
1414
end
1515
function setup_copy!(p, y, x)
16-
N = length(y)
17-
@assert length(x) == N
18-
py = stridedpointer(y)
19-
px = stridedpointer(x)
20-
fptr = copy_ptr(py, px)
21-
offset = ThreadingUtilities.store!(p, fptr, sizeof(UInt))
22-
ThreadingUtilities.store!(p, (py,px,N), offset)
16+
N = length(y)
17+
@assert length(x) == N
18+
py = stridedpointer(y)
19+
px = stridedpointer(x)
20+
fptr = copy_ptr(py, px)
21+
offset = ThreadingUtilities.store!(p, fptr, sizeof(UInt))
22+
ThreadingUtilities.store!(p, (py,px,N), offset)
2323
end
2424

25-
@inline function launch_thread_copy!(tid, y, x)
26-
ThreadingUtilities.launch(tid, y, x) do p, y, x
27-
setup_copy!(p, y, x)
28-
end
29-
end
25+
@inline launch_thread_copy!(tid, y, x) = ThreadingUtilities.launch(setup_copy!, tid, y, x)
3026

3127
function test_copy(tid, N = 100_000)
32-
a = rand(N);
33-
b = rand(N);
34-
c = rand(N);
35-
x = similar(a) .= NaN;
36-
y = similar(b) .= NaN;
37-
z = similar(c) .= NaN;
38-
GC.@preserve a b c x y z begin
39-
launch_thread_copy!(tid, x, a)
40-
yield()
41-
@assert !ThreadingUtilities.wait(tid)
42-
launch_thread_copy!(tid, y, b)
43-
yield()
44-
@assert !ThreadingUtilities.wait(tid)
45-
launch_thread_copy!(tid, z, c)
46-
yield()
47-
@assert !ThreadingUtilities.wait(ThreadingUtilities.taskpointer(tid))
48-
end
49-
@test a == x
50-
@test b == y
51-
@test c == z
28+
a = rand(N);
29+
b = rand(N);
30+
c = rand(N);
31+
x = similar(a) .= NaN;
32+
y = similar(b) .= NaN;
33+
z = similar(c) .= NaN;
34+
GC.@preserve a b c x y z begin
35+
launch_thread_copy!(tid, x, a)
36+
yield()
37+
@assert !ThreadingUtilities.wait(tid)
38+
launch_thread_copy!(tid, y, b)
39+
yield()
40+
@assert !ThreadingUtilities.wait(tid)
41+
launch_thread_copy!(tid, z, c)
42+
yield()
43+
@assert !ThreadingUtilities.wait(ThreadingUtilities.taskpointer(tid))
44+
end
45+
@test a == x
46+
@test b == y
47+
@test c == z
5248
end
5349

5450
@testset "ThreadingUtilities.jl" begin

0 commit comments

Comments
 (0)