|
1 | 1 | struct Copy{P} end
|
2 | 2 | function (::Copy{P})(p::Ptr{UInt}) where {P}
|
3 |
| - _, (ptry,ptrx,N) = ThreadingUtilities.load(p, P, 2*sizeof(UInt)) |
4 |
| - N > 0 || throw("This function throws if N == 0 for testing purposes.") |
5 |
| - @simd ivdep for n ∈ 1:N |
6 |
| - vstore!(ptry, vload(ptrx, (n,)), (n,)) |
7 |
| - end |
| 3 | + _, (ptry,ptrx,N) = ThreadingUtilities.load(p, P, 2*sizeof(UInt)) |
| 4 | + N > 0 || throw("This function throws if N == 0 for testing purposes.") |
| 5 | + @simd ivdep for n ∈ 1:N |
| 6 | + vstore!(ptry, vload(ptrx, (n,)), (n,)) |
| 7 | + end |
8 | 8 | end
|
9 | 9 | @generated function copy_ptr(::A, ::B) where {A,B}
|
10 |
| - c = Copy{Tuple{A,B,Int}}() |
11 |
| - quote |
12 |
| - @cfunction($c, Cvoid, (Ptr{UInt},)) |
13 |
| - end |
| 10 | + c = Copy{Tuple{A,B,Int}}() |
| 11 | + quote |
| 12 | + @cfunction($c, Cvoid, (Ptr{UInt},)) |
| 13 | + end |
14 | 14 | end
|
15 | 15 | function setup_copy!(p, y, x)
|
16 |
| - N = length(y) |
17 |
| - @assert length(x) == N |
18 |
| - py = stridedpointer(y) |
19 |
| - px = stridedpointer(x) |
20 |
| - fptr = copy_ptr(py, px) |
21 |
| - offset = ThreadingUtilities.store!(p, fptr, sizeof(UInt)) |
22 |
| - ThreadingUtilities.store!(p, (py,px,N), offset) |
| 16 | + N = length(y) |
| 17 | + @assert length(x) == N |
| 18 | + py = stridedpointer(y) |
| 19 | + px = stridedpointer(x) |
| 20 | + fptr = copy_ptr(py, px) |
| 21 | + offset = ThreadingUtilities.store!(p, fptr, sizeof(UInt)) |
| 22 | + ThreadingUtilities.store!(p, (py,px,N), offset) |
23 | 23 | end
|
24 | 24 |
|
25 |
| -@inline function launch_thread_copy!(tid, y, x) |
26 |
| - ThreadingUtilities.launch(tid, y, x) do p, y, x |
27 |
| - setup_copy!(p, y, x) |
28 |
| - end |
29 |
| -end |
| 25 | +@inline launch_thread_copy!(tid, y, x) = ThreadingUtilities.launch(setup_copy!, tid, y, x) |
30 | 26 |
|
31 | 27 | function test_copy(tid, N = 100_000)
|
32 |
| - a = rand(N); |
33 |
| - b = rand(N); |
34 |
| - c = rand(N); |
35 |
| - x = similar(a) .= NaN; |
36 |
| - y = similar(b) .= NaN; |
37 |
| - z = similar(c) .= NaN; |
38 |
| - GC.@preserve a b c x y z begin |
39 |
| - launch_thread_copy!(tid, x, a) |
40 |
| - yield() |
41 |
| - @assert !ThreadingUtilities.wait(tid) |
42 |
| - launch_thread_copy!(tid, y, b) |
43 |
| - yield() |
44 |
| - @assert !ThreadingUtilities.wait(tid) |
45 |
| - launch_thread_copy!(tid, z, c) |
46 |
| - yield() |
47 |
| - @assert !ThreadingUtilities.wait(ThreadingUtilities.taskpointer(tid)) |
48 |
| - end |
49 |
| - @test a == x |
50 |
| - @test b == y |
51 |
| - @test c == z |
| 28 | + a = rand(N); |
| 29 | + b = rand(N); |
| 30 | + c = rand(N); |
| 31 | + x = similar(a) .= NaN; |
| 32 | + y = similar(b) .= NaN; |
| 33 | + z = similar(c) .= NaN; |
| 34 | + GC.@preserve a b c x y z begin |
| 35 | + launch_thread_copy!(tid, x, a) |
| 36 | + yield() |
| 37 | + @assert !ThreadingUtilities.wait(tid) |
| 38 | + launch_thread_copy!(tid, y, b) |
| 39 | + yield() |
| 40 | + @assert !ThreadingUtilities.wait(tid) |
| 41 | + launch_thread_copy!(tid, z, c) |
| 42 | + yield() |
| 43 | + @assert !ThreadingUtilities.wait(ThreadingUtilities.taskpointer(tid)) |
| 44 | + end |
| 45 | + @test a == x |
| 46 | + @test b == y |
| 47 | + @test c == z |
52 | 48 | end
|
53 | 49 |
|
54 | 50 | @testset "ThreadingUtilities.jl" begin
|
|
0 commit comments