Skip to content

Commit 88566e5

Browse files
Ian AtolIan Atol
Ian Atol
authored and
Ian Atol
committed
Implement broadcast, memory_opt! performance improvements, additional tests
Add a couple allocation test cases Improvements to memory_opt, change jl_typeof attribute, always-copy on BoundsError Whitespace, fix copy in BoundsError contstructor
1 parent fcbafaa commit 88566e5

File tree

9 files changed

+494
-31
lines changed

9 files changed

+494
-31
lines changed

base/abstractarray.jl

+4
Original file line numberDiff line numberDiff line change
@@ -1073,6 +1073,10 @@ function copy(a::AbstractArray)
10731073
copymutable(a)
10741074
end
10751075

1076+
function copy(a::Core.ImmutableArray)
1077+
a
1078+
end
1079+
10761080
function copyto!(B::AbstractVecOrMat{R}, ir_dest::AbstractRange{Int}, jr_dest::AbstractRange{Int},
10771081
A::AbstractVecOrMat{S}, ir_src::AbstractRange{Int}, jr_src::AbstractRange{Int}) where {R,S}
10781082
if length(ir_dest) != length(ir_src)

base/array.jl

+38-6
Original file line numberDiff line numberDiff line change
@@ -118,6 +118,35 @@ Union type of [`DenseVector{T}`](@ref) and [`DenseMatrix{T}`](@ref).
118118
"""
119119
const DenseVecOrMat{T} = Union{DenseVector{T}, DenseMatrix{T}}
120120

121+
"""
122+
ImmutableArray
123+
124+
Dynamically allocated, immutable array.
125+
126+
"""
127+
const ImmutableArray = Core.ImmutableArray
128+
129+
"""
130+
IMArray{T,N}
131+
132+
Union type of [`Array{T,N}`](@ref) and [`ImmutableArray{T,N}`](@ref)
133+
"""
134+
const IMArray{T,N} = Union{Array{T, N}, ImmutableArray{T,N}}
135+
136+
"""
137+
IMVector{T}
138+
139+
One-dimensional [`ImmutableArray`](@ref) or [`Array`](@ref) with elements of type `T`. Alias for `IMArray{T, 1}`.
140+
"""
141+
const IMVector{T} = IMArray{T, 1}
142+
143+
"""
144+
IMMatrix{T}
145+
146+
Two-dimensional [`ImmutableArray`](@ref) or [`Array`](@ref) with elements of type `T`. Alias for `IMArray{T,2}`.
147+
"""
148+
const IMMatrix{T} = IMArray{T, 2}
149+
121150
## Basic functions ##
122151

123152
import Core: arraysize, arrayset, arrayref, const_arrayref
@@ -147,14 +176,13 @@ function vect(X...)
147176
return copyto!(Vector{T}(undef, length(X)), X)
148177
end
149178

150-
const ImmutableArray = Core.ImmutableArray
151-
const IMArray{T,N} = Union{Array{T, N}, ImmutableArray{T,N}}
152-
const IMVector{T} = IMArray{T, 1}
153-
const IMMatrix{T} = IMArray{T, 2}
154-
179+
# Freeze and thaw constructors
155180
ImmutableArray(a::Array) = Core.arrayfreeze(a)
156181
Array(a::ImmutableArray) = Core.arraythaw(a)
157182

183+
ImmutableArray(a::AbstractArray{T,N}) where {T,N} = ImmutableArray{T,N}(a)
184+
185+
# Size functions for arrays, both mutable and immutable
158186
size(a::IMArray, d::Integer) = arraysize(a, convert(Int, d))
159187
size(a::IMVector) = (arraysize(a,1),)
160188
size(a::IMMatrix) = (arraysize(a,1), arraysize(a,2))
@@ -393,6 +421,9 @@ similar(a::Array{T}, m::Int) where {T} = Vector{T}(undef, m)
393421
similar(a::Array, T::Type, dims::Dims{N}) where {N} = Array{T,N}(undef, dims)
394422
similar(a::Array{T}, dims::Dims{N}) where {T,N} = Array{T,N}(undef, dims)
395423

424+
ImmutableArray{T}(undef::UndefInitializer, m::Int) where T = ImmutableArray(Array{T}(undef, m))
425+
ImmutableArray{T}(undef::UndefInitializer, dims::Dims) where T = ImmutableArray(Array{T}(undef, dims))
426+
396427
# T[x...] constructs Array{T,1}
397428
"""
398429
getindex(type[, elements...])
@@ -626,8 +657,8 @@ oneunit(x::AbstractMatrix{T}) where {T} = _one(oneunit(T), x)
626657

627658
## Conversions ##
628659

629-
convert(::Type{T}, a::AbstractArray) where {T<:Array} = a isa T ? a : T(a)
630660
convert(::Type{Union{}}, a::AbstractArray) = throw(MethodError(convert, (Union{}, a)))
661+
convert(T::Union{Type{<:Array},Type{<:Core.ImmutableArray}}, a::AbstractArray) = a isa T ? a : T(a)
631662

632663
promote_rule(a::Type{Array{T,n}}, b::Type{Array{S,n}}) where {T,n,S} = el_same(promote_type(T,S), a, b)
633664

@@ -637,6 +668,7 @@ if nameof(@__MODULE__) === :Base # avoid method overwrite
637668
# constructors should make copies
638669
Array{T,N}(x::AbstractArray{S,N}) where {T,N,S} = copyto_axcheck!(Array{T,N}(undef, size(x)), x)
639670
AbstractArray{T,N}(A::AbstractArray{S,N}) where {T,N,S} = copyto_axcheck!(similar(A,T), A)
671+
ImmutableArray{T,N}(Ar::AbstractArray{S,N}) where {T,N,S} = Core.arrayfreeze(copyto_axcheck!(Array{T,N}(undef, size(Ar)), Ar))
640672
end
641673

642674
## copying iterators to containers

base/boot.jl

+14-2
Original file line numberDiff line numberDiff line change
@@ -279,9 +279,21 @@ struct BoundsError <: Exception
279279
a::Any
280280
i::Any
281281
BoundsError() = new()
282-
BoundsError(@nospecialize(a)) = (@_noinline_meta; new(a))
283-
BoundsError(@nospecialize(a), i) = (@_noinline_meta; new(a,i))
282+
# For now, always* copy to avoid escaping a
283+
# Eventually, we want to figure out if the copy is needed to save the performance of copying
284+
285+
# * to avoid throwing a MethodError and breaking many test suites, first check if copy is defined for a
286+
287+
#BoundsError(@nospecialize(a)) = (@_noinline_meta; new(a))
288+
BoundsError(@nospecialize(a)) = Main.Base.hasmethod(Main.Base.copy, Tuple{typeof(a)}) ?
289+
(@_noinline_meta; new(Main.Base.copy(a))) :
290+
(@_noinline_meta; new(a))
291+
#BoundsError(@nospecialize(a), i) = (@_noinline_meta; new(a, i))
292+
BoundsError(@nospecialize(a), i) = Main.Base.hasmethod(Main.Base.copy, Tuple{typeof(a)}) ?
293+
(@_noinline_meta; new(Main.Base.copy(a), i)) :
294+
(@_noinline_meta; new(a, i))
284295
end
296+
285297
struct DivideError <: Exception end
286298
struct OutOfMemoryError <: Exception end
287299
struct ReadOnlyMemoryError <: Exception end

base/broadcast.jl

+13
Original file line numberDiff line numberDiff line change
@@ -1385,4 +1385,17 @@ function Base.show(io::IO, op::BroadcastFunction)
13851385
end
13861386
Base.show(io::IO, ::MIME"text/plain", op::BroadcastFunction) = show(io, op)
13871387

1388+
struct IMArrayStyle <: Broadcast.AbstractArrayStyle{Any} end
1389+
BroadcastStyle(::Type{<:Core.ImmutableArray}) = IMArrayStyle()
1390+
1391+
#similar has to return mutable array
1392+
function Base.similar(bc::Broadcasted{IMArrayStyle}, ::Type{ElType}) where ElType
1393+
similar(Array{ElType}, axes(bc))
1394+
end
1395+
1396+
@inline function copy(bc::Broadcasted{IMArrayStyle})
1397+
ElType = combine_eltypes(bc.f, bc.args)
1398+
return Core.ImmutableArray(copyto!(similar(bc, ElType), bc))
1399+
end
1400+
13881401
end # module

base/compiler/optimize.jl

+1
Original file line numberDiff line numberDiff line change
@@ -307,6 +307,7 @@ function run_passes(ci::CodeInfo, sv::OptimizationState)
307307
ir = adce_pass!(ir)
308308
#@Base.show ("after_adce", ir)
309309
@timeit "type lift" ir = type_lift_pass!(ir)
310+
#@timeit "compact 3" ir = compact!(ir)
310311
ir = memory_opt!(ir)
311312
#@Base.show ir
312313
if JLOptions().debug_level == 2

base/compiler/ssair/passes.jl

+162-18
Original file line numberDiff line numberDiff line change
@@ -1256,23 +1256,47 @@ function cfg_simplify!(ir::IRCode)
12561256
return finish(compact)
12571257
end
12581258

1259-
function is_allocation(stmt)
1259+
# function is_known_fcall(stmt::Expr, @nospecialize(func))
1260+
# isexpr(stmt, :foreigncall) || return false
1261+
# s = stmt.args[1]
1262+
# isa(s, QuoteNode) && (s = s.value)
1263+
# return s === func
1264+
# end
1265+
1266+
function is_known_fcall(stmt::Expr, funcs::Vector{Symbol})
12601267
isexpr(stmt, :foreigncall) || return false
12611268
s = stmt.args[1]
12621269
isa(s, QuoteNode) && (s = s.value)
1263-
return s === :jl_alloc_array_1d
1270+
# return any(e -> s === e, funcs)
1271+
return true in map(e -> s === e, funcs)
1272+
end
1273+
1274+
function is_allocation(stmt::Expr)
1275+
isexpr(stmt, :foreigncall) || return false
1276+
s = stmt.args[1]
1277+
isa(s, QuoteNode) && (s = s.value)
1278+
return (s === :jl_alloc_array_1d
1279+
|| s === :jl_alloc_array_2d
1280+
|| s === :jl_alloc_array_3d
1281+
|| s === :jl_new_array)
12641282
end
12651283

12661284
function memory_opt!(ir::IRCode)
12671285
compact = IncrementalCompact(ir, false)
12681286
uses = IdDict{Int, Vector{Int}}()
1269-
relevant = IdSet{Int}()
1270-
revisit = Int[]
1271-
function mark_val(val)
1287+
relevant = IdSet{Int}() # allocations
1288+
revisit = Int[] # potential targets for a mutating_arrayfreeze drop-in
1289+
1290+
function mark_escape(@nospecialize val)
12721291
isa(val, SSAValue) || return
1292+
#println(val.id, " escaped.")
12731293
val.id in relevant && pop!(relevant, val.id)
12741294
end
1295+
12751296
for ((_, idx), stmt) in compact
1297+
1298+
#println("idx: ", idx, " = ", stmt)
1299+
12761300
if isa(stmt, ReturnNode)
12771301
isdefined(stmt, :val) || continue
12781302
val = stmt.val
@@ -1281,51 +1305,171 @@ function memory_opt!(ir::IRCode)
12811305
push!(uses[val.id], idx)
12821306
end
12831307
continue
1308+
1309+
# check for phinodes that are possibly allocations
1310+
elseif isa(stmt, PhiNode)
1311+
1312+
# this loop seems like a waste, but using map here didn't go well
1313+
defined = true
1314+
for i = 1:length(stmt.values)
1315+
if !isassigned(stmt.values, i)
1316+
defined = false
1317+
end
1318+
end
1319+
1320+
defined || continue
1321+
1322+
for val in stmt.values
1323+
if isa(val, SSAValue) && val.id in relevant
1324+
#println("Adding ", idx ," to relevant from PhiNode: " , stmt)
1325+
push!(relevant, idx)
1326+
end
1327+
end
12841328
end
1329+
12851330
(isexpr(stmt, :call) || isexpr(stmt, :foreigncall)) || continue
1331+
12861332
if is_allocation(stmt)
12871333
push!(relevant, idx)
12881334
# TODO: Mark everything else here
12891335
continue
12901336
end
1291-
# TODO: Replace this by interprocedural escape analysis
1292-
if is_known_call(stmt, arrayset, compact)
1337+
1338+
if is_known_call(stmt, arrayset, compact) && length(stmt.args) >= 5
12931339
# The value being set escapes, everything else doesn't
1294-
mark_val(stmt.args[4])
1340+
mark_escape(stmt.args[4])
1341+
1342+
arr = stmt.args[3]
1343+
1344+
if isa(arr, SSAValue) && arr.id in relevant
1345+
(haskey(uses, arr.id)) || (uses[arr.id] = Int[])
1346+
push!(uses[arr.id], idx)
1347+
end
1348+
1349+
elseif is_known_call(stmt, arrayref, compact) && length(stmt.args) == 4
12951350
arr = stmt.args[3]
1351+
1352+
if isa(arr, SSAValue) && arr.id in relevant
1353+
(haskey(uses, arr.id)) || (uses[arr.id] = Int[])
1354+
push!(uses[arr.id], idx)
1355+
end
1356+
1357+
elseif is_known_call(stmt, setindex!, compact) && length(stmt.args) == 4
1358+
#println("setindex!: ", stmt.args)
1359+
# handle similarly to arrayset
1360+
# escape the value being set
1361+
val = stmt.args[3]
1362+
mark_escape(val)
1363+
# track usage of arr for dominance analysis
1364+
arr = stmt.args[2]
1365+
if isa(arr, SSAValue) && arr.id in relevant
1366+
(haskey(uses, arr.id)) || (uses[arr.id] = Int[])
1367+
push!(uses[arr.id], idx)
1368+
end
1369+
1370+
# these foreigncalls have similar structure and don't escape our array, so handle them all at once
1371+
elseif is_known_fcall(stmt, [:jl_array_ptr, :jl_array_copy]) && length(stmt.args) == 6
1372+
#println("is_known_fcall: ", stmt)
1373+
arr = stmt.args[6]
1374+
1375+
# just record usage info
12961376
if isa(arr, SSAValue) && arr.id in relevant
12971377
(haskey(uses, arr.id)) || (uses[arr.id] = Int[])
12981378
push!(uses[arr.id], idx)
12991379
end
1380+
1381+
# elseif is_known_fcall(stmt, :jl_array_ptr) && length(stmt.args) == 6
1382+
# arr = stmt.args[6]
1383+
1384+
# if isa(arr, SSAValue) && arr.id in relevant
1385+
# (haskey(uses, arr.id)) || (uses[arr.id] = Int[])
1386+
# push!(uses[arr.id], idx)
1387+
# end
1388+
1389+
# elseif is_known_fcall(stmt, :jl_array_copy) && length(stmt.args) == 6
1390+
# arr = stmt.args[6]
1391+
1392+
# if isa(arr, SSAValue) && arr.id in relevant
1393+
# (haskey(uses, arr.id)) || (uses[arr.id] = Int[])
1394+
# push!(uses[arr.id], idx)
1395+
# end
1396+
1397+
elseif is_known_call(stmt, arraysize, compact) && isa(stmt.args[2], SSAValue) #&& isa(stmt.args[3], Number)
1398+
arr = stmt.args[2]
1399+
# dim = stmt.args[3]
1400+
# typ = types(compact)[arr]
1401+
1402+
# if isa(typ, Core.Const)
1403+
# typ = typ.val
1404+
# end
1405+
1406+
# NEW: since exceptions no longer escape arrays, we can just assume no escape
1407+
1408+
if arr.id in relevant
1409+
(haskey(uses, arr.id)) || (uses[arr.id] = Int[])
1410+
push!(uses[arr.id], idx)
1411+
end
1412+
1413+
# # make sure this call isn't going to throw
1414+
# if isa(typ, Type) && typ <: AbstractArray && dim >= 1
1415+
# # don't escape the array, but mark usage for dom analysis
1416+
# if arr.id in relevant
1417+
# (haskey(uses, arr.id)) || (uses[arr.id] = Int[])
1418+
# push!(uses[arr.id], idx)
1419+
# end
1420+
1421+
# else # if this call throws or we can't tell, assume all uses escape
1422+
# for ur in userefs(stmt)
1423+
# mark_escape(ur[])
1424+
# end
1425+
# end
1426+
13001427
elseif is_known_call(stmt, Core.arrayfreeze, compact) && isa(stmt.args[2], SSAValue)
1428+
# mark these for potential replacement with mutating_arrayfreeze
13011429
push!(revisit, idx)
1430+
13021431
else
1303-
# For now we assume everything escapes
1304-
# TODO: We could handle PhiNodes specially and improve this
1432+
# Assume everything else escapes
13051433
for ur in userefs(stmt)
1306-
mark_val(ur[])
1434+
mark_escape(ur[])
13071435
end
13081436
end
13091437
end
1438+
13101439
ir = finish(compact)
13111440
isempty(revisit) && return ir
1441+
13121442
domtree = construct_domtree(ir.cfg.blocks)
1443+
13131444
for idx in revisit
13141445
# Make sure that the value we reference didn't escape
1315-
id = ir.stmts[idx][:inst].args[2].id
1446+
stmt = ir.stmts[idx][:inst]::Expr
1447+
id = (stmt.args[2]::SSAValue).id
1448+
# print("Relevant: ")
1449+
# for id in relevant
1450+
# print(id, " ")
1451+
# end
1452+
# println(" ")
1453+
# print("Revisit: ")
1454+
# Main.Base.show(revisit)
1455+
# println()
13161456
(id in relevant) || continue
13171457

1458+
#println("Revisiting ", stmt)
1459+
13181460
# We're ok to steal the memory if we don't dominate any uses
13191461
ok = true
1320-
for use in uses[id]
1321-
if ssadominates(ir, domtree, idx, use)
1322-
ok = false
1323-
break
1462+
if haskey(uses, id)
1463+
for use in uses[id]
1464+
if ssadominates(ir, domtree, idx, use)
1465+
ok = false
1466+
break
1467+
end
13241468
end
13251469
end
13261470
ok || continue
1327-
1328-
ir.stmts[idx][:inst].args[1] = Core.mutating_arrayfreeze
1471+
#println("Optimization of ", stmt)
1472+
stmt.args[1] = Core.mutating_arrayfreeze
13291473
end
13301474
return ir
13311475
end

base/pointer.jl

+1
Original file line numberDiff line numberDiff line change
@@ -63,6 +63,7 @@ cconvert(::Type{Ptr{UInt8}}, s::AbstractString) = String(s)
6363
cconvert(::Type{Ptr{Int8}}, s::AbstractString) = String(s)
6464

6565
unsafe_convert(::Type{Ptr{T}}, a::Array{T}) where {T} = ccall(:jl_array_ptr, Ptr{T}, (Any,), a)
66+
unsafe_convert(::Type{Ptr{T}}, a::Core.ImmutableArray{T}) where {T} = ccall(:jl_array_ptr, Ptr{T}, (Any,), a)
6667
unsafe_convert(::Type{Ptr{S}}, a::AbstractArray{T}) where {S,T} = convert(Ptr{S}, unsafe_convert(Ptr{T}, a))
6768
unsafe_convert(::Type{Ptr{T}}, a::AbstractArray{T}) where {T} = error("conversion to pointer not defined for $(typeof(a))")
6869

0 commit comments

Comments
 (0)