Improper function nesting causes boxing/runtime dispatch?

bremez · May 15, 2024, 4:19pm

Note the code example below:

# Field-less marker type whose type parameter `N` carries an integer, so that
# methods can dispatch on it (e.g. `::Radix{2}`).
struct Radix{N}
    # Lift the runtime value `n` into the type domain: `Radix(5)` yields a `Radix{5}`.
    function Radix(n::Integer)
        return new{n}()
    end
end

# Nesting: testfunc! -> _add, _add_positions
# (`_add` and `_add_positions` are siblings, both defined directly inside `testfunc!`.)
#
# Performs `num` random updates on `array`: each iteration draws two random indices
# `a` and `b` and overwrites `array[b]` with `_add(array[a], array[b], radix)`.
# `radix` is matched against `Radix{...}` by the `_add` methods.
# Returns `nothing` (the value of the trailing `for` loop).
#
# NOTE(review): the benchmark in this post reports allocations for this variant only;
# the author attributes them to `_add` being boxed - confirm with the Performance Tips
# section on captured variables.
function testfunc!(array, num, radix)
    
    # Radix-2 special case: combine the two values with bitwise XOR.
    _add(a, b, ::Radix{2}) = a ⊻ b
    # General case: the type parameter (which has the same name as the enclosing
    # `radix` argument) is used as the modulus.
    _add(a, b, ::Radix{radix}) where radix = mod(a+b, radix)
    
    # Closure: `_add` and `radix` are not parameters here, they come from the
    # enclosing `testfunc!` scope.
    function _add_positions(array, a, b) 
        array[b] =  _add(array[a], array[b], radix)
    end
    
    for _ in 1:num
        # Two independently drawn indices into `array` (they may coincide).
        a,b = rand(1:length(array)), rand(1:length(array))
        _add_positions(array, a, b)
    end
end

# Nesting: testfunc2! -> _add_positions -> _add
# (`_add` is defined inside `_add_positions`, which is defined inside `testfunc2!`.)
#
# Performs `num` random updates on `array`: each iteration draws two random indices
# `a` and `b` and overwrites `array[b]` with `_add(array[a], array[b], radix)`.
# Returns `nothing` (the value of the trailing `for` loop).
#
# NOTE(review): the benchmark in this post reports zero allocations for this variant.
function testfunc2!(array, num, radix)
    
    # Closure: only `radix` comes from the enclosing `testfunc2!` scope;
    # `_add` is local to this function.
    function _add_positions(array, a, b) 
        # Radix-2 special case: combine the two values with bitwise XOR.
        _add(a, b, ::Radix{2}) = a ⊻ b
        # General case: the type parameter (which has the same name as the outer
        # `radix` argument) is used as the modulus.
        _add(a, b, ::Radix{radix}) where radix = mod(a+b, radix)
        array[b] =  _add(array[a], array[b], radix)
    end
    
    for _ in 1:num
        # Two independently drawn indices into `array` (they may coincide).
        a,b = rand(1:length(array)), rand(1:length(array))
        _add_positions(array, a, b)
    end
end

# Nesting: testfunc3! -> _add, _add_positions
# (Same sibling layout as `testfunc!`, but `_add` has a single method.)
#
# Performs `num` random updates on `array`: each iteration draws two random indices
# `a` and `b` and overwrites `array[b]` with `_add(array[a], array[b], radix)`.
# With the XOR method disabled, every `Radix{N}` goes through the `mod` method.
# Returns `nothing` (the value of the trailing `for` loop).
#
# NOTE(review): the benchmark in this post reports zero allocations for this variant.
function testfunc3!(array, num, radix)
    
    #_add(a, b, ::Radix{2}) = a ⊻ b # Commented out - so no dispatch ambiguity
    # Sole method: the type parameter (which has the same name as the enclosing
    # `radix` argument) is used as the modulus.
    _add(a, b, ::Radix{radix}) where radix = mod(a+b, radix)
    
    # Closure: `_add` and `radix` are not parameters here, they come from the
    # enclosing `testfunc3!` scope.
    function _add_positions(array, a, b) 
        array[b] =  _add(array[a], array[b], radix)
    end
    
    for _ in 1:num
        # Two independently drawn indices into `array` (they may coincide).
        a,b = rand(1:length(array)), rand(1:length(array))
        _add_positions(array, a, b)
    end
end

which benchmarks as follows:

# `@btime` is provided by BenchmarkTools.jl (`using BenchmarkTools`).
# NOTE(review): `arr` is a non-constant global and is not `$`-interpolated into the
# benchmark expressions; the timings below were taken with the calls exactly as written.
# All three calls mutate the same `arr`, so each run starts from the previous contents.
arr = rand(0:1, 1024);
@btime testfunc!(arr, 1000, Radix(5))
@btime testfunc2!(arr, 1000, Radix(5))
@btime testfunc3!(arr, 1000, Radix(5))

# Reported output (presumably in call order: testfunc!, testfunc2!, testfunc3!):
#  117.200 μs (439 allocations: 6.86 KiB)
#  13.300 μs (0 allocations: 0 bytes)
#  17.200 μs (0 allocations: 0 bytes)

Note specifically the extra allocations in testfunc!. A @code_warntype check of testfunc! shows that _add itself gets boxed. Why does this happen, and why does it not happen in testfunc2! (where _add_positions can still receive the value of radix without boxing)? Once only a single definition of _add exists (see testfunc3!), the problem is resolved.

Oscar_Smith · May 15, 2024, 7:36pm

See Performance Tips · The Julia Language

bremez · May 16, 2024, 2:16am

@Oscar_Smith So, if I understand correctly, in the first implementation ‘_add’ is implicitly passed as an argument to a lifted version of ‘_add_positions’? Then, since its type is ‘Function’, ‘_add_positions’ doesn’t specialize on it, and because it is passed implicitly, I cannot add the explicit specialization annotation the manual suggests?

The documentation mentions that this problem won’t show up with ‘@code_warntype’ - which is exactly what stumped my search for where these allocations were coming from! (I had guessed that they arose from the capturing of ‘radix’.)

nsajko · May 17, 2024, 7:00am

I think @Oscar_Smith just linked the wrong section of the Performance Tips. This should be the right one.

Topic		Replies	Views
Why does runtime dispatch allocate when the return type is inferred? Internals & Design memory-allocation , runtime-dispatch	5	232	May 17, 2025
Elimination of (unnecessary) runtime dispatch allocations Internals & Design box , allocations , runtime-dispatch	13	1134	May 5, 2024
Function inside struct allocates when referenced New to Julia function	25	1044	November 7, 2023
How slow is runtime dispatch, anyway? Benchmark attempts Performance	8	333	January 15, 2025
Strange allocations with default positional argument and static arrays Performance	6	624	July 7, 2019

Improper function nesting causes boxing/runtime dispatch?

Related topics