Julia can call any function in a shared C library. This requires the library to be built with the -shared and -fPIC flags. The library has to either be in the current working directory or on the system PATH (or, more precisely, on the dynamic linker's search path, which depends on your OS).
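If you want to check up front whether (and where) a library can be found, the Libdl standard library provides a few helpers. A minimal sketch, using a hypothetical library name mylib and symbol myfunc:
using Libdl
# search the given directories first, then the system paths; returns "" if
# no loadable library was found (file names and extensions are OS-dependent)
lib = Libdl.find_library(["mylib"], [pwd()])
handle = Libdl.dlopen(lib)      # load it explicitly (throws if it can't be loaded)
Libdl.dlsym(handle, :myfunc)    # look up a symbol; returns a raw Ptr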
For example, the standard C library libc provides the clock function. Note: the colon is needed in :clock to prevent Julia from trying to evaluate clock as a Julia binding (and subsequently failing because no such function is defined). The colon makes it a symbol:
typeof(:clock)
Symbol
We call the clock function using ccall:
ccall((:clock, "libc"), Int32, ())
12204446
This calls the clock function in libc, expecting an Int32 return type and passing zero arguments (hence the empty argument-type tuple as the last argument). We could wrap this into a function:
f() = ccall((:clock, "libc"), Int32, ())
f (generic function with 1 method)
f()
12896611
Its LLVM intermediate representation and the assembly code show us what's going on:
@code_llvm(f())
; @ In[3]:1 within `f` define i32 @julia_f_1439() #0 { top: %0 = call i32 inttoptr (i64 140703431076467 to i32 ()*)() ret i32 %0 }
@code_native(f())
.section __TEXT,__text,regular,pure_instructions .build_version macos, 12, 0 .globl _julia_f_1481 ## -- Begin function julia_f_1481 .p2align 4, 0x90 _julia_f_1481: ## @julia_f_1481 ; ┌ @ In[3]:1 within `f` .cfi_startproc ## %bb.0: ## %top subq $8, %rsp .cfi_def_cfa_offset 16 movabsq $140703431076467, %rax ## imm = 0x7FF812072A73 callq *%rax popq %rcx retq .cfi_endproc ; └ ## -- End function .subsections_via_symbols
Here we see that we are calling the function at the address of clock (the dynamic linker handles all of this) and returning the result.
More complex data types, such as strings, might not exist in Julia. In the case of strings, Julia provides a Cstring data type, which is binary-compatible with C. Here we also see what happens when we want to pass a single input argument: the argument-type tuple (the second-to-last argument) needs to match the function being called, and the actual arguments are appended after it:
ret = ccall((:getenv, "libc"), Cstring, (Cstring,), "SHELL")
Cstring(0x00007ff7bafc14b9)
This can be converted back into a Julia string using unsafe_string:
unsafe_string(ret)
"/usr/local/bin/fish"
Note that if the function returns NULL (which maps to C_NULL in Julia-land):
ret = ccall((:getenv, "libc"), Cstring, (Cstring,), "asdf")
Cstring(0x0000000000000000)
... then unsafe_string
throws an error:
unsafe_string(ret)
ArgumentError: cannot convert NULL to string Stacktrace: [1] unsafe_string @ ./strings/string.jl:72 [inlined] [2] unsafe_string(s::Cstring) @ Base ./c.jl:193 [3] top-level scope @ In[10]:1 [4] eval @ ./boot.jl:368 [inlined] [5] include_string(mapexpr::typeof(REPL.softscope), mod::Module, code::String, filename::String) @ Base ./loading.jl:1428
This means that we need to guard our ccall whenever this can happen:
function getenv(var::AbstractString)
val = ccall((:getenv, "libc"),
Cstring, (Cstring,), var)
if val == C_NULL
error("getenv: undefined variable: ", var)
end
unsafe_string(val)
end
getenv (generic function with 1 method)
getenv("SHELL")
"/usr/local/bin/fish"
getenv("asdf")
getenv: undefined variable: asdf Stacktrace: [1] error(::String, ::String) @ Base ./error.jl:44 [2] getenv(var::String) @ Main ./In[11]:5 [3] top-level scope @ In[13]:1 [4] eval @ ./boot.jl:368 [inlined] [5] include_string(mapexpr::typeof(REPL.softscope), mod::Module, code::String, filename::String) @ Base ./loading.jl:1428
Let's look at the "Hello World" of shared library: adding 1 to an integer. This is accomplished by the asdf_int
function in asdf.c
. After compiling in place with gcc -shared -fPIC -o asdf_lib.dylib asdf.c
we can call it:
ccall((:asdf_int, "asdf_lib"), Int32, (Int32,), -1)
0
Note that in the example above, I had to use the .dylib
extension because I'm using a mac: https://stackoverflow.com/questions/2339679/what-are-the-differences-between-so-and-dylib-on-osx
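asdf.c itself is not listed here; a minimal version consistent with the description above (add 1 to a 32-bit integer and return it) might look as follows, written as a Julia string in the same style used for the C snippets later in this section:
# hypothetical reconstruction of asdf.c -- the real file is not shown here
asdf_code = """
int asdf_int(int x) {
    return x + 1;
}
"""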
But this example is rather boring. What about sending arrays? Consider the sum function sum(a)
, which computes
$$
\mathrm{sum}(a) = \sum_{i=1}^n a_i,
$$
where $n$ is the length of a
.
a = rand(10^7) # 1D vector of random numbers, uniform on [0,1)
10000000-element Vector{Float64}: 0.8613616678836064 0.6788806822948108 0.47735441120249267 0.9872453487938009 0.0939569660165096 0.9975542610320133 0.9359560690972771 0.13179595010979905 0.3870351677953733 0.30137106295064764 0.0827855699267499 0.05531853697162825 0.9348339001953763 ⋮ 0.7703630608529817 0.785851212129005 0.9956362623582224 0.4591075308839966 0.8398996934654701 0.9995945836053647 0.12824102300712326 0.9404965731289516 0.6715917272434537 0.0025913133378624442 0.5697798774608598 0.9956946163870105
sum(a)
4.998520918420762e6
Let's do this in C (I'm a bit lazy ... so I'll define the C code here rather than in its own file). Note that the Julia function tempname returns a path to a temporary file (where exactly depends on your OS). We can pipe our C code into gcc and write the output into our temporary library; that's what
open(`gcc -fPIC -O3 -msse3 -xc -shared -o $(Clib * "." * Libdl.dlext) -`, "w") do f
    print(f, C_code)
end
does. Note also that we're optimising the code, and that we build the output filename with the platform's dynamic-library extension, Libdl.dlext. As a final note: in Julia, string concatenation is done with the multiplication operator *(::AbstractString, ::AbstractString).
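For instance (a small illustration of those last two points; the values shown are what I'd expect on macOS and will differ per OS):
using Libdl
Libdl.dlext                   # the platform's shared-library extension, e.g. "dylib" on macOS or "so" on Linux
tempname()                    # a fresh temporary path, e.g. "/var/folders/.../jl_ABC123"
"mylib" * "." * Libdl.dlext   # string concatenation with *, giving e.g. "mylib.dylib"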
C_code = """
#include <stddef.h>
double c_sum(size_t n, double *X) {
double s = 0.0;
for (size_t i = 0; i < n; ++i) {
s += X[i];
}
return s;
}
"""
const Clib = tempname() # make a temporary file
# compile to a shared library by piping C_code to gcc
# (works only if you have gcc installed):
open(`gcc -fPIC -O3 -msse3 -xc -shared -o $(Clib * "." * Libdl.dlext) -`, "w") do f
print(f, C_code)
end
# define a Julia function that calls the C function:
c_sum(X::Array{Float64}) = ccall(
("c_sum", Clib), Float64,
(Csize_t, Ptr{Float64}), length(X), X
)
c_sum (generic function with 1 method)
Note above the inline function c_sum
which acts as a wrapper for ccall
:
ccall(
("c_sum", Clib), Float64,
(Csize_t, Ptr{Float64}), length(X), X
)
Here we do several things:
- the c_sum function is defined in the temporary library, whose path is stored in Clib
- length returns an integer giving the 1D size of the array X; this integer is mapped to the C size type size_t (which is labelled Csize_t in Julia)
- the array X itself is passed as a pointer to its data, Ptr{Float64}

@code_llvm(c_sum(a))
; @ In[18]:23 within `c_sum` define double @julia_c_sum_2217({}* nonnull align 16 dereferenceable(40) %0) #0 { top: ; ┌ @ array.jl:215 within `length` %1 = bitcast {}* %0 to { i8*, i64, i16, i16, i32 }* %2 = getelementptr inbounds { i8*, i64, i16, i16, i32 }, { i8*, i64, i16, i16, i32 }* %1, i64 0, i32 1 %3 = load i64, i64* %2, align 8 ; └ ; ┌ @ pointer.jl:65 within `unsafe_convert` %4 = bitcast {}* %0 to i8** %5 = load i8*, i8** %4, align 8 %6 = ptrtoint i8* %5 to i64 ; └ %7 = call double inttoptr (i64 4382146336 to double (i64, i64)*)(i64 %3, i64 %6) ret double %7 }
@code_native(c_sum(a))
.section __TEXT,__text,regular,pure_instructions .build_version macos, 12, 0 .globl _julia_c_sum_2220 ## -- Begin function julia_c_sum_2220 .p2align 4, 0x90 _julia_c_sum_2220: ## @julia_c_sum_2220 ; ┌ @ In[18]:23 within `c_sum` .cfi_startproc ## %bb.0: ## %top subq $8, %rsp .cfi_def_cfa_offset 16 ; │┌ @ pointer.jl:65 within `unsafe_convert` movq (%rdi), %rsi ; │└ ; │┌ @ array.jl:215 within `length` movq 8(%rdi), %rdi movabsq $4382146336, %rax ## imm = 0x105323F20 ; │└ callq *%rax popq %rax retq .cfi_endproc ; └ ## -- End function .subsections_via_symbols
Let's compare the result with Julia's internal sum
function:
c_sum(a) ≈ sum(a) # type \approx and then <TAB> to get the ≈ symbol
true
Let's look at some benchmarks comparing c_sum
with Julia's inbuilt sum
:
using BenchmarkTools

c_bench = @benchmark c_sum(a)
BenchmarkTools.Trial: 312 samples with 1 evaluation. Range (min … max): 15.628 ms … 19.708 ms ┊ GC (min … max): 0.00% … 0.00% Time (median): 15.808 ms ┊ GC (median): 0.00% Time (mean ± σ): 16.053 ms ± 649.531 μs ┊ GC (mean ± σ): 0.00% ± 0.00% ▃▇█▆▅▄▃ ▂ ███████▇█▇▆█▁▇▄▆▆▄▄▆█▆▄▄▆▁▇▄▁▄▁▆▄▄▄▄▁▄▁▁▁▄▄▄▁▄▄▄▁▁▄▄▁▁▄▁▁▄▄▄ ▇ 15.6 ms Histogram: log(frequency) by time 18.7 ms < Memory estimate: 48 bytes, allocs estimate: 1.
j_bench = @benchmark sum(a)
BenchmarkTools.Trial: 974 samples with 1 evaluation. Range (min … max): 4.411 ms … 10.278 ms ┊ GC (min … max): 0.00% … 0.00% Time (median): 4.885 ms ┊ GC (median): 0.00% Time (mean ± σ): 5.122 ms ± 748.226 μs ┊ GC (mean ± σ): 0.00% ± 0.00% ▅█▅▆▂▅▂▄▁▁ ▆██████████▇█▅▆▆▅▄▄▄▅▃▄▄▃▃▃▃▃▃▃▃▂▃▃▂▂▃▃▂▁▂▃▃▂▂▂▂▂▂▂▂▂▂▁▂▂▁▂ ▄ 4.41 ms Histogram: frequency by time 7.81 ms < Memory estimate: 16 bytes, allocs estimate: 1.
Oh boy... it seems that C is slower than Julia?! Well, not quite, as we'll see later. The reason the c_sum function is a bit slower than Julia's internal sum is most likely that c_sum relies on dynamically linked code: when a compiler optimizes, it needs to know specifics about how the code is implemented, and a call into a shared library is opaque to it. Furthermore, the ccall itself has a little overhead due to type interoperability.
This is not a Julia-specific overhead... any dynamically linked library call would experience it (so don't go blaming Julia). In the future, inlining may be supported:
https://docs.julialang.org/en/stable/manual/calling-c-and-fortran-code/index.html
Let's implement the sum_f function, which evaluates a Julia function $f$ as it goes:
$$
\mathrm{sum\_f}(a) = \sum_{i=1}^n f(a_i),
$$
where $n$ is the length of a and $f$ is a function defined in Julia.
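As a point of reference (a sketch; the benchmarks below use a broadcast-based version, j_sqrt_sum), a direct Julia implementation would be:
# straightforward Julia version of sum_f: apply f to each element and accumulate
function sum_f(f, a)
    s = 0.0
    for x in a
        s += f(x)
    end
    return s
end
# e.g. sum_f(sqrt, a)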
In order to pass a function pointer correctly, we need to make sure that the Julia function takes and returns C-compatible data types. This is shown in the following example:
function j_sqrt(x::Cdouble)
convert(Cdouble, sqrt(x))::Cdouble
end
j_sqrt (generic function with 1 method)
... which works just like a real square root:
j_sqrt(2.) ≈ √2.
true
... but it also does a little work converting the output of Julia's inbuilt sqrt function to a Cdouble. In order to pass a Julia function to C, it needs to be converted into a function pointer. This has the Julia data type Ptr{Cvoid} (printed as Ptr{Nothing}), but don't worry: when we define our C function, we declare the function pointer's signature with the right types.
const j_sqrt_c = @cfunction(j_sqrt, Cdouble, (Cdouble,))
Ptr{Nothing} @0x000000010793d360
Now we can pass a function pointer to our C function by modifying our c_sum
function call signature:
double c_sqrt_sum(double (* j_sqrt)(double), size_t n, double *X)
where the first argument is a function pointer to a function with call signature double j_sqrt(double). Note that the function on the "other end" of a function pointer is called using the usual j_sqrt(x) call syntax.
C_sqrt_code = """
#include <stddef.h>
double c_sqrt_sum(double (* j_sqrt)(double), size_t n, double *X) {
double s = 0.0;
for (size_t i = 0; i < n; ++i) {
s += j_sqrt(X[i]);
}
return s;
}
"""
const Clib_sqrt = tempname() # make a temporary file
# compile to a shared library by piping C_code to gcc
# (works only if you have gcc installed):
open(`gcc -fPIC -O3 -msse3 -xc -shared -o $(Clib_sqrt * "." * Libdl.dlext) -`, "w") do f
print(f, C_sqrt_code)
end
# define a Julia function that calls the C function:
c_sqrt_sum(X::Array{Float64}) = ccall(
("c_sqrt_sum", Clib_sqrt),
Float64,
(Ptr{Nothing}, Csize_t, Ptr{Float64}),
j_sqrt_c, length(X), X
)
c_sqrt_sum (generic function with 1 method)
Note above that we also modified the call signature to include the function pointer (as well as passing the Julia function pointer j_sqrt_c
).
Let's compare the performance of our C function with a Julia-only implementation:
j_sqrt_sum(X::Array{Float64}) = sum( broadcast( sqrt, X ) )
j_sqrt_sum (generic function with 1 method)
c_sqrt_sum(a) ≈ j_sqrt_sum(a)
true
@benchmark(c_sqrt_sum($a))
BenchmarkTools.Trial: 64 samples with 1 evaluation. Range (min … max): 72.559 ms … 107.022 ms ┊ GC (min … max): 0.00% … 0.00% Time (median): 77.179 ms ┊ GC (median): 0.00% Time (mean ± σ): 78.712 ms ± 6.748 ms ┊ GC (mean ± σ): 0.00% ± 0.00% █ █ ▃▃ ▁▃▃ ▇█▆█▄▆▆██▄███▁▁▄▆▁▄▆▁▁▁▁▄▁▄▁▁▄▁▁▄▁▁▁▁▁▁▄▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▄ ▁ 72.6 ms Histogram: frequency by time 106 ms < Memory estimate: 0 bytes, allocs estimate: 0.
@benchmark(j_sqrt_sum($a))
BenchmarkTools.Trial: 117 samples with 1 evaluation. Range (min … max): 34.171 ms … 56.576 ms ┊ GC (min … max): 0.00% … 26.07% Time (median): 42.539 ms ┊ GC (median): 0.48% Time (mean ± σ): 42.940 ms ± 6.606 ms ┊ GC (mean ± σ): 13.98% ± 12.45% ▂▆ ▂▆▄█▂ ▂ ▂ ▂▂▄ ▂ ████████▆██▄▄▆▁▁▁▄▄▄▁▁▄█▁▁▁▁▁▄▄▆▆█▄███▆▆▆█▄█▆▁█▆▆▆▆▁▆▄▁▆▁▁▄ ▄ 34.2 ms Histogram: frequency by time 55.3 ms < Memory estimate: 76.29 MiB, allocs estimate: 2.
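(An aside, not part of the original comparison: the 76 MiB allocated above comes from broadcast materialising a temporary array before summing; a variant like the sketch below avoids that allocation, though it doesn't change the function-pointer story that follows.)
# allocation-free variant: sum can apply a function to each element directly
j_sqrt_sum_noalloc(X::Array{Float64}) = sum(sqrt, X)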
Hrm... so it seems that we're paying a price for constantly calling through a function pointer, rather than calling a pure C function. Let's verify our theory by implementing a purely C form of sum_f
(i.e. we're not going to be calling the Julia sqrt
function, and instead we'll use the one defined in math.h
).
Cc_sqrt_code = """
#include <stddef.h>
#include <math.h>
double cc_sqrt_sum(size_t n, double *X) {
double s = 0.0;
for (size_t i = 0; i < n; ++i) {
s += sqrt(X[i]);
}
return s;
}
"""
const Clib_c_sqrt = tempname() # make a temporary file
# compile to a shared library by piping C_code to gcc
# (works only if you have gcc installed):
open(`gcc -fPIC -O3 -msse3 -xc -shared -lm -o $(Clib_c_sqrt * "." * Libdl.dlext) -`, "w") do f
print(f, Cc_sqrt_code)
end
# define a Julia function that calls the C function:
cc_sqrt_sum(X::Array{Float64}) = ccall(
("cc_sqrt_sum", Clib_c_sqrt),
Float64,
(Csize_t, Ptr{Float64}),
length(X), X
)
cc_sqrt_sum (generic function with 1 method)
@benchmark(c_sqrt_sum($a))
BenchmarkTools.Trial: 67 samples with 1 evaluation. Range (min … max): 72.338 ms … 104.730 ms ┊ GC (min … max): 0.00% … 0.00% Time (median): 73.986 ms ┊ GC (median): 0.00% Time (mean ± σ): 75.805 ms ± 5.319 ms ┊ GC (mean ± σ): 0.00% ± 0.00% █▁ ██▆▅▇▅▇▄▅▇▄▁▁▁▃▁▁▃▁▃▄▁▃▃▃▁▄▁▁▁▁▁▁▁▁▁▁▁▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▃ ▁ 72.3 ms Histogram: frequency by time 95 ms < Memory estimate: 0 bytes, allocs estimate: 0.
@benchmark(cc_sqrt_sum($a))
BenchmarkTools.Trial: 202 samples with 1 evaluation. Range (min … max): 24.082 ms … 28.802 ms ┊ GC (min … max): 0.00% … 0.00% Time (median): 24.452 ms ┊ GC (median): 0.00% Time (mean ± σ): 24.770 ms ± 833.654 μs ┊ GC (mean ± σ): 0.00% ± 0.00% ▃▄▄█▄▂ ██████▇▇▄▅▃▄▄▃▅▃▃▁▃▅▄▃▁▃▄▃▃▃▃▄▁▃▃▃▁▁▁▁▁▃▁▁▁▁▁▁▁▃▁▁▁▁▃▁▁▁▁▁▁▃ ▃ 24.1 ms Histogram: frequency by time 28.6 ms < Memory estimate: 0 bytes, allocs estimate: 0.
Ha! Now we're getting a good speed-up. This shows that the performance penalty for Julia functions isn't bad (and, until we have inlining of C functions, there might not always be a speedup from going to C). Yet in some cases, simple compute kernels written entirely in C might improve performance.