toivoh · November 2, 2014 09:08 · toivoh · Nov 2, 2014 · Keno · Nov 2, 2014
diff --git a/TestSIMD2.jl b/TestSIMD2.jl
 module TestSIMD2

 # requires Julia 0.4 for llvmcall

 # Two Uint64 values; handed to llvmcall below as an LLVM `<2 x i64>`.
 typealias Uint64x2 NTuple{2, Uint64}

 # Xor two Uint64 pairs with a single LLVM vector `xor` instruction.
 # The IR text is given to llvmcall verbatim; %0 and %1 name the two operands.
 ($)(x::Uint64x2, y::Uint64x2) =
    Base.llvmcall("""%3 = xor <2 x i64> %1, %0
                     ret <2 x i64> %3""",
                  Uint64x2, (Uint64x2, Uint64x2), x, y)

 # Xor one pair of `src` elements into the matching pair of `dest` elements.
 #   dest, src          -- vectors sharing the element type T
 #   dest_ofs, src_ofs  -- pair offsets: offset k selects elements 2k+1 and 2k+2
 # Every indexing expression is wrapped in @inbounds, so the offsets are not
 # validated here; callers must keep both pairs inside their vectors.
 function innerloop!{T}(dest::Vector{T}, dest_ofs, src::Vector{T}, src_ofs)
    src_lo  = 1 + 2*src_ofs
    dest_lo = 1 + 2*dest_ofs
    @inbounds rhs = (src[src_lo], src[src_lo + 1])
    @inbounds lhs = (dest[dest_lo], dest[dest_lo + 1])
    @inbounds (dest[dest_lo], dest[dest_lo + 1]) = lhs $ rhs
 end

 # Show the native code generated for the Uint64 specialization.
 T = Uint64
 code_native(innerloop!,
             (Vector{T}, Int, Vector{T}, Int))

 end
	module TestSIMD2

	# requires Julia 0.4 for llvmcall

	# A pair of Uint64 values; llvmcall below treats it as an LLVM `<2 x i64>`.
	typealias Uint64x2 NTuple{2, Uint64}

	# Element-wise xor of two Uint64 pairs, written directly as LLVM IR.
	# The second line of the IR string is left at its original indentation so
	# the text handed to llvmcall stays exactly as it was.
	($)(x::Uint64x2, y::Uint64x2) =
	    Base.llvmcall("""%3 = xor <2 x i64> %1, %0
	ret <2 x i64> %3""",
	                  Uint64x2, (Uint64x2, Uint64x2), x, y)

	# Combine two consecutive elements of `src` into two consecutive elements of
	# `dest` using the pairwise `$` defined above.
	#   dest_ofs / src_ofs pick the pair: offset k addresses elements 2k+1, 2k+2.
	# All indexing is marked @inbounds, so the offsets are not validated here;
	# the caller is responsible for keeping them in range.
	function innerloop!{T}(dest::Vector{T}, dest_ofs, src::Vector{T}, src_ofs)
	    from = 1 + 2 * src_ofs
	    to = 1 + 2 * dest_ofs
	    @inbounds incoming = (src[from], src[from + 1])
	    @inbounds current = (dest[to], dest[to + 1])
	    @inbounds (dest[to], dest[to + 1]) = current $ incoming
	end

	# Dump the machine code produced for Uint64 vectors with Int offsets.
	T = Uint64
	code_native(innerloop!,
	            (Vector{T}, Int, Vector{T}, Int))

	end