@testset "broadcast" begin @test testf((x) -> fill!(x, 1), rand(3,3)) @test testf((x, y) -> map(+, x, y), rand(2, 3), rand(2, 3)) @test testf((x) -> sin.(x), rand(2, 3)) @test testf((x) -> log.(x) .+ 1, rand(2, 3)) @test testf((x) -> 2x, rand(2, 3)) @test testf((x) -> x .^ 0, rand(2, 3)) @test testf((x) -> x .^ 1, rand(2, 3)) @test testf((x) -> x .^ 2, rand(2, 3)) @test testf((x) -> x .^ 3, rand(2, 3)) @test testf((x) -> x .^ 5, rand(2, 3)) @test testf((x) -> (z = Int32(5); x .^ z), rand(2, 3)) @test testf((x) -> (z = Float64(π); x .^ z), rand(2, 3)) @test testf((x) -> (z = Float32(π); x .^ z), rand(Float32, 2, 3)) @test testf((x, y) -> x .+ y, rand(2, 3), rand(1, 3)) @test testf((z, x, y) -> z .= x .+ y, rand(2, 3), rand(2, 3), rand(2)) @test (CuArray{Ptr{Cvoid}}(undef, 1) .= C_NULL) == CuArray([C_NULL]) @test CuArray([1,2,3]) .+ CuArray([1.0,2.0,3.0]) == CuArray([2,4,6]) @eval struct Whatever{T} x::Int end @test Array(Whatever{Int}.(CuArray([1]))) == Whatever{Int}.([1]) end @testset "cufunc" begin gelu1(x) = oftype(x, 0.5) * x * (1 + tanh(oftype(x, √(2/π))*(x + oftype(x, 0.044715) * x^3))) sig(x) = one(x) / (one(x) + exp(-x)) f(x) = gelu1(log(x)) * sig(x) * tanh(x) g(x) = x^7 - 2 * x^f(x^2) + 3 CUDA.@cufunc gelu1(x) = oftype(x, 0.5) * x * (1 + tanh(oftype(x, √(2/π))*(x + oftype(x, 0.044715) * x^3))) CUDA.@cufunc sig(x) = one(x) / (one(x) + exp(-x)) CUDA.@cufunc f(x) = gelu1(log(x)) * sig(x) * tanh(x) CUDA.@cufunc g(x) = x^7 - 2 * x^f(x^2) + 3 @test :gelu1 ∈ CUDA.cufuncs() @test :sig ∈ CUDA.cufuncs() @test :f ∈ CUDA.cufuncs() @test :g ∈ CUDA.cufuncs() @test testf(x -> gelu1.(x), rand(3,3)) @test testf(x -> sig.(x), rand(3,3)) @test testf(x -> f.(x), rand(3,3)) @test testf(x -> g.(x), rand(3,3)) end # https://github.com/JuliaGPU/CUDA.jl/issues/223 @testset "Ref Broadcast" begin foobar(idx, A) = A[idx] @test CuArray([42]) == foobar.(CuArray([1]), Base.RefValue(CuArray([42]))) end @testset "Broadcast Fix" begin @test testf(x -> log.(x), rand(3,3)) @test testf((x,xs) -> log.(x.+xs), Ref(1), rand(3,3)) end