Skip to content

Commit

Permalink
Merge pull request #403 from JuliaGPU/tb/latency
Browse files Browse the repository at this point in the history
Latency improvements
  • Loading branch information
maleadt authored Sep 1, 2020
2 parents 56699b2 + e095498 commit fa7438b
Show file tree
Hide file tree
Showing 3 changed files with 15 additions and 1 deletion.
4 changes: 3 additions & 1 deletion Manifest.toml
Original file line number Diff line number Diff line change
Expand Up @@ -65,7 +65,9 @@ version = "5.1.0"

[[GPUCompiler]]
deps = ["DataStructures", "InteractiveUtils", "LLVM", "Libdl", "TimerOutputs", "UUIDs"]
git-tree-sha1 = "c24978f4722e39510d2225db8823be74db4f7ecb"
git-tree-sha1 = "3d8cec72696d81556689e4dd131d4b714abbb47c"
repo-rev = "177bff3"
repo-url = "https://github.com/JuliaGPU/GPUCompiler.jl.git"
uuid = "61eb1bfa-7361-4325-ad38-22787b887f55"
version = "0.7.1"

Expand Down
3 changes: 3 additions & 0 deletions src/CUDA.jl
Original file line number Diff line number Diff line change
Expand Up @@ -90,4 +90,7 @@ export NVML, has_nvml

include("deprecated.jl")

include("precompile.jl")
_precompile_()

end
9 changes: 9 additions & 0 deletions src/precompile.jl
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
"""
    _precompile_()

Emit `precompile` directives for a fixed list of method signatures that are hit on the
first kernel launch, so that their compiled code can be cached with the package.

Does nothing (and returns `nothing`) unless Julia is currently generating output, as
reported by the runtime's `jl_generating_output`.

# Throws
- `AssertionError` if any directive fails, i.e. `precompile` returns `false` for a
  signature (typically because the signature has gone stale).
"""
function _precompile_()
    # Directives are only useful while an output image is being written; skip otherwise.
    ccall(:jl_generating_output, Cint, ()) == 1 || return nothing

    signatures = (
        Tuple{CUDA.HostKernel{identity, Tuple{Nothing}},Nothing},
        Tuple{Type{CuModule},String,Dict{CUDA.CUjit_option_enum, Any}},
        Tuple{typeof(CUDA.prepare_cuda_call)},
        Tuple{
            typeof(GPUCompiler.load_runtime),
            GPUCompiler.CompilerJob{GPUCompiler.PTXCompilerTarget, CUDA.CUDACompilerParams},
            LLVM.Context,
        },
        Tuple{typeof(cufunction),typeof(identity),Type{Tuple{Nothing}}},
        # Body of the generated function behind `pack_arguments`; reached through the
        # method's generator because it has no ordinary callable name.
        Tuple{typeof(which(CUDA.pack_arguments,(Function,Vararg{Any, N} where N,)).generator.gen),Any,Any,Any},
    )

    for sig in signatures
        # Call `precompile` outside of `@assert`: an assert may be compiled out, and its
        # condition must not carry side effects the program relies on. The explicit
        # throw keeps the fail-fast behaviour when a signature no longer matches.
        precompile(sig) || throw(AssertionError("precompile($sig)"))
    end
    return nothing
end

0 comments on commit fa7438b

Please sign in to comment.