Skip to content

Commit 890c932

Browse files
authored
Merge pull request #438 from JuliaGPU/tb/bump
Bump toolchain.
2 parents f36b813 + 72bfd4e commit 890c932

File tree

4 files changed

+12
-3
lines changed

4 files changed

+12
-3
lines changed

Project.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -34,7 +34,7 @@ GPUArrays = "10"
34 34
GPUCompiler = "0.23, 0.24, 0.25, 0.26"
35 35
KernelAbstractions = "0.9.1"
36 36
LLVM = "6"
37-
NEO_jll = "=24.09.28717"
37+
NEO_jll = "=24.13.29138"
38 38
Preferences = "1"
39 39
SPIRV_LLVM_Translator_unified_jll = "0.4"
40 40
SpecialFunctions = "1.3, 2"

lib/level-zero/module.jl

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -237,7 +237,10 @@ function properties(kernel::ZeKernel)
237 237
preferred_group_size_props_ref = Ref(ze_kernel_preferred_group_size_properties_t())
238 238
link_extensions(props_ref, preferred_group_size_props_ref)
239 239
if haskey(oneL0.extension_properties(kernel.mod.context.driver),
240-
"ZE_extension_kernel_max_group_size_properties")
240+
"ZE_extension_kernel_max_group_size_properties") ||
241+
(!validation_layer[] && # intel/compute-runtime#733
242+
properties(kernel.mod.device).vendorId == 0x8086 &&
243+
properties(kernel.mod.context.driver).driverVersion >= v"1.3.29138")
241 244
# TODO: memoize
242 245
max_group_size_props_ref = Ref(ze_kernel_max_group_size_properties_ext_t())
243 246
link_extensions(preferred_group_size_props_ref, max_group_size_props_ref)

lib/level-zero/oneL0.jl

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -101,6 +101,9 @@ include("residency.jl")
101 101

102 102
const functional = Ref{Bool}(false)
103 103

104+
const validation_layer = Ref{Bool}()
105+
const parameter_validation = Ref{Bool}()
106+
104 107
function __init__()
105 108
precompiling = ccall(:jl_generating_output, Cint, ()) != 0
106 109
precompiling && return
@@ -132,6 +135,9 @@ function __init__()
132 135
functional[] = false
133 136
return
134 137
end
138+
139+
validation_layer[] = parse(Bool, get(ENV, "ZE_ENABLE_VALIDATION_LAYER", "false"))
140+
parameter_validation[] = parse(Bool, get(ENV, "ZE_ENABLE_PARAMETER_VALIDATION", "false"))
135 141
end
136 142

137 143
end

src/compiler/execution.jl

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -167,11 +167,11 @@ function launch_configuration(kernel::HostKernel{F,TT}) where {F,TT}
167 167
# configurations, so roll our own version that behaves like CUDA's
168 168
# occupancy API and assumes the kernel still does bounds checking.
169 169

170-
# once the MAX_GROUP_SIZE extension is implemented, we can use it here
171 170
kernel_props = oneL0.properties(kernel.fun)
172 171
group_size = if kernel_props.maxGroupSize !== missing
173 172
kernel_props.maxGroupSize
174 173
else
174+
# without the MAX_GROUP_SIZE extension, we need to be conservative
175 175
dev = kernel.fun.mod.device
176 176
compute_props = oneL0.compute_properties(dev)
177 177
max_size = compute_props.maxTotalGroupSize

0 commit comments

Comments
 (0)