Skip to content

Commit b6d6636

Browse files
committed
Merge branch 'sycl' into review/yang/fix_msan_usm
2 parents 17ff6cc + db7aff1 commit b6d6636

File tree

4 files changed

+37
-8
lines changed

4 files changed

+37
-8
lines changed

scripts/benchmarks/output_html.py

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,8 @@
44
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
55

66
import re
7+
import os
8+
from pathlib import Path
79
import matplotlib.pyplot as plt
810
import mpld3
911
from collections import defaultdict
@@ -256,7 +258,9 @@ def generate_html(benchmark_runs: list[BenchmarkRun], github_repo: str, compare_
256258
suite_names = {t.suite for t in timeseries}
257259
suite_checkboxes_html = ' '.join(f'<label><input type="checkbox" class="suite-checkbox" data-suite="{suite}" checked> {suite}</label>' for suite in suite_names)
258260

259-
with open('benchmark_results.html.template', 'r') as file:
261+
script_path = os.path.dirname(os.path.realpath(__file__))
262+
results_template_path = Path(script_path, 'benchmark_results.html.template')
263+
with open(results_template_path, 'r') as file:
260264
html_template = file.read()
261265

262266
template = Template(html_template)

source/adapters/cuda/tensor_map.cpp

Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,24 @@
1313

1414
#include "context.hpp"
1515

16+
#if CUDA_VERSION < 12000
17+
// Fallback definition compiled only when CUDA_VERSION < 12000 (see the
// surrounding #if). Every parameter is left unnamed and is ignored; the call
// unconditionally returns UR_RESULT_ERROR_UNSUPPORTED_FEATURE.
// NOTE(review): presumably the CUtensorMap type used by the #else branch is
// not available in these older toolkits -- confirm against the CUDA headers.
UR_APIEXPORT ur_result_t UR_APICALL urTensorMapEncodeIm2ColExp(
18+
ur_device_handle_t, ur_exp_tensor_map_data_type_flags_t, uint32_t, void *,
19+
const uint64_t *, const uint64_t *, const int *, const int *, uint32_t,
20+
uint32_t, const uint32_t *, ur_exp_tensor_map_interleave_flags_t,
21+
ur_exp_tensor_map_swizzle_flags_t, ur_exp_tensor_map_l2_promotion_flags_t,
22+
ur_exp_tensor_map_oob_fill_flags_t, ur_exp_tensor_map_handle_t *) {
23+
return UR_RESULT_ERROR_UNSUPPORTED_FEATURE;
24+
}
25+
// Fallback definition compiled only when CUDA_VERSION < 12000 (see the
// surrounding #if). Every parameter is left unnamed and is ignored; the call
// unconditionally returns UR_RESULT_ERROR_UNSUPPORTED_FEATURE.
// A second definition of this entry point lives in the #else branch and is
// the one compiled for CUDA_VERSION >= 12000.
UR_APIEXPORT ur_result_t UR_APICALL urTensorMapEncodeTiledExp(
26+
ur_device_handle_t, ur_exp_tensor_map_data_type_flags_t, uint32_t, void *,
27+
const uint64_t *, const uint64_t *, const uint32_t *, const uint32_t *,
28+
ur_exp_tensor_map_interleave_flags_t, ur_exp_tensor_map_swizzle_flags_t,
29+
ur_exp_tensor_map_l2_promotion_flags_t, ur_exp_tensor_map_oob_fill_flags_t,
30+
ur_exp_tensor_map_handle_t *) {
31+
return UR_RESULT_ERROR_UNSUPPORTED_FEATURE;
32+
}
33+
#else
1634
// Handle type holding a single CUtensorMap value. It is declared in the #else
// branch of the CUDA_VERSION < 12000 check, so it is only compiled when
// CUDA_VERSION >= 12000.
struct ur_exp_tensor_map_handle_t_ {
1735
// The wrapped CUDA tensor map descriptor.
CUtensorMap Map;
1836
};
@@ -140,3 +158,4 @@ UR_APIEXPORT ur_result_t UR_APICALL urTensorMapEncodeTiledExp(
140158
}
141159
return UR_RESULT_SUCCESS;
142160
}
161+
#endif

source/adapters/level_zero/context.cpp

Lines changed: 11 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -533,6 +533,13 @@ ur_result_t ur_context_handle_t_::getFreeSlotInExistingOrNewPool(
533533
if (*ZePool == nullptr) {
534534
ze_event_pool_counter_based_exp_desc_t counterBasedExt = {
535535
ZE_STRUCTURE_TYPE_COUNTER_BASED_EVENT_POOL_EXP_DESC, nullptr, 0};
536+
537+
ze_intel_event_sync_mode_exp_desc_t eventSyncMode = {
538+
ZE_INTEL_STRUCTURE_TYPE_EVENT_SYNC_MODE_EXP_DESC, nullptr, 0};
539+
eventSyncMode.syncModeFlags =
540+
ZE_INTEL_EVENT_SYNC_MODE_EXP_FLAG_LOW_POWER_WAIT |
541+
ZE_INTEL_EVENT_SYNC_MODE_EXP_FLAG_SIGNAL_INTERRUPT;
542+
536543
ZeStruct<ze_event_pool_desc_t> ZeEventPoolDesc;
537544
ZeEventPoolDesc.count = MaxNumEventsPerPool;
538545
ZeEventPoolDesc.flags = 0;
@@ -552,14 +559,11 @@ ur_result_t ur_context_handle_t_::getFreeSlotInExistingOrNewPool(
552559
}
553560
logger::debug("ze_event_pool_desc_t counter based flags set to: {}",
554561
counterBasedExt.flags);
562+
if (InterruptBasedEventEnabled) {
563+
counterBasedExt.pNext = &eventSyncMode;
564+
}
555565
ZeEventPoolDesc.pNext = &counterBasedExt;
556-
}
557-
if (InterruptBasedEventEnabled) {
558-
ze_intel_event_sync_mode_exp_desc_t eventSyncMode = {
559-
ZE_INTEL_STRUCTURE_TYPE_EVENT_SYNC_MODE_EXP_DESC, nullptr, 0};
560-
eventSyncMode.syncModeFlags =
561-
ZE_INTEL_EVENT_SYNC_MODE_EXP_FLAG_LOW_POWER_WAIT |
562-
ZE_INTEL_EVENT_SYNC_MODE_EXP_FLAG_SIGNAL_INTERRUPT;
566+
} else if (InterruptBasedEventEnabled) {
563567
ZeEventPoolDesc.pNext = &eventSyncMode;
564568
}
565569

source/loader/layers/sanitizer/msan/msan_libdevice.hpp

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -52,6 +52,8 @@ struct MsanLaunchInfo {
5252
uint32_t IsRecover = 0;
5353

5454
MsanErrorReport Report;
55+
56+
uint8_t CleanShadow[128] = {};
5557
};
5658

5759
// Based on the observation, only the last 24 bits of the address of the private

0 commit comments

Comments
 (0)