diff --git a/script/get-ml-model-gptj/customize.py b/script/get-ml-model-gptj/customize.py index b9c640faf..cb15d7ce1 100644 --- a/script/get-ml-model-gptj/customize.py +++ b/script/get-ml-model-gptj/customize.py @@ -40,6 +40,11 @@ def preprocess(i): env['MLC_CUDA_DEVICE_PROP_GPU_COMPUTE_CAPABILITY']) * 10) env['MLC_GPU_ARCH'] = gpu_arch + env['DOCKER_RUN_ARGS'] = f" -v {env['MLC_NVIDIA_MLPERF_SCRATCH_PATH']}:/mnt" + + if is_true(env.get('MLC_DOCKER_USE_GOOGLE_DNS', '')): + env['DOCKER_RUN_ARGS'] += ' --dns 8.8.8.8 --dns 8.8.4.4 ' + env['MLC_TMP_REQUIRE_DOWNLOAD'] = 'no' else: diff --git a/script/get-ml-model-gptj/run-nvidia.sh b/script/get-ml-model-gptj/run-nvidia.sh index a81d52f7c..458580490 100644 --- a/script/get-ml-model-gptj/run-nvidia.sh +++ b/script/get-ml-model-gptj/run-nvidia.sh @@ -13,7 +13,8 @@ make -C docker build test $? -eq 0 || exit $? export RUN_CMD="bash -c 'python3 scripts/build_wheel.py -a=${MLC_GPU_ARCH} --clean --install --trt_root /usr/local/tensorrt/ && python examples/quantization/quantize.py --dtype=float16 --output_dir=/mnt/models/GPTJ-6B/fp8-quantized-ammo/GPTJ-FP8-quantized --model_dir=/mnt/models/GPTJ-6B/checkpoint-final --qformat=fp8 --kv_cache_dtype=fp8 '" -export DOCKER_RUN_ARGS=" -v ${MLC_NVIDIA_MLPERF_SCRATCH_PATH}:/mnt" + + make -C docker run LOCAL_USER=1 test $? -eq 0 || exit $? diff --git a/script/kill-process/customize.py b/script/kill-process/customize.py index 0c39a62eb..0ee68220d 100644 --- a/script/kill-process/customize.py +++ b/script/kill-process/customize.py @@ -18,6 +18,9 @@ def generate_kill_command(env): # all in that group kill_cmd = f"pkill -g $(pgrep -o {process_name} | xargs ps -o pgid= -p | tr -d ' ')" + elif is_true(env.get("MLC_KILL_BUSIEST_PROCESS_GROUP")): + kill_cmd = r"busy_pgid=\$(ps -eo pgid,pcpu --sort=-pcpu | head -n 2 | tail -n 1 | awk '{print $1}') && kill -- -\$busy_pgid" + else: if env.get("MLC_KILL_PROCESS_ID"): process_id = env["MLC_KILL_PROCESS_ID"] diff --git a/script/kill-process/meta.yaml b/script/kill-process/meta.yaml index 3c0335c27..fda7b82b1 100644 --- a/script/kill-process/meta.yaml +++ b/script/kill-process/meta.yaml @@ -18,5 +18,6 @@ input_mapping: group: MLC_KILL_PROCESS_GROUP pid: MLC_KILL_PROCESS_ID pname: MLC_KILL_PROCESS_NAME + busy_group: MLC_KILL_BUSIEST_PROCESS_GROUP