Skip to content

Commit 03d9201

Browse files
authored
Merge pull request #174 from GATEOverflow/dev
Bert is now edge only
2 parents 02683cf + 518325f commit 03d9201

File tree

2 files changed

+7
-5
lines changed

2 files changed

+7
-5
lines changed

.github/workflows/test-mlperf-inference-mixtral.yml

Lines changed: 1 addition & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,8 @@
1-
# This workflow will install Python dependencies, run tests and lint with a variety of Python versions
2-
# For more information see: https://help.github.com/actions/language-and-framework-guides/using-python-with-github-actions
3-
41
name: MLPerf inference MIXTRAL-8x7B
52

63
on:
74
schedule:
8-
- cron: "59 19 * * *" # 59th minute of the 19th hour, every day => 19:59 UTC => 01:29 IST (next day)
5+
- cron: "59 23 * * */5" # 59th minute of the 23rd hour on days-of-week 0 and 5 (Sunday, Friday) => 23:59 UTC => 05:29 IST (next day)
96

107
jobs:
118
build_reference:

.github/workflows/test-nvidia-mlperf-inference-implementations.yml

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -43,6 +43,11 @@ jobs:
4343
gpu_name=rtx_4090
4444
docker_string=" --docker"
4545
fi
46+
if [ "${{ matrix.model }}" = "bert-99" ] || [ "${{ matrix.model }}" = "bert-99.9" ]; then
47+
category="edge"
48+
else
49+
category="datacenter,edge"
50+
fi
4651
4752
if [ -f "gh_action/bin/deactivate" ]; then source gh_action/bin/deactivate; fi
4853
python3 -m venv gh_action
@@ -51,6 +56,6 @@ jobs:
5156
pip install --upgrade mlcflow
5257
mlc pull repo mlcommons@mlperf-automations --branch=dev
5358
54-
mlcr --tags=run-mlperf,inference,_all-scenarios,_submission,_full,_r5.0-dev --preprocess_submission=yes --pull_changes=yes --pull_inference_changes=yes --execution_mode=valid --gpu_name=$gpu_name --pull_changes=yes --pull_inference_changes=yes --model=${{ matrix.model }} --submitter="MLCommons" --hw_name=$hw_name --implementation=nvidia --backend=tensorrt --category=datacenter,edge --division=closed --docker_dt --docker_mlc_repo=mlcommons@mlperf-automations --docker_mlc_repo_branch=dev --adr.compiler.tags=gcc --device=cuda --use_model_from_host=yes --use_dataset_from_host=yes --results_dir=$HOME/gh_action_results --submission_dir=$HOME/gh_action_submissions --clean $docker_string --quiet
59+
mlcr --tags=run-mlperf,inference,_all-scenarios,_submission,_full,_r5.0-dev --preprocess_submission=yes --pull_changes=yes --pull_inference_changes=yes --execution_mode=valid --gpu_name=$gpu_name --pull_changes=yes --pull_inference_changes=yes --model=${{ matrix.model }} --submitter="MLCommons" --hw_name=$hw_name --implementation=nvidia --backend=tensorrt --category=$category --division=closed --docker_dt --docker_mlc_repo=mlcommons@mlperf-automations --docker_mlc_repo_branch=dev --adr.compiler.tags=gcc --device=cuda --use_model_from_host=yes --use_dataset_from_host=yes --results_dir=$HOME/gh_action_results --submission_dir=$HOME/gh_action_submissions --clean $docker_string --quiet
5560
5661
mlcr --tags=push,github,mlperf,inference,submission --repo_url=https://github.com/mlcommons/mlperf_inference_unofficial_submissions_v5.0 --repo_branch=auto-update --commit_message="Results from GH action on NVIDIA_$hw_name" --quiet --submission_dir=$HOME/gh_action_submissions --hw_name=$hw_name

0 commit comments

Comments
 (0)