File tree Expand file tree Collapse file tree 3 files changed +10
-3
lines changed Expand file tree Collapse file tree 3 files changed +10
-3
lines changed Original file line number Diff line number Diff line change 15
15
matrix :
16
16
python-version : ["3.10", "3.11"]
17
17
container :
18
- image : us-central1-docker.pkg.dev/tpu-pytorch-releases/docker/xla:nightly_${{ matrix.python-version }}_tpuvm
18
+ image : us-central1-docker.pkg.dev/tpu-pytorch-releases/docker/xla:nightly_${{ matrix.python-version }}_tpuvm_20250217
19
19
steps :
20
20
- uses : actions/checkout@v4
21
21
- name : Install torchax
Original file line number Diff line number Diff line change 1
1
# syntax=docker/dockerfile:experimental
2
2
# Use torch_xla Python 3.10 as the base image
3
- # TODO(https://github.com/pytorch/xla/issues/8683): Go back to nightly once the linked segfault is fixed.
4
- FROM us-central1-docker.pkg.dev/tpu-pytorch-releases/docker/xla:r2.6.0_3.10_tpuvm_cxx11
3
+ FROM us-central1-docker.pkg.dev/tpu-pytorch-releases/docker/xla:nightly_3.10_tpuvm_20250217
5
4
6
5
ARG USE_TRANSFORMERS=false
7
6
# Install system dependencies
Original file line number Diff line number Diff line change 4
4
from datetime import datetime
5
5
from pathlib import Path
6
6
7
+ # Workaround for MegaScale crash
8
+ #
9
+ # TODO(https://github.com/pytorch/xla/issues/8683): Remove the
10
+ # `--megascale_grpc_enable_xor_tracer=false` flag when libtpu is updated
11
+ xla_flags = os .environ .get ("LIBTPU_INIT_ARGS" , "" )
12
+ xla_flags = f"{ xla_flags } --megascale_grpc_enable_xor_tracer=false"
13
+ os .environ ["LIBTPU_INIT_ARGS" ] = xla_flags
14
+
7
15
# Get the artifact dir from env var.
8
16
gcs_artifact_dir = os .environ ["TORCHPRIME_ARTIFACT_DIR" ]
9
17
assert gcs_artifact_dir .startswith (
You can’t perform that action at this time.
0 commit comments