@@ -10,7 +10,7 @@ ARG TORCHVISION_VERSION
10
10
11
11
{{ if eq .Accelerator "gpu" }}
12
12
FROM gcr.io/kaggle-images/python-lightgbm-whl:${GPU_BASE_IMAGE_NAME}-${BASE_IMAGE_TAG}-${LIGHTGBM_VERSION} AS lightgbm_whl
13
- FROM gcr.io/kaggle-images/python-torch-whl:${GPU_BASE_IMAGE_NAME}-${BASE_IMAGE_TAG}-${TORCH_VERSION} AS torch_whl
13
+ # FROM gcr.io/kaggle-images/python-torch-whl:${GPU_BASE_IMAGE_NAME}-${BASE_IMAGE_TAG}-${TORCH_VERSION} AS torch_whl
14
14
FROM ${BASE_IMAGE_REPO}/${GPU_BASE_IMAGE_NAME}:${BASE_IMAGE_TAG}
15
15
{{ else }}
16
16
FROM ${BASE_IMAGE_REPO}/${CPU_BASE_IMAGE_NAME}:${BASE_IMAGE_TAG}
@@ -34,7 +34,7 @@ RUN ln -s /usr/local/cuda/lib64/stubs/libcuda.so /usr/local/cuda/lib64/stubs/lib
34
34
{{ end }}
35
35
36
36
# Keep these variables in sync if base image is updated.
37
- ENV TENSORFLOW_VERSION=2.9.2
37
+ ENV TENSORFLOW_VERSION=2.11.0
38
38
39
39
# We need to redefine the ARG here to get the ARG value defined above the FROM instruction.
40
40
# See: https://docs.docker.com/engine/reference/builder/#understand-how-arg-and-from-interact
@@ -93,11 +93,10 @@ RUN conda config --add channels nvidia && \
93
93
{{ if eq .Accelerator "gpu" }}
94
94
95
95
# b/232247930: uninstall pyarrow to avoid double installation with the GPU-specific version.
96
- # b/267180053: RapidsAI (cudf/cuml) are not compatible with the latest tensorflow cudatoolkit version.
97
- # RUN pip uninstall -y pyarrow && \
98
- # mamba install -y cudf cuml && \
99
- # /tmp/clean-layer.sh
100
- # {{ end }}
96
+ RUN pip uninstall -y pyarrow && \
97
+ mamba install -y cudf cuml && \
98
+ /tmp/clean-layer.sh
99
+ {{ end }}
101
100
102
101
# Install implicit
103
102
{{ if eq .Accelerator "gpu" }}
@@ -110,17 +109,17 @@ RUN mamba install implicit && \
110
109
111
110
# Install PyTorch
112
111
{{ if eq .Accelerator "gpu" }}
113
- COPY --from=torch_whl /tmp/whl/*.whl /tmp/torch/
112
+ # COPY --from=torch_whl /tmp/whl/*.whl /tmp/torch/
114
113
RUN mamba install -c pytorch magma-cuda${CUDA_MAJOR_VERSION}${CUDA_MINOR_VERSION} && \
115
- pip install /tmp/torch/*.whl && \
114
+ # pip install /tmp/torch/*.whl && \
116
115
# b/255757999 openmp (libomp.so) is a dependency of libtorchtext and libtorchaudio but
117
116
# the built-from-source versions don't seem to properly link it in. This forces the dep
118
117
# which makes sure that libomp is loaded when these libraries are loaded.
119
- mamba install -y openmp && \
120
- pip install patchelf && \
121
- patchelf --add-needed libomp.so /opt/conda/lib/python3.7/site-packages/torchtext/lib/libtorchtext.so && \
122
- patchelf --add-needed libomp.so /opt/conda/lib/python3.7/site-packages/torchaudio/lib/libtorchaudio.so && \
123
- rm -rf /tmp/torch && \
118
+ pip install torch==1.12.1+cu113 torchvision==0.13.1+cu113 torchaudio==0.12.1 --extra-index-url https://download.pytorch.org/whl/cu113 && \
119
+ # pip install patchelf && \
120
+ # patchelf --add-needed libomp.so /opt/conda/lib/python3.7/site-packages/torchtext/lib/libtorchtext.so && \
121
+ # patchelf --add-needed libomp.so /opt/conda/lib/python3.7/site-packages/torchaudio/lib/libtorchaudio.so && \
122
+ # rm -rf /tmp/torch && \
124
123
/tmp/clean-layer.sh
125
124
{{ else }}
126
125
RUN pip install \
@@ -376,22 +375,24 @@ RUN pip install tensorpack && \
376
375
/tmp/clean-layer.sh
377
376
378
377
# install cython & cysignals before pyfasttext
378
+ RUN rm /opt/conda/lib/python3.7/site-packages/*/direct_url.json
379
379
RUN pip install cython \
380
380
cysignals \
381
381
pyfasttext \
382
382
fasttext && \
383
- apt-get install -y libhunspell-dev && pip install hunspell && \
384
- pip install annoy \
385
- category_encoders \
383
+ apt-get install -y libhunspell-dev && pip install hunspell
384
+ RUN pip install annoy \
385
+ category_encoders && \
386
+ # TODO: confirm the google-cloud-* packages below are already installed before dropping these pins.
386
387
# google-cloud-automl 2.0.0 introduced incompatible API changes, need to pin to 1.0.1
387
- google-cloud-automl==1.0.1 \
388
- google-api-core==1.33.2 \
389
- google-cloud-bigquery==2.2.0 \
390
- google-cloud-storage \
391
- google-cloud-translate==3.* \
392
- google-cloud-language==2.* \
393
- google-cloud-videointelligence==2.* \
394
- google-cloud-vision==2.* && \
388
+ # google-cloud-automl==1.0.1 \
389
+ # google-api-core==1.33.2 \
390
+ # google-cloud-bigquery==2.2.0 \
391
+ # google-cloud-storage \
392
+ # google-cloud-translate==3.* \
393
+ # google-cloud-language==2.* \
394
+ # google-cloud-videointelligence==2.* \
395
+ # google-cloud-vision==2.* && \
395
396
# b/183041606#comment5: the Kaggle data proxy doesn't support these APIs. If the library is missing, it falls back to using a regular BigQuery query to fetch data.
396
397
pip uninstall -y google-cloud-bigquery-storage && \
397
398
# After launch this should be installed from pip
@@ -414,6 +415,7 @@ RUN pip install cython \
414
415
415
416
416
417
# Fix qgrid by pinning ipywidgets https://github.com/quantopian/qgrid/issues/376
418
+ # allennlp \
417
419
RUN pip install bleach \
418
420
certifi \
419
421
cycler \
@@ -466,11 +468,10 @@ RUN pip install bleach \
466
468
pyarrow \
467
469
feather-format \
468
470
fastai \
469
- allennlp \
470
- importlib-metadata && \
471
- python -m spacy download en_core_web_sm && python -m spacy download en_core_web_lg && \
472
- apt-get install -y ffmpeg && \
473
- /tmp/clean-layer.sh
471
+ importlib-metadata
472
+ #RUN python -m spacy download en_core_web_sm && python -m spacy download en_core_web_lg && \
473
+ # apt-get install -y ffmpeg && \
474
+ # /tmp/clean-layer.sh
474
475
475
476
###########
476
477
#
@@ -495,7 +496,7 @@ RUN pip install flashtext \
495
496
pympler \
496
497
s3fs \
497
498
featuretools \
498
- -e git+https://github.com/SohierDane/BigQuery_Helper#egg=bq_helper \
499
+ # -e git+https://github.com/SohierDane/BigQuery_Helper#egg=bq_helper \
499
500
hpsklearn \
500
501
git+https://github.com/Kaggle/learntools \
501
502
kmapper \
@@ -526,7 +527,7 @@ RUN pip install flashtext \
526
527
pip install pytorch-ignite \
527
528
qgrid \
528
529
bqplot \
529
- earthengine-api \
530
+ # earthengine-api \
530
531
transformers \
531
532
# b/232247930 >= 2.2.0 requires pyarrow >= 6.0.0 which conflicts with dependencies for rapidsai 0.21.*
532
533
datasets==2.1.0 \
0 commit comments