@@ -34,7 +34,7 @@ RUN ln -s /usr/local/cuda/lib64/stubs/libcuda.so /usr/local/cuda/lib64/stubs/lib
34
34
{{ end }}
35
35
36
36
# Keep these variables in sync if base image is updated.
37
# TENSORFLOW_VERSION is interpolated into the tensorflow-gcs-config and tensorflow pip requirement specifiers later in this file.
- ENV TENSORFLOW_VERSION=2.9.2
37
+ ENV TENSORFLOW_VERSION=2.11.0
38
38
39
39
# We need to redefine the ARG here to get the ARG value defined above the FROM instruction.
40
40
# See: https://docs.docker.com/engine/reference/builder/#understand-how-arg-and-from-interact
@@ -93,11 +93,10 @@ RUN conda config --add channels nvidia && \
93
93
{{ if eq .Accelerator "gpu" }}
94
94
95
95
# b/232247930: uninstall pyarrow to avoid double installation with the GPU specific version.
96
- # b/267180053: RapidsAI (cudf/cuml) are not compatible with the latest tensorflow cudatoolkit version.
97
- # RUN pip uninstall -y pyarrow && \
98
- # mamba install -y cudf cuml && \
99
- # /tmp/clean-layer.sh
100
- # {{ end }}
96
# GPU builds only (see the enclosing Accelerator check): pyarrow is removed with pip before cudf and cuml are installed with mamba.
+ RUN pip uninstall -y pyarrow && \
97
+ mamba install -y cudf cuml && \
98
+ /tmp/clean-layer.sh
99
+ {{ end }}
101
100
102
101
# Install implicit
103
102
{{ if eq .Accelerator "gpu" }}
@@ -114,12 +113,10 @@ COPY --from=torch_whl /tmp/whl/*.whl /tmp/torch/
114
113
RUN mamba install -c pytorch magma-cuda${CUDA_MAJOR_VERSION}${CUDA_MINOR_VERSION} && \
115
114
pip install /tmp/torch/*.whl && \
116
115
# b/255757999 openmp (libomp.so) is a dependency of libtorchtext and libtorchaudio but
117
- # the built from source versions don't seem to properly link it in. This forces the dep
118
- # which makes sure that libomp is loaded when these libraries are loaded.
119
116
mamba install -y openmp && \
120
- pip install patchelf && \
121
- patchelf --add-needed libomp.so /opt/conda/lib/python3.7/site-packages/torchtext/lib/libtorchtext.so && \
122
- patchelf --add-needed libomp.so /opt/conda/lib/python3.7/site-packages/torchaudio/lib/libtorchaudio.so && \
117
+ # pip install patchelf && \
118
+ # patchelf --add-needed libomp.so /opt/conda/lib/python3.7/site-packages/torchtext/lib/libtorchtext.so && \
119
+ # patchelf --add-needed libomp.so /opt/conda/lib/python3.7/site-packages/torchaudio/lib/libtorchaudio.so && \
123
120
rm -rf /tmp/torch && \
124
121
/tmp/clean-layer.sh
125
122
{{ else }}
@@ -181,8 +178,7 @@ RUN pip install spacy && \
181
178
# No specific package for nnabla-ext-cuda 11.x minor versions.
182
179
# Installs the listed CUDA-related Python packages with pip, then runs /tmp/clean-layer.sh in the same layer.
RUN pip install pycuda \
183
180
pynvrtc \
184
- pynvml \
185
- nnabla-ext-cuda${CUDA_MAJOR_VERSION}0 && \
181
+ pynvml && \
186
182
/tmp/clean-layer.sh
187
183
{{ end }}
188
184
@@ -197,9 +193,10 @@ RUN pip install pysal \
197
193
apt-get install -y default-jre-headless && \
198
194
pip install -f https://h2o-release.s3.amazonaws.com/h2o/latest_stable_Py.html h2o \
199
195
"tensorflow-gcs-config<=${TENSORFLOW_VERSION}" \
200
- tensorflow-addons==0.17.1 \
201
- tensorflow_decision_forests==0.2.7 \
202
- tensorflow_text==2.9.0 && \
196
+ "tensorflow==${TENSORFLOW_VERSION}" \
197
+ tensorflow-addons \
198
+ tensorflow_decision_forests \
199
+ tensorflow_text && \
203
200
/tmp/clean-layer.sh
204
201
205
202
RUN apt-get install -y libfreetype6-dev && \
@@ -377,27 +374,34 @@ RUN pip install tensorpack && \
377
374
memory_profiler && \
378
375
/tmp/clean-layer.sh
379
376
377
+
378
+
379
+
380
+ # Remove files that can't be uninstalled normally:
381
# Each glob expands over every site-packages entry whose name starts with "google".
# NOTE(review): rm is called without -f, so a glob that matches nothing fails the build — confirm that is intended.
+ RUN rm /opt/conda/lib/python3.7/site-packages/google*/REQUESTED
382
+ RUN rm /opt/conda/lib/python3.7/site-packages/google*/direct_url.json
380
383
# install cython & cysignals before pyfasttext
381
384
RUN pip install cython \
382
385
cysignals \
383
386
pyfasttext \
384
387
fasttext && \
385
- apt-get install -y libhunspell-dev && pip install hunspell && \
386
- pip install annoy \
387
- category_encoders \
388
- # google-cloud-automl 2.0.0 introduced incompatible API changes, need to pin to 1.0.1
388
+ apt-get install -y libhunspell-dev && pip install hunspell
389
+ RUN pip install annoy \
390
+ category_encoders && \
391
+ # b/183041606#comment5: the Kaggle data proxy doesn't support these APIs. If the library is missing, it falls back to using a regular BigQuery query to fetch data.
392
+ pip uninstall -y google-cloud-bigquery-storage && \
393
+ # google-cloud-automl 2.0.0 introduced incompatible API changes, need to pin to 1.0.1
394
+ # After launch this should be installed from pip
395
+ pip install git+https://github.com/googleapis/python-aiplatform.git@mb-release \
389
396
google-cloud-automl==1.0.1 \
390
397
google-api-core==1.33.2 \
391
398
google-cloud-bigquery==2.2.0 \
392
399
google-cloud-storage \
393
400
google-cloud-translate==3.* \
394
401
google-cloud-language==2.* \
395
402
google-cloud-videointelligence==2.* \
396
- google-cloud-vision==2.* && \
397
- # b/183041606#comment5: the Kaggle data proxy doesn't support these APIs. If the library is missing, it falls back to using a regular BigQuery query to fetch data.
398
- pip uninstall -y google-cloud-bigquery-storage && \
399
- # After launch this should be installed from pip
400
- pip install git+https://github.com/googleapis/python-aiplatform.git@mb-release \
403
+ google-cloud-vision==2.* \
404
+ protobuf==3.20.3 \
401
405
ortools \
402
406
scattertext \
403
407
# Pandas data reader
@@ -416,6 +420,7 @@ RUN pip install cython \
416
420
417
421
418
422
# Fix qgrid by pinning ipywidgets https://github.com/quantopian/qgrid/issues/376
423
+ # allennlp \
419
424
RUN pip install bleach \
420
425
certifi \
421
426
cycler \
@@ -468,9 +473,8 @@ RUN pip install bleach \
468
473
pyarrow \
469
474
feather-format \
470
475
fastai \
471
- allennlp \
472
- importlib-metadata && \
473
- python -m spacy download en_core_web_sm && python -m spacy download en_core_web_lg && \
476
+ importlib-metadata
477
+ RUN python -m spacy download en_core_web_sm && python -m spacy download en_core_web_lg && \
474
478
apt-get install -y ffmpeg && \
475
479
/tmp/clean-layer.sh
476
480
@@ -497,7 +501,7 @@ RUN pip install flashtext \
497
501
pympler \
498
502
s3fs \
499
503
featuretools \
500
- -e git+https://github.com/SohierDane/BigQuery_Helper#egg=bq_helper \
504
+ # -e git+https://github.com/SohierDane/BigQuery_Helper#egg=bq_helper \
501
505
hpsklearn \
502
506
git+https://github.com/Kaggle/learntools \
503
507
kmapper \
@@ -524,8 +528,8 @@ RUN pip install flashtext \
524
528
catalyst \
525
529
# b/206990323 osmnx 1.1.2 requires numpy >= 1.21 which we don't want.
526
530
osmnx==1.1.1 && \
527
- apt-get -y install libspatialindex-dev && \
528
- pip install pytorch-ignite \
531
+ apt-get -y install libspatialindex-dev
532
+ RUN pip install pytorch-ignite \
529
533
qgrid \
530
534
bqplot \
531
535
earthengine-api \
@@ -544,7 +548,7 @@ RUN pip install flashtext \
544
548
# flask is used by agents in the simulation competitions.
545
549
flask \
546
550
# pycryptodome (replacing pycrypto) is used by the competitions team.
547
- pycrypto \
551
+ pycryptodome \
548
552
easyocr \
549
553
# ipympl adds interactive widget support for matplotlib
550
554
ipympl==0.7.0 \
@@ -599,6 +603,8 @@ RUN pip install --upgrade dask && \
599
603
ln -sf /usr/lib/x86_64-linux-gnu/libpixman-1.so.0.34.0 /opt/conda/lib/libpixman-1.so.0.38.0 && \
600
604
/tmp/clean-layer.sh
601
605
606
# bq_helper is installed in its own step, in editable mode, right after setuptools is pinned to 59.8.0.
# NOTE(review): presumably the editable install breaks with newer setuptools — confirm and record the reason here.
+ RUN pip install setuptools==59.8.0 && pip install -e git+https://github.com/SohierDane/BigQuery_Helper#egg=bq_helper
607
+
602
608
# Add BigQuery client proxy settings
603
609
ENV PYTHONUSERBASE "/root/.local"
604
610
ADD patches/kaggle_gcp.py /root/.local/lib/python3.7/site-packages/kaggle_gcp.py
0 commit comments