@@ -34,7 +34,7 @@ RUN ln -s /usr/local/cuda/lib64/stubs/libcuda.so /usr/local/cuda/lib64/stubs/lib
3434{{ end }}
3535
3636# Keep these variables in sync if base image is updated.
37- ENV TENSORFLOW_VERSION=2.9.2
37+ ENV TENSORFLOW_VERSION=2.11.0
3838
3939# We need to redefine the ARG here to get the ARG value defined above the FROM instruction.
4040# See: https://docs.docker.com/engine/reference/builder/#understand-how-arg-and-from-interact
@@ -93,11 +93,10 @@ RUN conda config --add channels nvidia && \
9393{{ if eq .Accelerator "gpu" }}
9494
9595# b/232247930: uninstall pyarrow to avoid double installation with the GPU specific version.
96- # b/267180053: RapidsAI (cudf/cuml) are not compatible with the latest tensorflow cudatoolkit version.
97- # RUN pip uninstall -y pyarrow && \
98- # mamba install -y cudf cuml && \
99- # /tmp/clean-layer.sh
100- # {{ end }}
96+ RUN pip uninstall -y pyarrow && \
97+ mamba install -y cudf cuml && \
98+ /tmp/clean-layer.sh
99+ {{ end }}
101100
102101# Install implicit
103102{{ if eq .Accelerator "gpu" }}
@@ -114,12 +113,10 @@ COPY --from=torch_whl /tmp/whl/*.whl /tmp/torch/
114113RUN mamba install -c pytorch magma-cuda${CUDA_MAJOR_VERSION}${CUDA_MINOR_VERSION} && \
115114 pip install /tmp/torch/*.whl && \
116115 # b/255757999 openmp (libomp.so) is an dependency of libtorchtext and libtorchaudio but
117- # the built from source versions don't seem to properly link it in. This forces the dep
118- # which makes sure that libomp is loaded when these libraries are loaded.
119116 mamba install -y openmp && \
120- pip install patchelf && \
121- patchelf --add-needed libomp.so /opt/conda/lib/python3.7/site-packages/torchtext/lib/libtorchtext.so && \
122- patchelf --add-needed libomp.so /opt/conda/lib/python3.7/site-packages/torchaudio/lib/libtorchaudio.so && \
117+ # pip install patchelf && \
118+ # patchelf --add-needed libomp.so /opt/conda/lib/python3.7/site-packages/torchtext/lib/libtorchtext.so && \
119+ # patchelf --add-needed libomp.so /opt/conda/lib/python3.7/site-packages/torchaudio/lib/libtorchaudio.so && \
123120 rm -rf /tmp/torch && \
124121 /tmp/clean-layer.sh
125122{{ else }}
@@ -181,8 +178,7 @@ RUN pip install spacy && \
181178# No specific package for nnabla-ext-cuda 11.x minor versions.
182179RUN pip install pycuda \
183180 pynvrtc \
184- pynvml \
185- nnabla-ext-cuda${CUDA_MAJOR_VERSION}0 && \
181+ pynvml && \
186182 /tmp/clean-layer.sh
187183{{ end }}
188184
@@ -197,9 +193,10 @@ RUN pip install pysal \
197193 apt-get install -y default-jre-headless && \
198194 pip install -f https://h2o-release.s3.amazonaws.com/h2o/latest_stable_Py.html h2o \
199195 "tensorflow-gcs-config<=${TENSORFLOW_VERSION}" \
200- tensorflow-addons==0.17.1 \
201- tensorflow_decision_forests==0.2.7 \
202- tensorflow_text==2.9.0 && \
196+ "tensorflow==${TENSORFLOW_VERSION}" \
197+ tensorflow-addons \
198+ tensorflow_decision_forests \
199+ tensorflow_text && \
203200 /tmp/clean-layer.sh
204201
205202RUN apt-get install -y libfreetype6-dev && \
@@ -377,27 +374,34 @@ RUN pip install tensorpack && \
377374 memory_profiler && \
378375 /tmp/clean-layer.sh
379376
377+
378+
379+
380+ # Remove files that can't be uninstalled normally:
381+ RUN rm /opt/conda/lib/python3.7/site-packages/google*/REQUESTED
382+ RUN rm /opt/conda/lib/python3.7/site-packages/google*/direct_url.json
380383# install cython & cysignals before pyfasttext
381384RUN pip install cython \
382385 cysignals \
383386 pyfasttext \
384387 fasttext && \
385- apt-get install -y libhunspell-dev && pip install hunspell && \
386- pip install annoy \
387- category_encoders \
388- # google-cloud-automl 2.0.0 introduced incompatible API changes, need to pin to 1.0.1
388+ apt-get install -y libhunspell-dev && pip install hunspell
389+ RUN pip install annoy \
390+ category_encoders && \
391+ # b/183041606#comment5: the Kaggle data proxy doesn't support these APIs. If the library is missing, it falls back to using a regular BigQuery query to fetch data.
392+ pip uninstall -y google-cloud-bigquery-storage && \
393+ # google-cloud-automl 2.0.0 introduced incompatible API changes, need to pin to 1.0.1
394+ # After launch this should be installed from pip
395+ pip install git+https://github.com/googleapis/python-aiplatform.git@mb-release \
389396 google-cloud-automl==1.0.1 \
390397 google-api-core==1.33.2 \
391398 google-cloud-bigquery==2.2.0 \
392399 google-cloud-storage \
393400 google-cloud-translate==3.* \
394401 google-cloud-language==2.* \
395402 google-cloud-videointelligence==2.* \
396- google-cloud-vision==2.* && \
397- # b/183041606#comment5: the Kaggle data proxy doesn't support these APIs. If the library is missing, it falls back to using a regular BigQuery query to fetch data.
398- pip uninstall -y google-cloud-bigquery-storage && \
399- # After launch this should be installed from pip
400- pip install git+https://github.com/googleapis/python-aiplatform.git@mb-release \
403+ google-cloud-vision==2.* \
404+ protobuf==3.20.3 \
401405 ortools \
402406 scattertext \
403407 # Pandas data reader
@@ -416,6 +420,7 @@ RUN pip install cython \
416420
417421
418422# Fix qgrid by pinning ipywidgets https://github.com/quantopian/qgrid/issues/376
423+ # allennlp \
419424RUN pip install bleach \
420425 certifi \
421426 cycler \
@@ -468,9 +473,8 @@ RUN pip install bleach \
468473 pyarrow \
469474 feather-format \
470475 fastai \
471- allennlp \
472- importlib-metadata && \
473- python -m spacy download en_core_web_sm && python -m spacy download en_core_web_lg && \
476+ importlib-metadata
477+ RUN python -m spacy download en_core_web_sm && python -m spacy download en_core_web_lg && \
474478 apt-get install -y ffmpeg && \
475479 /tmp/clean-layer.sh
476480
@@ -497,7 +501,7 @@ RUN pip install flashtext \
497501 pympler \
498502 s3fs \
499503 featuretools \
500- -e git+https://github.com/SohierDane/BigQuery_Helper#egg=bq_helper \
504+ # -e git+https://github.com/SohierDane/BigQuery_Helper#egg=bq_helper \
501505 hpsklearn \
502506 git+https://github.com/Kaggle/learntools \
503507 kmapper \
@@ -524,8 +528,8 @@ RUN pip install flashtext \
524528 catalyst \
525529 # b/206990323 osmx 1.1.2 requires numpy >= 1.21 which we don't want.
526530 osmnx==1.1.1 && \
527- apt-get -y install libspatialindex-dev && \
528- pip install pytorch-ignite \
531+ apt-get -y install libspatialindex-dev
532+ RUN pip install pytorch-ignite \
529533 qgrid \
530534 bqplot \
531535 earthengine-api \
@@ -544,7 +548,7 @@ RUN pip install flashtext \
544548 # flask is used by agents in the simulation competitions.
545549 flask \
546550 # pycrypto is used by competitions team.
547- pycrypto \
551+ pycryptodome \
548552 easyocr \
549553 # ipympl adds interactive widget support for matplotlib
550554 ipympl==0.7.0 \
@@ -599,6 +603,8 @@ RUN pip install --upgrade dask && \
599603 ln -sf /usr/lib/x86_64-linux-gnu/libpixman-1.so.0.34.0 /opt/conda/lib/libpixman-1.so.0.38.0 && \
600604 /tmp/clean-layer.sh
601605
606+ RUN pip install setuptools==59.8.0 && pip install -e git+https://github.com/SohierDane/BigQuery_Helper#egg=bq_helper
607+
602608# Add BigQuery client proxy settings
603609ENV PYTHONUSERBASE "/root/.local"
604610ADD patches/kaggle_gcp.py /root/.local/lib/python3.7/site-packages/kaggle_gcp.py
0 commit comments