# Source: github.com/apache/beam/sdks/v2@v2.48.2/python/container/base_image_requirements_manual.txt

###############################################################################
#  Licensed to the Apache Software Foundation (ASF) under one
#  or more contributor license agreements.  See the NOTICE file
#  distributed with this work for additional information
#  regarding copyright ownership.  The ASF licenses this file
#  to you under the Apache License, Version 2.0 (the
#  "License"); you may not use this file except in compliance
#  with the License.  You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
#  Unless required by applicable law or agreed to in writing, software
#  distributed under the License is distributed on an "AS IS" BASIS,
#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#  See the License for the specific language governing permissions and
#  limitations under the License.
###############################################################################

# This file has additional packages to install in Beam's containers.
# Do not specify dependencies that are already in Beam's setup.py.
# See generate_pip_requirements_list.sh to find which extras (e.g. gcp) are used.
# Do not specify a constrained version without a particular reason, so that
# we can pick up recent versions when regenerating the requirements.
# Consider constraining requirements of Beam itself when necessary.

bs4 # Commonly used HTML processing tool.
# Don't upgrade to Cython 3.x until it's released, stable, and we have consensus
# to upgrade. Use 0.xx for now.
cython<1
# future is no longer a Beam dependency, but is an implicit dependency in
# some versions of libraries that launch Beam pipelines, like tensorflow-transform.
# Leaving 'future' in our containers for now to prevent breaking tft users.
future
# TODO(https://github.com/GoogleCloudPlatform/cloud-profiler-python/issues/127): Unpin python version.
google-cloud-profiler;python_version<"3.11"
guppy3
mmh3 # Optimizes execution of some Beam codepaths. TODO: Make it Beam's dependency.
nltk # Commonly used for natural language processing.
nose==1.3.7 # For Dataflow internal testing. TODO: remove this.
# TODO: Unpin python version once python-snappy supports it.
# https://github.com/apache/beam/issues/25985
python-snappy;python_version<"3.11" # Optimizes execution of some Beam codepaths.
scipy
scikit-learn
tensorflow>=2.12.0;python_version>="3.8"