github.com/apache/beam/sdks/v2@v2.48.2/python/container/base_image_requirements_manual.txt (about)

     1  
     2  ###############################################################################
     3  #  Licensed to the Apache Software Foundation (ASF) under one
     4  #  or more contributor license agreements.  See the NOTICE file
     5  #  distributed with this work for additional information
     6  #  regarding copyright ownership.  The ASF licenses this file
     7  #  to you under the Apache License, Version 2.0 (the
     8  #  "License"); you may not use this file except in compliance
     9  #  with the License.  You may obtain a copy of the License at
    10  #
    11  #      http://www.apache.org/licenses/LICENSE-2.0
    12  #
    13  #  Unless required by applicable law or agreed to in writing, software
    14  #  distributed under the License is distributed on an "AS IS" BASIS,
    15  #  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    16  #  See the License for the specific language governing permissions and
    17  # limitations under the License.
    18  ###############################################################################
    19  
    20  # This file has additional packages to install in Beam's containers.
    21  # Do not specify dependencies that are already in Beam's setup.py.
    22  # See generate_pip_requirements_list.sh to find which extras (e.g. gcp) are used.
    23  # Do not specify a constrained version without a particular reason, so that
    24  # we can pick up recent versions when regenerating the requirements.
    25  # Consider constraining requirements of Beam itself when necessary.
    26  
    27  bs4  # Commonly used HTML processing tool.
    28  # Don't upgrade to Cython 3.x until it is released and stable, and we have
    29  # consensus to upgrade. Use 0.xx for now.
    30  cython<1
    31  # future is no longer a Beam dependency, but is an implicit dependency in
    32  # some versions of libraries that launch Beam pipelines, like tensorflow-transform.
    33  # Leaving 'future' in our containers for now to prevent breaking tft users.
    34  future
    35  # TODO(https://github.com/GoogleCloudPlatform/cloud-profiler-python/issues/127): Unpin python version.
    36  google-cloud-profiler;python_version<"3.11"
    37  guppy3
    38  mmh3  # Optimizes execution of some Beam codepaths. TODO: Make it Beam's dependency.
    39  nltk  # Commonly used for natural language processing.
    40  nose==1.3.7  # For Dataflow internal testing. TODO: remove this.
    41  # TODO: Remove the python_version restriction once python-snappy supports Python 3.11+.
    42  # https://github.com/apache/beam/issues/25985
    43  python-snappy;python_version<"3.11"  # Optimizes execution of some Beam codepaths.
    44  scipy
    45  scikit-learn
    46  tensorflow>=2.12.0;python_version>="3.8"