diff --git a/.github/workflows/merlin.yml b/.github/workflows/merlin.yml index e716b14f9..0a91eec6d 100644 --- a/.github/workflows/merlin.yml +++ b/.github/workflows/merlin.yml @@ -42,7 +42,7 @@ jobs: strategy: fail-fast: false matrix: - python-version: ["3.7", "3.8", "3.9", "3.10"] #TODO: Remove Python 3.7 support + python-version: ["3.8", "3.9", "3.10"] env: PIPENV_DEFAULT_PYTHON_VERSION: ${{ matrix.python-version }} steps: @@ -74,7 +74,7 @@ jobs: strategy: fail-fast: false matrix: - python-version: ["3.7", "3.8", "3.9", "3.10"] #TODO: Remove Python 3.7 support + python-version: ["3.8", "3.9", "3.10"] env: PIPENV_DEFAULT_PYTHON_VERSION: ${{ matrix.python-version }} steps: @@ -263,7 +263,7 @@ jobs: strategy: fail-fast: false matrix: - python-version: ["37", "38", "39", "310"] + python-version: ["38", "39", "310"] needs: - create-version steps: @@ -284,7 +284,7 @@ jobs: strategy: fail-fast: false matrix: - python-version: ["37", "38", "39", "310"] + python-version: ["38", "39", "310"] needs: - create-version steps: diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml index a43ceb164..dbc517a3f 100644 --- a/.github/workflows/release.yml +++ b/.github/workflows/release.yml @@ -63,8 +63,7 @@ jobs: working-directory: ./python/sdk run: | IMAGE_TAG="${{ env.CONTAINER_REGISTRY }}/merlin-sdk:py${{ matrix.python-version }}-${{ inputs.version }}" - SDK_VERSION="$(sed 's/^v\(.*\)-/\1/' <<< "${{ inputs.version }}")" - docker build -t ${IMAGE_TAG} --build-arg PYTHON_VERSION=${{ matrix.python-version }} --build-arg VERSION=${SDK_VERSION} . + docker build -t ${IMAGE_TAG} --build-arg PYTHON_VERSION=${{ matrix.python-version }} . docker push ${IMAGE_TAG} publish-api: @@ -106,7 +105,7 @@ jobs: strategy: fail-fast: false matrix: - python-version: ["37", "38", "39", "310"] + python-version: ["38", "39", "310"] steps: - name: Log in to the Container registry uses: docker/login-action@v1 @@ -132,7 +131,7 @@ jobs: strategy: fail-fast: false matrix: - python-version: ["37", "38", "39", "310"] + python-version: ["38", "39", "310"] steps: - name: Log in to the Container registry uses: docker/login-action@v1 diff --git a/Makefile b/Makefile index 8f0a0c121..00dc2b5e7 100644 --- a/Makefile +++ b/Makefile @@ -12,7 +12,7 @@ TEST_TAGS?= GOLANGCI_LINT_VERSION="v1.51.2" PROTOC_GEN_GO_JSON_VERSION="v1.1.0" PROTOC_GEN_GO_VERSION="v1.26" -PYTHON_VERSION ?= "37" #set as 37 38 39 310 for 3.7-3.10 respectively +PYTHON_VERSION ?= "39" #set as 38 39 310 for 3.8-3.10 respectively all: setup init-dep lint test clean build run diff --git a/examples/batch/env.yaml b/examples/batch/env.yaml index 525de4685..258b26116 100644 --- a/examples/batch/env.yaml +++ b/examples/batch/env.yaml @@ -2,6 +2,6 @@ dependencies: - pip: - joblib>=0.13.0,<1.2.0 # >=1.2.0 upon upgrade of kserve's version - numpy>=1.19.5 - - scikit-learn==1.0.2 #TODO: >=1.1.2 upon python 3.7 deprecation + - scikit-learn>=1.1.2 - xgboost==1.6.2 - - mlflow==1.23.0 \ No newline at end of file + - mlflow==1.26.1 \ No newline at end of file diff --git a/examples/batch/requirements.txt b/examples/batch/requirements.txt index 867ba1313..f28cb2246 100644 --- a/examples/batch/requirements.txt +++ b/examples/batch/requirements.txt @@ -1,8 +1,8 @@ joblib>=0.13.0,<1.2.0 # >=1.2.0 upon upgrade of kserve's version numpy>=1.19.5 -scikit-learn==1.0.2 #TODO: >=1.1.2 upon python 3.7 deprecation +scikit-learn>=1.1.2 xgboost==1.6.2 -mlflow==1.23.0 +mlflow==1.26.1 merlin-sdk cloudpickle==2.0.0 google-cloud diff --git a/examples/custom-model/http_json/requirements.txt b/examples/custom-model/http_json/requirements.txt index 65c525967..94b54e531 100644 --- a/examples/custom-model/http_json/requirements.txt +++ b/examples/custom-model/http_json/requirements.txt @@ -1,3 +1,3 @@ -scikit-learn==1.0.2 #TODO: >=1.1.2 upon python 3.7 deprecation +scikit-learn>=1.1.2 xgboost==1.6.2 merlin-sdk \ No newline at end of file diff --git a/examples/model-endpoint/requirements.txt b/examples/model-endpoint/requirements.txt index f9f15f6c0..359564de6 100644 --- a/examples/model-endpoint/requirements.txt +++ b/examples/model-endpoint/requirements.txt @@ -1,4 +1,4 @@ -scikit-learn==1.0.2 #TODO: >=1.1.2 upon python 3.7 deprecation +scikit-learn>=1.1.2 merlin-sdk joblib>=0.13.0,<1.2.0 # >=1.2.0 upon upgrade of kserve's version cloudpickle==2.0.0 \ No newline at end of file diff --git a/examples/pyfunc/env.yaml b/examples/pyfunc/env.yaml index c170d7bf9..a3db7a247 100644 --- a/examples/pyfunc/env.yaml +++ b/examples/pyfunc/env.yaml @@ -2,5 +2,5 @@ dependencies: - python=3.8 - pip: - joblib>=0.13.0,<1.2.0 # >=1.2.0 upon upgrade of kserve's version - - scikit-learn==1.1.2 #TODO: >=1.1.2 upon python 3.7 deprecation + - scikit-learn>=1.1.2 - xgboost==1.6.2 diff --git a/examples/pyfunc/requirements.txt b/examples/pyfunc/requirements.txt index c94dc0bb9..ee4923e7f 100644 --- a/examples/pyfunc/requirements.txt +++ b/examples/pyfunc/requirements.txt @@ -1,4 +1,4 @@ -scikit-learn==1.0.2 #TODO: >=1.1.2 upon python 3.7 deprecation +scikit-learn>=1.1.2 joblib>=0.13.0,<1.2.0 # >=1.2.0 upon upgrade of kserve's version xgboost==1.6.2 merlin-sdk diff --git a/examples/resource-request-gpu/requirements.txt b/examples/resource-request-gpu/requirements.txt index f9f15f6c0..359564de6 100644 --- a/examples/resource-request-gpu/requirements.txt +++ b/examples/resource-request-gpu/requirements.txt @@ -1,4 +1,4 @@ -scikit-learn==1.0.2 #TODO: >=1.1.2 upon python 3.7 deprecation +scikit-learn>=1.1.2 merlin-sdk joblib>=0.13.0,<1.2.0 # >=1.2.0 upon upgrade of kserve's version cloudpickle==2.0.0 \ No newline at end of file diff --git a/examples/resource-request/requirements.txt b/examples/resource-request/requirements.txt index f9f15f6c0..359564de6 100644 --- a/examples/resource-request/requirements.txt +++ b/examples/resource-request/requirements.txt @@ -1,4 +1,4 @@ -scikit-learn==1.0.2 #TODO: >=1.1.2 upon python 3.7 deprecation +scikit-learn>=1.1.2 merlin-sdk joblib>=0.13.0,<1.2.0 # >=1.2.0 upon upgrade of kserve's version cloudpickle==2.0.0 \ No newline at end of file diff --git a/examples/sklearn/requirements.txt b/examples/sklearn/requirements.txt index f9f15f6c0..359564de6 100644 --- a/examples/sklearn/requirements.txt +++ b/examples/sklearn/requirements.txt @@ -1,4 +1,4 @@ -scikit-learn==1.0.2 #TODO: >=1.1.2 upon python 3.7 deprecation +scikit-learn>=1.1.2 merlin-sdk joblib>=0.13.0,<1.2.0 # >=1.2.0 upon upgrade of kserve's version cloudpickle==2.0.0 \ No newline at end of file diff --git a/examples/xgboost/requirements.txt b/examples/xgboost/requirements.txt index 916acd8da..054f198eb 100644 --- a/examples/xgboost/requirements.txt +++ b/examples/xgboost/requirements.txt @@ -1,4 +1,4 @@ -scikit-learn==1.0.2 #TODO: >=1.1.2 upon python 3.7 deprecation +scikit-learn>=1.1.2 xgboost==1.6.2 merlin-sdk cloudpickle==2.0.0 \ No newline at end of file diff --git a/python/batch-predictor/README.md b/python/batch-predictor/README.md index c16762782..9e3745b32 100644 --- a/python/batch-predictor/README.md +++ b/python/batch-predictor/README.md @@ -69,7 +69,7 @@ OBJC_DISABLE_INITIALIZE_FORK_SAFETY=YES python main.py --job-name iris-predictio ### Requirements -- python 3.7.0 +- python >= 3.8.0 - pipenv (install using `pip install pipenv`) - protoc (see [installation instruction](http://google.github.io/proto-lens/installing-protoc.html)) - gcloud (see [installation instruction](https://cloud.google.com/sdk/install)) diff --git a/python/batch-predictor/docker/app.Dockerfile b/python/batch-predictor/docker/app.Dockerfile index f630c000a..1f8582da4 100644 --- a/python/batch-predictor/docker/app.Dockerfile +++ b/python/batch-predictor/docker/app.Dockerfile @@ -24,6 +24,6 @@ ARG GOOGLE_APPLICATION_CREDENTIALS RUN if [[ ! -z "$GOOGLE_APPLICATION_CREDENTIALS" ]]; then gcloud auth activate-service-account --key-file=${GOOGLE_APPLICATION_CREDENTIALS}; fi RUN gsutil -m cp -r ${MODEL_URL} . RUN /bin/bash -c ". activate ${CONDA_ENVIRONMENT} && \ - sed -i 's/mlflow$/mlflow==1.23.0/' ${HOME}/model/conda.yaml && \ + sed -i 's/mlflow\(\s*==\s*[^ ]*\)\{0,1\}/mlflow==1.26.1/g' ${HOME}/model/conda.yaml && \ conda env update --name ${CONDA_ENVIRONMENT} --file ${HOME}/model/conda.yaml && \ python ${HOME}/merlin-spark-app/main.py --dry-run-model ${HOME}/model" diff --git a/python/batch-predictor/docker/base.Dockerfile b/python/batch-predictor/docker/base.Dockerfile index ea51d3901..3a8af51b6 100644 --- a/python/batch-predictor/docker/base.Dockerfile +++ b/python/batch-predictor/docker/base.Dockerfile @@ -12,7 +12,7 @@ # See the License for the specific language governing permissions and # limitations under the License. -FROM gcr.io/spark-operator/spark-py:v3.0.0 +FROM apache/spark-py:v3.1.3 # Switch to user root so we can add additional jars and configuration files. USER root diff --git a/python/batch-predictor/docker/env37.yaml b/python/batch-predictor/docker/env37.yaml deleted file mode 100644 index f02ff6fd7..000000000 --- a/python/batch-predictor/docker/env37.yaml +++ /dev/null @@ -1,8 +0,0 @@ -name: merlin-model -dependencies: - - python=3.7 - - pip=22.2.2 - - pip: - - -r ../requirements.txt - - --extra-index-url=https://test.pypi.org/simple - - --trusted-host=test.pypi.org diff --git a/python/batch-predictor/merlinpyspark/model.py b/python/batch-predictor/merlinpyspark/model.py index cbeff1e0e..9a47555f0 100644 --- a/python/batch-predictor/merlinpyspark/model.py +++ b/python/batch-predictor/merlinpyspark/model.py @@ -67,7 +67,7 @@ def spark_udf(spark, model_uri, features, result_type="double"): archive_path = SparkModelCache.add_local_model(spark, local_model_path) def predict(*args): - model = SparkModelCache.get_or_load(archive_path) + model, _ = SparkModelCache.get_or_load(archive_path) schema = {features[i]: arg for i, arg in enumerate(args)} pdf = None for x in args: diff --git a/python/batch-predictor/requirements.txt b/python/batch-predictor/requirements.txt index c7624d8d2..10499e497 100644 --- a/python/batch-predictor/requirements.txt +++ b/python/batch-predictor/requirements.txt @@ -1,8 +1,7 @@ findspark pyspark==3.0.1 -mlflow>=1.2.0,<=1.23.0 +mlflow>=1.26.1,<2.0.0 cloudpickle==2.0.0 pyarrow>=0.14.1,<=9.0.0 -protobuf>=3.0,<4.0.0 -#TODO: Update merlin-sdk dep to: file:${SDK_PATH}#egg=merlin-sdk -merlin-sdk==0.33.0 # Pin to the version that supports Python 3.7. +protobuf>=3.0,<5.0.0 +file:${SDK_PATH}#egg=merlin-sdk diff --git a/python/batch-predictor/requirements_test.txt b/python/batch-predictor/requirements_test.txt index d1bf453d4..67b37771f 100644 --- a/python/batch-predictor/requirements_test.txt +++ b/python/batch-predictor/requirements_test.txt @@ -2,9 +2,7 @@ pytest pytest-cov mypy google-cloud-bigquery -scikit-learn==1.0.2 #TODO: >=1.1.2 upon python 3.7 deprecation +scikit-learn>=1.1.2 joblib>=0.13.0,<1.2.0 # >=1.2.0 upon upgrade of kserve's version mypy-protobuf>=1.19 -types-PyYAML -protobuf<4.0.0 -grpcio<1.49.0 \ No newline at end of file +types-PyYAML \ No newline at end of file diff --git a/python/batch-predictor/setup.py b/python/batch-predictor/setup.py index f4b10f427..7b9fc6bee 100644 --- a/python/batch-predictor/setup.py +++ b/python/batch-predictor/setup.py @@ -21,12 +21,11 @@ with open('requirements.txt') as f: REQUIRE = f.read().splitlines() -# TODO: Uncomment below lines after Pyfunc server stops supporting Python 3.7 -# merlin_path = os.path.join(os.getcwd(), "../sdk") -# merlin_sdk_package = "merlin-sdk" -# for index, item in enumerate(REQUIRE): -# if merlin_sdk_package in item: -# REQUIRE[index] = f"{merlin_sdk_package} @ file://localhost/{merlin_path}#egg={merlin_sdk_package}" +merlin_path = os.path.join(os.getcwd(), "../sdk") +merlin_sdk_package = "merlin-sdk" +for index, item in enumerate(REQUIRE): + if merlin_sdk_package in item: + REQUIRE[index] = f"{merlin_sdk_package} @ file://localhost/{merlin_path}#egg={merlin_sdk_package}" setup( name='merlin-pyspark-app', @@ -34,7 +33,7 @@ author_email='merlin-dev@gojek.com', description='Base pyspark application for running merlin prediction job', long_description=open('README.md').read(), - python_requires='>=3.7,<3.11', + python_requires='>=3.8,<3.11', packages=find_packages("merlinpyspark"), install_requires=REQUIRE, tests_require=TEST_REQUIRE, diff --git a/python/batch-predictor/test-model/conda.yaml b/python/batch-predictor/test-model/conda.yaml index fcba475e2..a05d8495e 100644 --- a/python/batch-predictor/test-model/conda.yaml +++ b/python/batch-predictor/test-model/conda.yaml @@ -1,4 +1,4 @@ dependencies: - pip: - - scikit-learn==1.0.2 #TODO: >=1.1.2 upon python 3.7 deprecation + - scikit-learn>=1.1.2 - joblib>=0.13.0,<1.2.0 # >=1.2.0 upon upgrade of kserve's version diff --git a/python/pyfunc-scaffolding/{{cookiecutter.model_slug}}/Pipfile b/python/pyfunc-scaffolding/{{cookiecutter.model_slug}}/Pipfile index 6febd113d..6a7f88af9 100644 --- a/python/pyfunc-scaffolding/{{cookiecutter.model_slug}}/Pipfile +++ b/python/pyfunc-scaffolding/{{cookiecutter.model_slug}}/Pipfile @@ -7,4 +7,4 @@ verify_ssl = true merlin-sdk = "=={{ cookiecutter.merlin_sdk_version }}" [requires] -python_version = "3.7" +python_version = "3.8" diff --git a/python/pyfunc-server/docker/Dockerfile b/python/pyfunc-server/docker/Dockerfile index 380b60424..807e8bed3 100644 --- a/python/pyfunc-server/docker/Dockerfile +++ b/python/pyfunc-server/docker/Dockerfile @@ -24,7 +24,7 @@ WORKDIR /pyfunc-server RUN if [ ! -z "$GOOGLE_APPLICATION_CREDENTIALS" ]; then gcloud auth activate-service-account --key-file=${GOOGLE_APPLICATION_CREDENTIALS}; fi RUN gsutil cp -r ${MODEL_URL} . RUN /bin/bash -c ". activate merlin-model && \ - sed -i 's/mlflow$/mlflow==1.23.0/' model/conda.yaml && \ + sed -i 's/mlflow\(\s*==\s*[^ ]*\)\{0,1\}/mlflow==1.26.1/g' model/conda.yaml && \ conda env update --name merlin-model --file model/conda.yaml && \ python -m pyfuncserver --model_dir model --dry_run" diff --git a/python/pyfunc-server/docker/env37.yaml b/python/pyfunc-server/docker/env37.yaml deleted file mode 100644 index f02ff6fd7..000000000 --- a/python/pyfunc-server/docker/env37.yaml +++ /dev/null @@ -1,8 +0,0 @@ -name: merlin-model -dependencies: - - python=3.7 - - pip=22.2.2 - - pip: - - -r ../requirements.txt - - --extra-index-url=https://test.pypi.org/simple - - --trusted-host=test.pypi.org diff --git a/python/pyfunc-server/requirements.txt b/python/pyfunc-server/requirements.txt index 8acae2198..b1b86e5e5 100644 --- a/python/pyfunc-server/requirements.txt +++ b/python/pyfunc-server/requirements.txt @@ -12,5 +12,4 @@ grpcio<1.49.0 grpcio-reflection<1.49.0 grpcio-tools<1.49.0 grpcio-health-checking<1.49.0 -#TODO: Update merlin-sdk dep to: file:${SDK_PATH}#egg=merlin-sdk -merlin-sdk==0.33.0 # Pin to the version that supports Python 3.7. +file:${SDK_PATH}#egg=merlin-sdk diff --git a/python/pyfunc-server/setup.py b/python/pyfunc-server/setup.py index e25cbb30b..28c1b18b7 100644 --- a/python/pyfunc-server/setup.py +++ b/python/pyfunc-server/setup.py @@ -31,12 +31,11 @@ # replace merlin relative path in requirements.txt into absolute path # setuptools could not install relative path requirements -# TODO: Uncomment below lines after Pyfunc server stops supporting Python 3.7 -# merlin_path = os.path.join(os.getcwd(), "../sdk") -# merlin_sdk_package = "merlin-sdk" -# for index, item in enumerate(REQUIRE): -# if merlin_sdk_package in item: -# REQUIRE[index] = f"{merlin_sdk_package} @ file://localhost/{merlin_path}#egg={merlin_sdk_package}" +merlin_path = os.path.join(os.getcwd(), "../sdk") +merlin_sdk_package = "merlin-sdk" +for index, item in enumerate(REQUIRE): + if merlin_sdk_package in item: + REQUIRE[index] = f"{merlin_sdk_package} @ file://localhost/{merlin_path}#egg={merlin_sdk_package}" setup( name='pyfuncserver', @@ -45,7 +44,7 @@ description='Model Server implementation for mlflow pyfunc model', long_description=open('README.md').read(), long_description_content_type='text/markdown', - python_requires='>=3.7,<3.11', + python_requires='>=3.8,<3.11', packages=find_packages(exclude=["test"]), install_requires=REQUIRE, tests_require=tests_require, diff --git a/python/sdk/Dockerfile b/python/sdk/Dockerfile index e6dd237b8..b2968dc22 100644 --- a/python/sdk/Dockerfile +++ b/python/sdk/Dockerfile @@ -10,7 +10,5 @@ RUN apt-get update && apt-get install build-essential curl vim wget -y COPY . .${WORKDIR} -ARG VERSION - -RUN pip install merlin-sdk==${VERSION} -RUN pip install merlin-sdk[test]==${VERSION} +RUN pip install . +RUN pip install ".[test]" diff --git a/python/sdk/setup.py b/python/sdk/setup.py index 0ebb50f88..9b42f1e8b 100644 --- a/python/sdk/setup.py +++ b/python/sdk/setup.py @@ -30,8 +30,8 @@ "cookiecutter>=1.7.2", "docker>=4.2.1", "google-cloud-storage>=1.19.0", - "mlflow>=1.2.0,<=1.23.0", # for py3.11 due to proto -> "mlflow>=1.26.1", - "protobuf>=3.0.0,<4.0.0", # for py3.11 due to proto -> "protobuf>=4.0.0,<5.0dev", + "protobuf>=3.0.0,<5.0.0", + "mlflow>=1.26.1,<2.0.0", "PyPrind>=2.11.2", "python_dateutil>=2.5.3", "PyYAML>=5.4", @@ -53,7 +53,7 @@ "pytest", "recursive-diff>=1.0.0", "requests", - "scikit-learn==1.0.2", #TODO: >=1.1.2 upon python 3.7 deprecation + "scikit-learn>=1.1.2", "types-python-dateutil", "types-PyYAML", "types-six", diff --git a/python/sdk/test/batch/model/env.yaml b/python/sdk/test/batch/model/env.yaml index 659bb6b71..31c061ad4 100644 --- a/python/sdk/test/batch/model/env.yaml +++ b/python/sdk/test/batch/model/env.yaml @@ -1,7 +1,7 @@ dependencies: - pip: - mlflow - - scikit-learn==1.0.2 #TODO: >=1.1.2 upon python 3.7 deprecation + - scikit-learn>=1.1.2 - joblib>=0.13.0,<1.2.0 # >=1.2.0 upon upgrade of kserve's version - numpy>=1.19.5,<1.23.4 # https://github.com/Azure/MachineLearningNotebooks/issues/1314 - pandas==1.3.5 diff --git a/python/sdk/test/pyfunc/env.yaml b/python/sdk/test/pyfunc/env.yaml index d8ec45541..fe3129f70 100644 --- a/python/sdk/test/pyfunc/env.yaml +++ b/python/sdk/test/pyfunc/env.yaml @@ -3,7 +3,7 @@ dependencies: - pip: - joblib>=0.13.0,<1.2.0 # >=1.2.0 upon upgrade of kserve's version - numpy<=1.23.5 # Temporary pin numpy due to https://numpy.org/doc/stable/release/1.20.0-notes.html#numpy-1-20-0-release-notes - - scikit-learn==1.0.2 #TODO: >=1.1.2 upon python 3.7 deprecation + - scikit-learn>=1.1.2 - xgboost==1.6.2 - pytest - pytest-xdist==1.34.0