snowflakedb
diff --git a/‎.bazelrc
+1-1 b/‎.bazelrc
+1-1
diff --git a/‎BUILD.bazel
+8 b/‎BUILD.bazel
+8
diff --git a/‎CHANGELOG.md
+18 b/‎CHANGELOG.md
+18
diff --git a/‎README.md
+1-3 b/‎README.md
+1-3
diff --git a/‎WORKSPACE
+17-10 b/‎WORKSPACE
+17-10
diff --git a/‎bazel/BUILD.bazel
+6 b/‎bazel/BUILD.bazel
+6
diff --git a/‎bazel/filter_affected_targets.py
+1-1 b/‎bazel/filter_affected_targets.py
+1-1
diff --git a/‎bazel/get_affected_targets.sh
+101 b/‎bazel/get_affected_targets.sh
+101
diff --git a/‎bazel/py_rules.bzl
+10-4 b/‎bazel/py_rules.bzl
+10-4
diff --git a/‎bazel/requirements/parse_and_generate_requirements.py
+2-2 b/‎bazel/requirements/parse_and_generate_requirements.py
+2-2
diff --git a/‎bazel/test_wrapper.sh
+36 b/‎bazel/test_wrapper.sh
+36
@@ -1,6 +1,6 @@
 # Make the target platform and the host platform the same
 build --platforms //bazel/platforms:extended_conda_env --host_platform //bazel/platforms:extended_conda_env
-test --platforms //bazel/platforms:extended_conda_env --host_platform //bazel/platforms:extended_conda_env
+test --platforms //bazel/platforms:extended_conda_env --host_platform //bazel/platforms:extended_conda_env --run_under='//bazel:test_wrapper'
 run --platforms //bazel/platforms:extended_conda_env --host_platform //bazel/platforms:extended_conda_env
 cquery --platforms //bazel/platforms:extended_conda_env --host_platform //bazel/platforms:extended_conda_env
 
 
@@ -1,3 +1,5 @@
+load("@rules_java//java:defs.bzl", "java_binary")
+
 exports_files([
     "CHANGELOG.md",
     "README.md",
@@ -8,3 +10,9 @@ exports_files([
     "requirements.txt",
     "requirements.yml",
 ])
+
+java_binary(
+    name = "bazel-diff",
+    main_class = "com.bazel_diff.Main",
+    runtime_deps = ["@bazel_diff//jar"],
+)
@@ -1,5 +1,23 @@
 # Release History
 
+## 1.0.3 (2023-07-12)
+
+### Behavior Changes
+- Model Registry: When predicting with a model whose output is a list of NumPy ndarrays, the output is no longer flattened; instead, each ndarray acts as a feature (column) in the output.
+
+### New Features
+- Model Registry: Added support for saving, loading, and deploying PyTorch models (`torch.nn.Module` and `torch.jit.ScriptModule`).
+
+### Bug Fixes
+
+- Model Registry: Fix an issue where the model registry could not be created when the database or schema name provided to `create_model_registry` contains special characters.
+- Model Registry: Fix an issue where `get_model_description` returns the description with additional quotes.
+- Model Registry: Fix an incorrect error message when attempting to remove an unset tag of a model.
+- Model Registry: Fix a typo in the default deployment table name.
+- Model Registry: A Snowpark dataframe used as sample input or as input to the `predict` method that contains a column with the Snowflake `NUMBER(precision, scale)` data type where `scale = 0` no longer leads to an error, and the column is now correctly recognized as the `INT64` data type in the model signature.
+- Model Registry: Fix an issue that prevented a model logged on a system whose default encoding is not UTF-8 compatible from being deployed.
+- Model Registry: Added an earlier and clearer error message when any file name in the model, or the file name of the model itself, contains characters that cannot be encoded using ASCII. Deploying such a model is currently not supported.
+
 ## 1.0.2 (2023-06-22)
 
 ### Behavior Changes
 
@@ -22,9 +22,7 @@ Snowpark MLOps complements the Snowpark ML Development API, and provides model m
 
 During PrPr, we are iterating on the API without backward compatibility guarantees. It is better to recreate your registry every time you update the package. This means that, at this time, you cannot use the registry for production use.
 
-- [Documentation](http://docs.snowflake.com/developer-guide/snowpark/python/snowpark-ml-modeling)
-- [Issues](https://github.com/snowflakedb/snowflake-ml-python/issues)
-- [Source](https://github.com/snowflakedb/snowflake-ml-python/)
+- [Documentation](https://docs.snowflake.com/developer-guide/snowpark-ml)
 
 ## Getting started
 ### Have your Snowflake account ready
 
@@ -1,6 +1,15 @@
 workspace(name = "SnowML")
 
-load("@bazel_tools//tools/build_defs/repo:http.bzl", "http_archive")
+load("@bazel_tools//tools/build_defs/repo:http.bzl", "http_archive", "http_jar")
+load("@bazel_tools//tools/build_defs/repo:git.bzl", "git_repository")
+
+http_jar(
+    name = "bazel_diff",
+    urls = [
+        "https://github.com/Tinder/bazel-diff/releases/download/4.3.0/bazel-diff_deploy.jar",
+    ],
+    sha256 = "9c4546623a8b9444c06370165ea79a897fcb9881573b18fa5c9ee5c8ba0867e2",
+)
 
 http_archive(
     name = "bazel_skylib",
@@ -14,15 +23,13 @@ http_archive(
 load("@bazel_skylib//:workspace.bzl", "bazel_skylib_workspace")
 
 bazel_skylib_workspace()
-# Latest @ 2022-10-18. Version 0.13.0 released 2022-09-25
-http_archive(
-    name = "rules_python",
-    sha256 = "8c8fe44ef0a9afc256d1e75ad5f448bb59b81aba149b8958f02f7b3a98f5d9b4",
-    strip_prefix = "rules_python-0.13.0",
-    url = "https://github.com/bazelbuild/rules_python/archive/refs/tags/0.13.0.tar.gz",
-    # This will be unnecessary once https://github.com/bazelbuild/rules_python/pull/1274
-    # is released.
-    patches = ["//third_party:rules_python_description_content_type.patch"],
+
+# Latest @ 2023-06-20
+# Replace with released version once newer version released.
+git_repository(
+    name = "rules_python",
+    commit = "0d59fcf561f6d2c4705924bc17c151fb4b998841",
+    remote = "https://github.com/bazelbuild/rules_python.git",
 )
 
 load("//third_party/rules_conda:defs.bzl", "conda_create", "load_conda", "register_toolchain")
 
@@ -1,4 +1,5 @@
 load("@rules_python//python:defs.bzl", native_py_test = "py_test")
+package(default_visibility = ["//visibility:public"])
 
 native_py_test(
     name = "repo_paths_test",
@@ -7,3 +8,8 @@ native_py_test(
     python_version = "PY3",
     srcs_version = "PY3",
 )
+
+sh_binary(
+    name = "test_wrapper",
+    srcs = ["test_wrapper.sh"],
+)
@@ -21,7 +21,7 @@
 
 
 def main(input_file: str, test_target_only: bool) -> None:
-    with open(input_file) as f:
+    with open(input_file, encoding="utf-8") as f:
         raw_targets = f.read()
     pattern = _AFFECTED_TESTS_QUERY_PATTERN if test_target_only else _AFFECTED_TARGETS_QUERY_PATTERN
     print(pattern.format(raw_targets=raw_targets))
 
@@ -0,0 +1,101 @@
+#!/bin/bash
+
+# Usage
+# get_affected_targets.sh [-b <bazel_path>] [-f <output_path>] [-r <revision>] [-w <workspace path>]
+#
+# Flags
+# -b: specify path to bazel
+# -f: specify output file path
+# -r: specify the revision to use, default the current
+# -w: specify the workspace_path, default $(cwd)
+#
+# Notes:
+#   This script relies on bazel-diff, which is installed in WORKSPACE via L6-12 of WORKSPACE file.
+#
+# Action
+#   - Get affected targets list in our repo to the output_path file
+
+set -o pipefail
+set -u
+PROG=$0
+
+help() {
+    local exit_code=$1
+    echo "Usage: ${PROG} [-b <bazel_path>] [-f <output_path>] [-r <revision>] [-w <workspace>]"
+    exit "${exit_code}"
+}
+
+echo "Running ${PROG}"
+
+bazel="bazel"
+current_revision=$(git rev-parse HEAD)
+pr_revision=${current_revision}
+output_path="/tmp/affected_targets/targets"
+workspace_path=$(pwd)
+
+
+
+while getopts "b:f:r:w:h" opt; do
+    case "${opt}" in
+    b)
+        bazel=${OPTARG}
+        ;;
+    f)
+        output_path=${OPTARG}
+        ;;
+    r)
+        pr_revision=${OPTARG}
+        ;;
+    w)
+        workspace_path=${OPTARG}
+        ;;
+    h)
+        help 0
+        ;;
+    :)
+        help 1
+        ;;
+    ?)
+        help 1
+        ;;
+    esac
+done
+
+working_dir=$(mktemp -d "/tmp/tmp_XXXXX")
+trap 'rm -rf "${working_dir}"' EXIT
+
+starting_hashes_json="${working_dir}/starting_hashes.json"
+final_hashes_json="${working_dir}/final_hashes.json"
+impacted_targets_path="${working_dir}/impacted_targets.txt"
+bazel_diff="${working_dir}/bazel_diff"
+
+"${bazel}" run :bazel-diff --script_path="${bazel_diff}"
+
+git -C "${workspace_path}" checkout "${pr_revision}" --quiet
+
+echo "Generating Hashes for Revision '${pr_revision}'"
+
+"${bazel_diff}" generate-hashes -w "$workspace_path" -b "${bazel}" "${starting_hashes_json}"
+
+MERGE_BASE_MAIN=$(git merge-base "${pr_revision}" main)
+git -C "${workspace_path}" checkout "${MERGE_BASE_MAIN}" --quiet
+
+echo "Generating Hashes for merge base ${MERGE_BASE_MAIN}"
+
+$bazel_diff generate-hashes -w "${workspace_path}" -b "${bazel}" "${final_hashes_json}"
+
+echo "Determining Impacted Targets and output to ${output_path}"
+$bazel_diff get-impacted-targets -sh "${starting_hashes_json}" -fh "${final_hashes_json}" -o "${impacted_targets_path}"
+
+filter_query_rules_file="${working_dir}/filter_query_rules"
+
+# -- Begin of Query Rules Heredoc --
+cat > "${filter_query_rules_file}" << EndOfMessage
+let raw_targets = set($(<"${impacted_targets_path}")) in
+    \$raw_targets - kind('source file', \$raw_targets) - filter('//external[:/].*', \$raw_targets)
+EndOfMessage
+# -- End of Query Rules Heredoc --
+
+"${bazel}" query --query_file="${filter_query_rules_file}" >"${output_path}"
+
+git -C "${workspace_path}" checkout "${current_revision}" --quiet
@@ -144,9 +144,7 @@ def snowml_wheel(
         deps,
         description_file = None,
         development_status = "Alpha",
-        compatible_with_snowpark = True,
-        homepage = None,
-        summary = None):
+        compatible_with_snowpark = True):
     """A SnowML customized wheel definition with lots of default values filled in.
 
     Args:
@@ -156,6 +154,7 @@ def snowml_wheel(
       version: Version string
       deps: List of dependencies of type py_package
       development_status: String with PrPr, PuPr & GA
+      description_file: Label of readme file.
       compatible_with_snowpark: adds a tag to the wheel to indicate that this
         wheel is compatible with the snowpark running environment.
     """
@@ -164,6 +163,7 @@ def snowml_wheel(
         dev_status = "Development Status :: 3 - Alpha"
     elif development_status.lower() == "pupr":
         dev_status = "Development Status :: 3 - Beta"
+    homepage = "https://github.com/snowflakedb/snowflake-ml-python"
     py_wheel(
         name = name,
         author = "Snowflake, Inc",
@@ -194,11 +194,17 @@ def snowml_wheel(
         distribution = "snowflake-ml-python",
         extra_requires = extra_requires,
         homepage = homepage,
+        project_urls = {
+            "Changelog": homepage + "/blob/main/CHANGELOG.md",
+            "Documentation": "https://docs.snowflake.com/developer-guide/snowpark-ml",
+            "Issues": homepage + "/issues",
+            "Source": homepage,
+        },
         license = "Apache License, Version 2.0",
         python_requires = ">=3.8,<4",
         python_tag = "py3",
         requires = requires,
-        summary = summary,
+        summary = "The machine learning client library that is used for interacting with Snowflake to build machine learning solutions.",
         version = version,
         deps = deps,
     )
@@ -267,9 +267,9 @@ def generate_requirements(
     tag_filter: Optional[str] = None,
     version: Optional[str] = None,
 ) -> None:
-    with open(schema_file_path) as f:
+    with open(schema_file_path, encoding="utf-8") as f:
         schema = json.load(f)
-    with open(req_file_path) as f:
+    with open(req_file_path, encoding="utf-8") as f:
         requirements = yaml.safe_load(f)
 
     jsonschema.validate(requirements, schema=schema)
 
@@ -0,0 +1,36 @@
+#!/usr/bin/env bash
+
+# Bazel test wrapper: fails fast when a Python test has no `__main__` block, otherwise runs the wrapped command.
+
+# Get the bazel arg, which is a bazel generated python entrance file.
+# Example: snowflake/ml/model/_model_test
+# Part of its content (auto-generated) where the main_rel_path gets picked.
+#
+#  # The main Python source file.
+#  # The magic string percent-main-percent is replaced with the runfiles-relative
+#  # filename of the main file of the Python binary in BazelPythonSemantics.java.
+#  main_rel_path = 'SnowML/snowflake/ml/model/_model_test.py'
+#
+
+ENTRY_FILE="$1"
+
+# Follow how bazel generated entry file works
+RUNFILES_DIR=$(dirname "$(pwd)")
+# Get the actual main file by searching in bazel generated file.
+MAIN_REL_PATH=$(grep -o "  main_rel_path = '[^']*" "${ENTRY_FILE}" | sed "s/  main_rel_path = '//g")
+
+# If not a python test then this is empty
+if [[ -n "${MAIN_REL_PATH}" ]]; then
+  # Pattern for the main block (either quote style, optional spaces around ==, optional trailing comment)
+  TEST_STR="if[[:space:]]+__name__[[:space:]]*==[[:space:]]*['\"]__main__['\"][[:space:]]*:[[:space:]]*(#.*)?"
+
+  # Check if main block exist
+  if ! grep -q -x -E "${TEST_STR}" "${RUNFILES_DIR}/${MAIN_REL_PATH}" ; then
+    echo "Missing \`if __name__ == \"__main__\":\` block in test entry file ${ENTRY_FILE}, your tests won't be run." >&2
+    # Follow pytest which uses exit code 5 to label no tests can be found and run.
+    exit 5
+  fi
+fi
+
+# Execute the actual target in place of this shell, keeping every argument intact
+exec "$@"