Bump the EMR RELEASE build argument from emr-6.6.0 to emr-6.10.0 in both
templates, and install pytest alongside ipykernel in the PySpark image.

NOTE(review): the leading indentation of the JSON context lines and of the
pip continuation lines was reconstructed - confirm against the target files,
or apply with whitespace-insensitive matching, if a hunk fails to match.

diff --git a/templates/devcontainer.json b/templates/devcontainer.json
index d358a09..e881a7c 100644
--- a/templates/devcontainer.json
+++ b/templates/devcontainer.json
@@ -7,7 +7,7 @@
     // Update 'VARIANT' to pick an Debian version: bullseye, buster
     // Use bullseye on local arm64/Apple Silicon.
     "args": {
-      "RELEASE": "emr-6.6.0",
+      "RELEASE": "emr-6.10.0",
       "RELEASE_TAG": "latest",
       "REGION": "us-west-2",
       "EMR_ACCOUNT_ID": "895885662937"
diff --git a/templates/pyspark.dockerfile b/templates/pyspark.dockerfile
index 165d208..062b45b 100644
--- a/templates/pyspark.dockerfile
+++ b/templates/pyspark.dockerfile
@@ -1,6 +1,6 @@
 # See here for image details: https://docs.aws.amazon.com/emr/latest/EMR-on-EKS-DevelopmentGuide/docker-custom-images-steps.html
 # Arguments used to build the image URI - update to your desired region/EMR release version per the link above
-ARG RELEASE="emr-6.6.0"
+ARG RELEASE="emr-6.10.0"
 ARG RELEASE_TAG="latest"
 ARG REGION="us-west-2"
 ARG EMR_ACCOUNT_ID="895885662937"
@@ -42,8 +42,10 @@ RUN if [ "$TARGETARCH" != "amd64" ]; then yum install -y gcc python3-devel; fi
 # Upgrade pip first
 RUN python3 -m pip install -U pip
 
-# Enable Jupyter notebooks
-RUN python3 -m pip install ipykernel
+# Enable Jupyter notebooks and pytest
+RUN python3 -m pip install \
+    ipykernel \
+    pytest
 
 # Switch back to the default user
 USER hadoop:hadoop