From c01b537fe7061e8ecb3fe8d5534baa30c2263a6f Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Wed, 10 Apr 2024 11:24:40 -0400 Subject: [PATCH 01/38] Move systemd service configurations into functions --- pkg/deploy/generator/scripts/rpVMSS.sh | 693 ++++++++++++++++--------- 1 file changed, 447 insertions(+), 246 deletions(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 290b534c1c9..eb567b06443 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -1,46 +1,125 @@ #!/bin/bash -echo "setting ssh password authentication" -# We need to manually set PasswordAuthentication to true in order for the VMSS Access JIT to work -sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config -systemctl reload sshd.service - -#Adding retry logic to yum commands in order to avoid stalling out on resource locks -echo "running RHUI fix" -for attempt in {1..5}; do - yum update -y --disablerepo='*' --enablerepo='rhui-microsoft-azure*' && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +set -o errexit \ + -o nounset \ + +# trap 'catch' ERR + +main() { + configure_sshd + configure_rhui_repo + dnf_update_pkgs + configure_disk_partitions + configure_logrotate + create_azure_rpm_repos + configure_selinux + mkdir -p /var/log/journal + mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store + configure_firewalld_rules + pull_container_images +} -echo "running yum update" -for attempt in {1..5}; do - yum -y -x WALinuxAgent -x WALinuxAgent-udev update --allowerasing && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work +configure_sshd() { + log "setting ssh password authentication" + sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config -echo "extending partition table" -# Linux block devices are inconsistently named -# it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here -physicalDisk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" -growpart "$physicalDisk" 2 + systemctl reload sshd.service + systemctl is-active --quiet sshd || abort "sshd failed to reload" +} -echo "extending filesystems" -lvextend -l +20%FREE /dev/rootvg/rootlv -xfs_growfs / +configure_rhui_repo() { + log "running RHUI package updates" + #Adding retry logic to yum commands in order to avoid stalling out on resource locks + for attempt in {1..5}; do + dnf update \ + -y \ + --disablerepo='*' \ + --enablerepo='rhui-microsoft-azure*' \ + && break + if [[ ${attempt} -lt 5 ]]; then + sleep 10 + else + abort "failed to run dnf update" + fi + done +} -lvextend -l +100%FREE /dev/rootvg/varlv -xfs_growfs /var +dnf_update_pkgs() { + log "running dnf update" + for attempt in {1..5}; do + dnf -y \ + -x WALinuxAgent \ + -x WALinuxAgent-udev \ + update --allowerasing \ + && break + if [[ ${attempt} -lt 5 ]]; then + sleep 10 + else + return 1 + fi + done +} -echo "importing rpm repositories" -rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 -rpm --import https://packages.microsoft.com/keys/microsoft.asc +dnf_install_pkgs() { + log "importing rpm repositories" + rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 + rpm --import https://packages.microsoft.com/keys/microsoft.asc + + for attempt in {1..5}; do + yum -y install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm && break + if [[ ${attempt} -lt 5 ]]; then + sleep 10 + else + return 1 + fi + done + + for attempt in {1..5}; do + yum -y \ + install \ + clamav \ + azsec-clamav \ + azsec-monitor \ + azure-cli \ + azure-mdsd \ + azure-security \ + podman \ + podman-docker \ + openssl-perl \ + python3 \ + && break + # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 + if [[ ${attempt} -lt 5 ]]; then + sleep 10 + else + abort "failed to install required packages" + fi + done +} -for attempt in {1..5}; do - yum -y install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +configure_disk_partitions() { + log "extending partition table" + # Linux block devices are inconsistently named + # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here + physicalDisk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" + growpart "$physicalDisk" 2 + + log "extending filesystems" + log "extending root lvm" + lvextend -l +20%FREE /dev/rootvg/rootlv + log "growing root filesystem" + xfs_growfs / + + log "extending var lvm" + lvextend -l +100%FREE /dev/rootvg/varlv + log "growing var filesystem" + xfs_growfs /var +} -echo "configuring logrotate" +# configure_logrotate clobbers /etc/logrotate.conf +configure_logrotate() { + log "configuring logrotate" cat >/etc/logrotate.conf <<'EOF' # see "man logrotate" for details # rotate log files weekly @@ -76,8 +155,11 @@ include /etc/logrotate.d rotate 1 } EOF +} -echo "configuring yum repository and running yum update" +# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file +create_azure_rpm_repos() { + log "configuring yum repository and running yum update" cat >/etc/yum.repos.d/azure.repo <<'EOF' [azure-cli] name=azure-cli @@ -91,18 +173,16 @@ baseurl=https://packages.microsoft.com/yumrepos/azurecore enabled=yes gpgcheck=no EOF +} -semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" -mkdir -p /var/log/journal - -for attempt in {1..5}; do -yum -y install clamav azsec-clamav azsec-monitor azure-cli azure-mdsd azure-security podman podman-docker openssl-perl python3 && break - # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +configure_selinux() { + semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" + chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent +} -# https://access.redhat.com/security/cve/cve-2020-13401 -echo "applying firewall rules" +configure_firewalld_rules() { + # https://access.redhat.com/security/cve/cve-2020-13401 + log "applying firewall rules" cat >/etc/sysctl.d/02-disable-accept-ra.conf <<'EOF' net.ipv6.conf.all.accept_ra=0 EOF @@ -110,35 +190,95 @@ EOF cat >/etc/sysctl.d/01-disable-core.conf <<'EOF' kernel.core_pattern = |/bin/true EOF -sysctl --system + sysctl --system + + log "adding firewalld ports to default zone" + firewall-cmd \ + --add-port=443/tcp \ + --permanent + firewall-cmd \ + --add-port=444/tcp \ + --permanent + firewall-cmd \ + --add-port=445/tcp \ + --permanent + firewall-cmd \ + --add-port=2222/tcp \ + --permanent + + log "reloading firewalld" + firewall-cmd reload +} -firewall-cmd --add-port=443/tcp --permanent -firewall-cmd --add-port=444/tcp --permanent -firewall-cmd --add-port=445/tcp --permanent -firewall-cmd --add-port=2222/tcp --permanent +export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}" -export AZURE_CLOUD_NAME=$AZURECLOUDNAME +pull_container_images() { + echo "logging into prod acr" + az login -i --allow-no-subscriptions -echo "logging into prod acr" -az login -i --allow-no-subscriptions + # Suppress emulation output for podman instead of docker for az acr compatability + mkdir -p /etc/containers/ + touch /etc/containers/nodocker -# Suppress emulation output for podman instead of docker for az acr compatability -mkdir -p /etc/containers/ -touch /etc/containers/nodocker + mkdir -p /root/.docker + REGISTRY_AUTH_FILE=/root/.docker/config.json az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" -mkdir -p /root/.docker -REGISTRY_AUTH_FILE=/root/.docker/config.json az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" + MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" + docker pull "$MDMIMAGE" + docker pull "$RPIMAGE" + docker pull "$FLUENTBITIMAGE" -MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" -docker pull "$MDMIMAGE" -docker pull "$RPIMAGE" -docker pull "$FLUENTBITIMAGE" + az logout +} -az logout +# configure_system_services creates, configures, and enables the following systemd services and timers +# services +# fluentbit +# mdm +# mdsd +# arp-rp +# aro-dbtoken +# aro-monitor +# aro-portal +configure_system_services() { + configure_service_fluentbit + configure_service_mdm + configure_timers_mdm_mdsd + configure_service_aro_rp + configure_service_aro_dbtoken + configure_service_aro_monitor + configure_service_aro_portal + configure_service_mdsd +} + +# enable_aro_services enables all services required for aro rp +enable_aro_services() { + local -a aro_services=( + "aro-dbtoken" + "aro-monitor" + "aro-portal" + "aro-rp" + "auoms" + "azsecd" + "azsecmond" + "mdsd" + "mdm" + "chronyd" + "fluentbit" + ) + log "enabling aro services ${aro_services[*]}" + # shellcheck disable=SC2068 + for service in ${aro_services[@]}; do + log "Enabling $service now" + systemctl enable "$service.service" + done +} -echo "configuring fluentbit service" -mkdir -p /etc/fluentbit/ -mkdir -p /var/lib/fluent +# configure_service_fluentbit +configure_service_fluentbit() { + log "configuring fluentbit service" + mkdir -p /etc/fluentbit/ + mkdir -p /var/lib/fluent cat >/etc/fluentbit/fluentbit.conf <<'EOF' [INPUT] @@ -176,7 +316,7 @@ cat >/etc/fluentbit/fluentbit.conf <<'EOF' Port 29230 EOF -echo "FLUENTBITIMAGE=$FLUENTBITIMAGE" >/etc/sysconfig/fluentbit + log "FLUENTBITIMAGE=$FLUENTBITIMAGE" >/etc/sysconfig/fluentbit cat >/etc/systemd/system/fluentbit.service <<'EOF' [Unit] @@ -211,15 +351,42 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target EOF +} -mkdir /etc/aro-rp -base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem -if [[ -n "$ARMAPICABUNDLE" ]]; then - base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem -fi -chown -R 1000:1000 /etc/aro-rp +# configure_certs +configure_certs() { + mkdir /etc/aro-rp + base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem + if [[ -n "$ARMAPICABUNDLE" ]]; then + base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem + fi + chown -R 1000:1000 /etc/aro-rp + + # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not + # to honour SSL_CERT_FILE any more, heaven only knows why. + mkdir -p /usr/lib/ssl/certs + csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 {*} >/dev/null + c_rehash /usr/lib/ssl/certs + +# we leave clientId blank as long as only 1 managed identity assigned to vmss +# if we have more than 1, we will need to populate with clientId used for off-node scanning +cat >/etc/default/vsa-nodescan-agent.config </etc/sysconfig/mdm </etc/systemd/system/mdm.service <<'EOF' [Unit] After=network-online.target @@ -263,9 +430,142 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target EOF +} + +# configure_timers_mdm_mdsd +configure_timers_mdm_mdsd() { + for var in "mdsd" "mdm"; do +cat >/etc/systemd/system/download-$var-credentials.service </etc/systemd/system/download-$var-credentials.timer </usr/local/bin/download-credentials.sh </etc/sysconfig/aro-rp </etc/systemd/system/watch-mdm-credentials.service </etc/systemd/system/watch-mdm-credentials.path <"$arp_rp_config_file"</etc/systemd/system/aro-rp.service <<'EOF' + local aro_rp_service_file="/etc/systemd/system/aro-rp.service" + log "Writing $aro_rp_service_file" +cat >"$aro_rp_service_file" <<'EOF' [Unit] After=network-online.target Wants=network-online.target @@ -347,9 +649,13 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target EOF +} -echo "configuring aro-dbtoken service" -cat >/etc/sysconfig/aro-dbtoken <"$aro_dbtoken_service_file" </etc/systemd/system/aro-dbtoken.service <<'EOF' + local aro_dbtoken_service_file="/etc/systemd/system/aro-dbtoken.service" + log "Writing $aro_dbtoken_service_file" +cat >"$aro_dbtoken_service_config_file" <<'EOF' [Unit] After=network-online.target Wants=network-online.target @@ -393,11 +701,15 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target EOF +} +# configure_service_aro_monitor +configure_service_aro_monitor() { + local aro_monitor_service_config="/etc/sysconfig/aro-monitor" + log "configuring aro-monitor service" # DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE # are not used, but can't easily be refactored out. Should be revisited in the future. -echo "configuring aro-monitor service" -cat >/etc/sysconfig/aro-monitor <"$aro_monitor_service_config" </etc/systemd/system/aro-monitor.service <<'EOF' + local aro_monitor_service_file="/etc/systemd/system/aro-monitor.service" + log "Writing $aro_monitor_service_file" +cat >"$aro_monitor_service_file" <<'EOF' [Unit] After=network-online.target Wants=network-online.target @@ -454,9 +768,13 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target EOF +} -echo "configuring aro-portal service" -cat >/etc/sysconfig/aro-portal <"$aro_portal_service_config" </etc/systemd/system/aro-portal.service <<'EOF' + local aro_portal_service_file="/etc/systemd/system/aro-portal.service" + log "Writing $aro_portal_service_config" +cat >"$aro_portal_service_file" <<'EOF' [Unit] After=network-online.target Wants=network-online.target @@ -503,138 +823,16 @@ RestartSec=1 [Install] WantedBy=multi-user.target EOF - -echo "configuring mdsd and mdm services" -chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent - -mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store - -for var in "mdsd" "mdm"; do -cat >/etc/systemd/system/download-$var-credentials.service </etc/systemd/system/download-$var-credentials.timer </usr/local/bin/download-credentials.sh </etc/systemd/system/watch-mdm-credentials.service </etc/systemd/system/watch-mdm-credentials.path </etc/systemd/system/mdsd.service.d/override.conf <<'EOF' +# configure_service_mdsd +configure_service_mdsd() { + local mdsd_service_dir="/etc/systemd/system/mdsd.service.d" + log "Creating $mdsd_service_dir" + mkdir "$mdsd_service_dir" + local mdsd_override_conf="$mdsd_service_dir/override.conf" + log "Writing $mdsd_override_conf" +cat >"$mdsd_override_conf" <<'EOF' [Unit] After=network-online.target EOF @@ -658,36 +856,39 @@ export MONITORING_ROLE_INSTANCE='$(hostname)' export MDSD_MSGPACK_SORT_COLUMNS=1 EOF +} -# setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not -# to honour SSL_CERT_FILE any more, heaven only knows why. -mkdir -p /usr/lib/ssl/certs -csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 {*} >/dev/null -c_rehash /usr/lib/ssl/certs - -# we leave clientId blank as long as only 1 managed identity assigned to vmss -# if we have more than 1, we will need to populate with clientId used for off-node scanning -cat >/etc/default/vsa-nodescan-agent.config < Date: Wed, 10 Apr 2024 11:51:10 -0400 Subject: [PATCH 02/38] Move dnf package and repo operations into function, move all service configuration into a function --- pkg/deploy/generator/scripts/rpVMSS.sh | 130 +++++++++++++++++-------- 1 file changed, 91 insertions(+), 39 deletions(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index eb567b06443..c3eea7e0827 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -7,16 +7,15 @@ set -o errexit \ main() { configure_sshd - configure_rhui_repo - dnf_update_pkgs + configure_and_install_dnf_pkgs_repos configure_disk_partitions configure_logrotate - create_azure_rpm_repos configure_selinux mkdir -p /var/log/journal mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store configure_firewalld_rules pull_container_images + configure_system_services } # We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work @@ -28,6 +27,15 @@ configure_sshd() { systemctl is-active --quiet sshd || abort "sshd failed to reload" } +# configure_and_install_dnf_pkgs_repos +configure_and_install_dnf_pkgs_repos() { + configure_rhui_repo + dnf_update_pkgs + dnf_install_pkgs + create_azure_rpm_repos +} + +# configure_rhui_repo configure_rhui_repo() { log "running RHUI package updates" #Adding retry logic to yum commands in order to avoid stalling out on resource locks @@ -45,6 +53,7 @@ configure_rhui_repo() { done } +# dnf_update_pkgs dnf_update_pkgs() { log "running dnf update" for attempt in {1..5}; do @@ -61,13 +70,16 @@ dnf_update_pkgs() { done } +# dnf_install_pkgs dnf_install_pkgs() { log "importing rpm repositories" rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 rpm --import https://packages.microsoft.com/keys/microsoft.asc for attempt in {1..5}; do - yum -y install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm && break + dnf -y \ + install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm \ + && break if [[ ${attempt} -lt 5 ]]; then sleep 10 else @@ -76,7 +88,7 @@ dnf_install_pkgs() { done for attempt in {1..5}; do - yum -y \ + dnf -y \ install \ clamav \ azsec-clamav \ @@ -98,6 +110,7 @@ dnf_install_pkgs() { done } +# configure_disk_partitions configure_disk_partitions() { log "extending partition table" # Linux block devices are inconsistently named @@ -119,8 +132,9 @@ configure_disk_partitions() { # configure_logrotate clobbers /etc/logrotate.conf configure_logrotate() { - log "configuring logrotate" -cat >/etc/logrotate.conf <<'EOF' + local logrotate_conf_file="/etc/logrotate.conf" + log "Writing over $logrotate_conf_file" +cat >"$logrotate_conf_file" <<'EOF' # see "man logrotate" for details # rotate log files weekly weekly @@ -159,8 +173,9 @@ EOF # create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file create_azure_rpm_repos() { - log "configuring yum repository and running yum update" -cat >/etc/yum.repos.d/azure.repo <<'EOF' + local azure_repo_file="/etc/yum.repos.d/azure.repo" + log "Writing $azure_repo_file" +cat >"$azure_repo_file" <<'EOF' [azure-cli] name=azure-cli baseurl=https://packages.microsoft.com/yumrepos/azure-cli @@ -175,43 +190,54 @@ gpgcheck=no EOF } +# configure_selinux configure_selinux() { + local relabel="${1:-false}" semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent + + if relabel; then + restorecon -RF /var/log/* + fi } +# configure_firewalld_rules configure_firewalld_rules() { # https://access.redhat.com/security/cve/cve-2020-13401 - log "applying firewall rules" -cat >/etc/sysctl.d/02-disable-accept-ra.conf <<'EOF' + local prefix="/etc/sysctl.d" + local diable_accept_ra_conf="$prefix/02-disable-accept-ra.conf" + log "Writing $diable_accept_ra_conf" +cat >"$diable_accept_ra_conf" <<'EOF' net.ipv6.conf.all.accept_ra=0 EOF -cat >/etc/sysctl.d/01-disable-core.conf <<'EOF' + local disable_core="$prefix/01-disable-core.conf" + log "Writing $disable_core" +cat >"$disable_core" <<'EOF' kernel.core_pattern = |/bin/true EOF sysctl --system - log "adding firewalld ports to default zone" - firewall-cmd \ - --add-port=443/tcp \ - --permanent - firewall-cmd \ - --add-port=444/tcp \ - --permanent - firewall-cmd \ - --add-port=445/tcp \ - --permanent - firewall-cmd \ - --add-port=2222/tcp \ - --permanent + enable_ports=( + "443/tcp" + "444/tcp" + "445/tcp" + "2222/tcp" + ) + log "Enabling ports ${enable_ports[*]} on default firewalld zone" + # shellcheck disable=SC2068 + for port in ${enable_ports[@]}; do + log "Enabling port $port now" + firewall-cmd "--add-port=$port" + done log "reloading firewalld" firewall-cmd reload -} -export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}" + firewall-cmd --runtime-to-permanent +} +# pull_container_images pull_container_images() { echo "logging into prod acr" az login -i --allow-no-subscriptions @@ -316,9 +342,13 @@ cat >/etc/fluentbit/fluentbit.conf <<'EOF' Port 29230 EOF - log "FLUENTBITIMAGE=$FLUENTBITIMAGE" >/etc/sysconfig/fluentbit + local sysconfig_fluentbit="/etc/sysconfig/fluentbit" + log "Writing value FLUENTBITIMAGE=$FLUENTBITIMAGE to $sysconfig_fluentbit" + echo "FLUENTBITIMAGE=$FLUENTBITIMAGE" >"$sysconfig_fluentbit" -cat >/etc/systemd/system/fluentbit.service <<'EOF' + fluentbit_service_file="/etc/systemd/system/fluentbit.service" + log "Writing $fluentbit_service_file now" +cat >"$fluentbit_service_file" <<'EOF' [Unit] After=network-online.target Wants=network-online.target @@ -370,7 +400,9 @@ configure_certs() { # we leave clientId blank as long as only 1 managed identity assigned to vmss # if we have more than 1, we will need to populate with clientId used for off-node scanning -cat >/etc/default/vsa-nodescan-agent.config <"$nodescan_agent_file" </etc/sysconfig/mdm <"$sysconfig_mdm_file" </etc/systemd/system/mdm.service <<'EOF' + mdm_service_file="/etc/systemd/system/mdm.service" + log "Writing $mdm_service_file" +cat >"$mdm_service_file"<<'EOF' [Unit] After=network-online.target Wants=network-online.target @@ -435,7 +471,9 @@ EOF # configure_timers_mdm_mdsd configure_timers_mdm_mdsd() { for var in "mdsd" "mdm"; do -cat >/etc/systemd/system/download-$var-credentials.service <"$download_creds_service_file" </etc/systemd/system/download-$var-credentials.timer <"$download_creds_timer_file"</usr/local/bin/download-credentials.sh <"$download_creds_script_file" </etc/systemd/system/watch-mdm-credentials.service <"$watch_mdm_creds_service_file" </etc/systemd/system/watch-mdm-credentials.path <"$watch_mdm_creds_path_file" <"$mdsd_override_conf" <<'EOF' After=network-online.target EOF -cat >/etc/default/mdsd <"$default_mdsd_file" < Date: Wed, 10 Apr 2024 13:23:20 -0400 Subject: [PATCH 03/38] Move repository configuration higher in sequence of events, make unchanging variables readonly --- pkg/deploy/generator/scripts/rpVMSS.sh | 70 +++++++++++++------------- 1 file changed, 36 insertions(+), 34 deletions(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index c3eea7e0827..0677589931f 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -3,7 +3,7 @@ set -o errexit \ -o nounset \ -# trap 'catch' ERR +trap 'catch' ERR main() { configure_sshd @@ -11,11 +11,13 @@ main() { configure_disk_partitions configure_logrotate configure_selinux - mkdir -p /var/log/journal + journal_dir="/var/log/journal" + mkdir -p "$journal_dir" mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store configure_firewalld_rules pull_container_images configure_system_services + reboot_vm } # We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work @@ -30,9 +32,9 @@ configure_sshd() { # configure_and_install_dnf_pkgs_repos configure_and_install_dnf_pkgs_repos() { configure_rhui_repo + create_azure_rpm_repos dnf_update_pkgs dnf_install_pkgs - create_azure_rpm_repos } # configure_rhui_repo @@ -192,26 +194,28 @@ EOF # configure_selinux configure_selinux() { - local relabel="${1:-false}" - semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" + local -r relabel="${1:-false}" + + already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined" + semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error" chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent - if relabel; then - restorecon -RF /var/log/* + if "$relabel"; then + restorecon -RF /var/log/* || log "$already_defined_ignore_error" fi } # configure_firewalld_rules configure_firewalld_rules() { # https://access.redhat.com/security/cve/cve-2020-13401 - local prefix="/etc/sysctl.d" - local diable_accept_ra_conf="$prefix/02-disable-accept-ra.conf" + local -r prefix="/etc/sysctl.d" + local -r diable_accept_ra_conf="$prefix/02-disable-accept-ra.conf" log "Writing $diable_accept_ra_conf" cat >"$diable_accept_ra_conf" <<'EOF' net.ipv6.conf.all.accept_ra=0 EOF - local disable_core="$prefix/01-disable-core.conf" + local -r disable_core="$prefix/01-disable-core.conf" log "Writing $disable_core" cat >"$disable_core" <<'EOF' kernel.core_pattern = |/bin/true @@ -230,9 +234,6 @@ EOF log "Enabling port $port now" firewall-cmd "--add-port=$port" done - - log "reloading firewalld" - firewall-cmd reload firewall-cmd --runtime-to-permanent } @@ -279,7 +280,7 @@ configure_system_services() { # enable_aro_services enables all services required for aro rp enable_aro_services() { - local -a aro_services=( + local -ra aro_services=( "aro-dbtoken" "aro-monitor" "aro-portal" @@ -342,7 +343,7 @@ cat >/etc/fluentbit/fluentbit.conf <<'EOF' Port 29230 EOF - local sysconfig_fluentbit="/etc/sysconfig/fluentbit" + local -r sysconfig_fluentbit="/etc/sysconfig/fluentbit" log "Writing value FLUENTBITIMAGE=$FLUENTBITIMAGE to $sysconfig_fluentbit" echo "FLUENTBITIMAGE=$FLUENTBITIMAGE" >"$sysconfig_fluentbit" @@ -429,7 +430,7 @@ MDMSOURCEROLE=rp MDMSOURCEROLEINSTANCE='$(hostname)' EOF - mkdir /var/etw + mkdir -p /var/etw mdm_service_file="/etc/systemd/system/mdm.service" log "Writing $mdm_service_file" cat >"$mdm_service_file"<<'EOF' @@ -482,7 +483,7 @@ Type=oneshot ExecStart=/usr/local/bin/download-credentials.sh $var EOF - download_creds_timer_file="/etc/systemd/system/download-$var-credentials.timer" + local -r download_creds_timer_file="/etc/systemd/system/download-$var-credentials.timer" log "Writing $download_creds_timer_file" cat >"$download_creds_timer_file"<"$download_creds_script_file" <"$watch_mdm_creds_service_file" <"$arp_rp_config_file"<"$aro_rp_service_file" <<'EOF' [Unit] @@ -699,7 +700,7 @@ EOF # configure_service_aro_dbtoken configure_service_aro_dbtoken() { - local aro_dbtoken_service_config_file="/etc/sysconfig/aro-dbtoken" + local -r aro_dbtoken_service_config_file="/etc/sysconfig/aro-dbtoken" log "Writing $aro_dbtoken_service_file" cat >"$aro_dbtoken_service_file" <"$aro_dbtoken_service_config_file" <<'EOF' [Unit] @@ -751,7 +752,7 @@ EOF # configure_service_aro_monitor configure_service_aro_monitor() { - local aro_monitor_service_config="/etc/sysconfig/aro-monitor" + local -r aro_monitor_service_config="/etc/sysconfig/aro-monitor" log "configuring aro-monitor service" # DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE # are not used, but can't easily be refactored out. Should be revisited in the future. @@ -773,7 +774,7 @@ MDM_NAMESPACE=BBM RPIMAGE='$RPIMAGE' EOF - local aro_monitor_service_file="/etc/systemd/system/aro-monitor.service" + local -r aro_monitor_service_file="/etc/systemd/system/aro-monitor.service" log "Writing $aro_monitor_service_file" cat >"$aro_monitor_service_file" <<'EOF' [Unit] @@ -818,7 +819,7 @@ EOF # configure_service_aro_portal configure_service_aro_portal() { - local aro_portal_service_config="/etc/sysconfig/aro-portal" + local -r aro_portal_service_config="/etc/sysconfig/aro-portal" log "Writing $aro_portal_service_config" cat >"$aro_portal_service_config" <"$aro_portal_service_file" <<'EOF' [Unit] @@ -873,10 +874,10 @@ EOF # configure_service_mdsd configure_service_mdsd() { - local mdsd_service_dir="/etc/systemd/system/mdsd.service.d" + local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d" log "Creating $mdsd_service_dir" mkdir "$mdsd_service_dir" - local mdsd_override_conf="$mdsd_service_dir/override.conf" + local -r mdsd_override_conf="$mdsd_service_dir/override.conf" log "Writing $mdsd_override_conf" cat >"$mdsd_override_conf" <<'EOF' [Unit] @@ -908,7 +909,7 @@ EOF # run_azsecd_config_scan run_azsecd_config_scan() { - local -a configs=( + local -ar configs=( "baseline" "clamav" "software" @@ -930,14 +931,15 @@ reboot_vm() { # log is a wrapper for echo that includes the function name log() { - local msg="${1:-"log message is empty"}" - local stack_level="${2:-1}" + local -r msg="${1:-"log message is empty"}" + local -r stack_level="${2:-1}" echo "${FUNCNAME[${stack_level}]}: ${msg}" } # abort is a wrapper for log that exits with an error code abort() { - log "${1}" "2" + local -ri origin_stacklevel=2 + log "${1}" "$origin_stacklevel" exit 1 } From 91bcccd9847edea6571fe3bee121922e870ac41a Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Wed, 10 Apr 2024 16:28:10 -0400 Subject: [PATCH 04/38] Add write_file function to cleanup creation of new files, appending to existing files --- pkg/deploy/assets/gateway-production.json | 2 +- pkg/deploy/assets/rp-production.json | 2 +- pkg/deploy/generator/scripts/gatewayVMSS.sh | 3 +- pkg/deploy/generator/scripts/rpVMSS.sh | 378 ++++++++++---------- 4 files changed, 198 insertions(+), 187 deletions(-) diff --git a/pkg/deploy/assets/gateway-production.json b/pkg/deploy/assets/gateway-production.json index 1a3296cd889..e539ddfd02a 100644 --- a/pkg/deploy/assets/gateway-production.json +++ b/pkg/deploy/assets/gateway-production.json @@ -309,7 +309,7 @@ "autoUpgradeMinorVersion": true, "settings": {}, "protectedSettings": { - "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','DBTOKENURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenUrl')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','GATEWAYMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayMdsdConfigVersion')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayFeatures')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

echo "setting ssh password authentication"
# We need to manually set PasswordAuthentication to true in order for the VMSS Access JIT to work
sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config
systemctl reload sshd.service

#Adding retry logic to yum commands in order to avoid stalling out on resource locks
echo "running RHUI fix"
for attempt in {1..5}; do
  yum update -y --disablerepo='*' --enablerepo='rhui-microsoft-azure*' && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "running yum update"
for attempt in {1..5}; do
  yum -y -x WALinuxAgent -x WALinuxAgent-udev update --allowerasing && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "extending partition table"
# Linux block devices are inconsistently named
# it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
growpart "$physical_disk" 2

echo "extending filesystems"
lvextend -l +20%FREE /dev/rootvg/rootlv
xfs_growfs /

lvextend -l +100%FREE /dev/rootvg/varlv
xfs_growfs /var

rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
rpm --import https://packages.microsoft.com/keys/microsoft.asc

for attempt in {1..5}; do
  yum -y install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "configuring logrotate"

# gateway_logdir is a readonly variable that specifies the host path mount point for the gateway container log file
# for the purpose of rotating the gateway logs
declare -r gateway_logdir='/var/log/aro-gateway'

cat >/etc/logrotate.conf <<EOF
# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we'll rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}

# Maximum log directory size is 100G with this configuration
# Setting limit to 100G to allow space for other logging services
# copytruncate is a critical option used to prevent logs from being shipped twice
${gateway_logdir} {
    size 20G
    rotate 5
    create 0600 root root
    copytruncate
    noolddir
    compress
}
EOF

echo "configuring yum repository and running yum update"
cat >/etc/yum.repos.d/azure.repo <<'EOF'
[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no
EOF

semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?"
mkdir -p /var/log/journal

for attempt in {1..5}; do
  yum -y install clamav azsec-clamav azsec-monitor azure-cli azure-mdsd azure-security podman-docker openssl-perl python3 && break
  # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "applying firewall rules"
# https://access.redhat.com/security/cve/cve-2020-13401
cat >/etc/sysctl.d/02-disable-accept-ra.conf <<'EOF'
net.ipv6.conf.all.accept_ra=0
EOF

cat >/etc/sysctl.d/01-disable-core.conf <<'EOF'
kernel.core_pattern = |/bin/true
EOF
sysctl --system

firewall-cmd --add-port=80/tcp --permanent
firewall-cmd --add-port=8081/tcp --permanent
firewall-cmd --add-port=443/tcp --permanent

echo "logging into prod acr"
export AZURE_CLOUD_NAME=$AZURECLOUDNAME
az login -i --allow-no-subscriptions

# The managed identity that the VM runs as only has a single roleassignment.
# This role assignment is ACRPull which is not necessarily present in the
# subscription we're deploying into.  If the identity does not have any
# role assignments scoped on the subscription we're deploying into, it will
# not show on az login -i, which is why the below line is commented.
# az account set -s "$SUBSCRIPTIONID"

# Suppress emulation output for podman instead of docker for az acr compatability
mkdir -p /etc/containers/
touch /etc/containers/nodocker

mkdir -p /root/.docker
REGISTRY_AUTH_FILE=/root/.docker/config.json az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
docker pull "$MDMIMAGE"
docker pull "$RPIMAGE"
docker pull "$FLUENTBITIMAGE"

az logout

echo "configuring fluentbit service"
mkdir -p /etc/fluentbit/
mkdir -p /var/lib/fluent

cat >/etc/fluentbit/fluentbit.conf <<'EOF'
[INPUT]
	Name systemd
	Tag journald
	Systemd_Filter _COMM=aro
	DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[OUTPUT]
	Name forward
	Match *
	Port 29230
EOF

echo "FLUENTBITIMAGE=$FLUENTBITIMAGE" >/etc/sysconfig/fluentbit

cat >/etc/systemd/system/fluentbit.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring mdm service"
cat >/etc/sysconfig/mdm <<EOF
MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=gateway
MDMSOURCEROLEINSTANCE='$(hostname)'
EOF

mkdir /var/etw
cat >/etc/systemd/system/mdm.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring aro-gateway service"
cat >/etc/sysconfig/aro-gateway <<EOF
ACR_RESOURCE_ID='$ACRRESOURCEID'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
DBTOKEN_URL='$DBTOKENURL'
MDM_ACCOUNT="$RPMDMACCOUNT"
MDM_NAMESPACE=Gateway
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_FEATURES='$GATEWAYFEATURES'
RPIMAGE='$RPIMAGE'
EOF

cat >/etc/systemd/system/aro-gateway.service <<EOF
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-gateway
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStartPre=/usr/bin/mkdir -p ${gateway_logdir}
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e DBTOKEN_URL \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_FEATURES \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 80:8080 \
  -p 8081:8081 \
  -p 443:8443 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  -v ${gateway_logdir}:/ctr.log:z \
  \$RPIMAGE \
  gateway
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent

mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

echo "configuring mdsd and mdm services"
for var in "mdsd" "mdm"; do
cat >/etc/systemd/system/download-$var-credentials.service <<EOF
[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var
EOF

cat >/etc/systemd/system/download-$var-credentials.timer <<EOF
[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target
EOF
done

cat >/usr/local/bin/download-credentials.sh <<EOF
#!/bin/bash
set -eu

COMPONENT="\$1"
echo "Download \$COMPONENT credentials"

TEMP_DIR=\$(mktemp -d)
export AZURE_CONFIG_DIR=\$(mktemp -d)

echo "Logging into Azure..."
RETRIES=3
while [ "\$RETRIES" -gt 0 ]; do
    if az login -i --allow-no-subscriptions
    then
        echo "az login successful"
        break
    else
        echo "az login failed. Retrying..."
        let RETRIES-=1
        sleep 5
    fi
done

trap "cleanup" EXIT

cleanup() {
  az logout
  [[ "\$TEMP_DIR" =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ "\$AZURE_CONFIG_DIR" =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [ "\$COMPONENT" = "mdm" ]; then
  CURRENT_CERT_FILE="/etc/mdm.pem"
elif [ "\$COMPONENT" = "mdsd" ]; then
  CURRENT_CERT_FILE="/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME="gwy-\${COMPONENT}"
NEW_CERT_FILE="\$TEMP_DIR/\$COMPONENT.pem"
for attempt in {1..5}; do
  az keyvault secret download --file \$NEW_CERT_FILE --id "https://$KEYVAULTPREFIX-gwy.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME" && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [ "\$COMPONENT" = "mdsd" ]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn="\$(openssl x509 -in "\$NEW_CERT_FILE" -noout -serial | awk -F= '{print \$2}')"
  current_cert_sn="\$(openssl x509 -in "\$CURRENT_CERT_FILE" -noout -serial | awk -F= '{print \$2}')"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != "\$current_cert_sn" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi
EOF

chmod u+x /usr/local/bin/download-credentials.sh

systemctl enable download-mdsd-credentials.timer
systemctl enable download-mdm-credentials.timer

/usr/local/bin/download-credentials.sh mdsd
/usr/local/bin/download-credentials.sh mdm
MDSDCERTIFICATESAN=$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')

cat >/etc/systemd/system/watch-mdm-credentials.service <<EOF
[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target
EOF

cat >/etc/systemd/system/watch-mdm-credentials.path <<EOF
[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target
EOF

systemctl enable watch-mdm-credentials.path
systemctl start watch-mdm-credentials.path

mkdir /etc/systemd/system/mdsd.service.d
cat >/etc/systemd/system/mdsd.service.d/override.conf <<'EOF'
[Unit]
After=network-online.target
EOF

cat >/etc/default/mdsd <<EOF
MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS="-A -d -r \$MDSD_ROLE_PREFIX"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$GATEWAYMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=gateway
export MONITORING_ROLE_INSTANCE='$(hostname)'

export MDSD_MSGPACK_SORT_COLUMNS=1
EOF

# setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
# to honour SSL_CERT_FILE any more, heaven only knows why.
mkdir -p /usr/lib/ssl/certs
csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 {*} >/dev/null
c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
cat >/etc/default/vsa-nodescan-agent.config <<EOF
{
    "Nice": 19,
    "Timeout": 10800,
    "ClientId": "",
    "TenantId": "$AZURESECPACKVSATENANTID",
    "QualysStoreBaseUrl": "$AZURESECPACKQUALYSURL",
    "ProcessTimeout": 300,
    "CommandDelay": 0
  }
EOF

echo "enabling aro services"
for service in aro-gateway auoms azsecd azsecmond mdsd mdm chronyd fluentbit; do
  systemctl enable $service.service
done

for scan in baseline clamav software; do
  /usr/local/bin/azsecd config -s $scan -d P1D
done

echo "rebooting"
restorecon -RF /var/log/*
(sleep 30; reboot) &
')))]" + "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','DBTOKENURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenUrl')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','GATEWAYMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayMdsdConfigVersion')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayFeatures')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

echo "setting ssh password authentication"
# We need to manually set PasswordAuthentication to true in order for the VMSS Access JIT to work
sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config
systemctl reload sshd.service

#Adding retry logic to yum commands in order to avoid stalling out on resource locks
echo "running RHUI fix"
for attempt in {1..5}; do
  yum update -y --disablerepo='*' --enablerepo='rhui-microsoft-azure*' && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "running yum update"
for attempt in {1..5}; do
  yum -y -x WALinuxAgent -x WALinuxAgent-udev update --allowerasing && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "extending partition table"
# Linux block devices are inconsistently named
# it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
growpart "$physical_disk" 2

echo "extending filesystems"
lvextend -l +20%FREE /dev/rootvg/rootlv
xfs_growfs /

lvextend -l +100%FREE /dev/rootvg/varlv
xfs_growfs /var

rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
rpm --import https://packages.microsoft.com/keys/microsoft.asc

for attempt in {1..5}; do
  yum -y install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "configuring logrotate"

# gateway_logdir is a readonly variable that specifies the host path mount point for the gateway container log file
# for the purpose of rotating the gateway logs
declare -r gateway_logdir='/var/log/aro-gateway'

cat >/etc/logrotate.conf <<EOF
# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we'll rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}

# Maximum log directory size is 100G with this configuration
# Setting limit to 100G to allow space for other logging services
# copytruncate is a critical option used to prevent logs from being shipped twice
${gateway_logdir} {
    size 20G
    rotate 5
    create 0600 root root
    copytruncate
    noolddir
    compress
}
EOF

echo "configuring yum repository and running yum update"
cat >/etc/yum.repos.d/azure.repo <<'EOF'
[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no
EOF

semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?"
mkdir -p /var/log/journal

for attempt in {1..5}; do
  yum -y install clamav azsec-clamav azsec-monitor azure-cli azure-mdsd azure-security podman-docker openssl-perl python3 && break
  # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "applying firewall rules"
# https://access.redhat.com/security/cve/cve-2020-13401
cat >/etc/sysctl.d/02-disable-accept-ra.conf <<'EOF'
net.ipv6.conf.all.accept_ra=0
EOF

cat >/etc/sysctl.d/01-disable-core.conf <<'EOF'
kernel.core_pattern = |/bin/true
EOF
sysctl --system

firewall-cmd --add-port=80/tcp --permanent
firewall-cmd --add-port=8081/tcp --permanent
firewall-cmd --add-port=443/tcp --permanent

echo "logging into prod acr"
export AZURE_CLOUD_NAME=$AZURECLOUDNAME
az login -i --allow-no-subscriptions

# The managed identity that the VM runs as only has a single roleassignment.
# This role assignment is ACRPull which is not necessarily present in the
# subscription we're deploying into.  If the identity does not have any
# role assignments scoped on the subscription we're deploying into, it will
# not show on az login -i, which is why the below line is commented.
# az account set -s "$SUBSCRIPTIONID"

# Suppress emulation output for podman instead of docker for az acr compatability
mkdir -p /etc/containers/
touch /etc/containers/nodocker

mkdir -p /root/.docker
REGISTRY_AUTH_FILE="/root/.docker/config.json"
az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
docker pull "$MDMIMAGE"
docker pull "$RPIMAGE"
docker pull "$FLUENTBITIMAGE"

az logout

echo "configuring fluentbit service"
mkdir -p /etc/fluentbit/
mkdir -p /var/lib/fluent

cat >/etc/fluentbit/fluentbit.conf <<'EOF'
[INPUT]
	Name systemd
	Tag journald
	Systemd_Filter _COMM=aro
	DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[OUTPUT]
	Name forward
	Match *
	Port 29230
EOF

echo "FLUENTBITIMAGE=$FLUENTBITIMAGE" >/etc/sysconfig/fluentbit

cat >/etc/systemd/system/fluentbit.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring mdm service"
cat >/etc/sysconfig/mdm <<EOF
MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=gateway
MDMSOURCEROLEINSTANCE='$(hostname)'
EOF

mkdir /var/etw
cat >/etc/systemd/system/mdm.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring aro-gateway service"
cat >/etc/sysconfig/aro-gateway <<EOF
ACR_RESOURCE_ID='$ACRRESOURCEID'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
DBTOKEN_URL='$DBTOKENURL'
MDM_ACCOUNT="$RPMDMACCOUNT"
MDM_NAMESPACE=Gateway
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_FEATURES='$GATEWAYFEATURES'
RPIMAGE='$RPIMAGE'
EOF

cat >/etc/systemd/system/aro-gateway.service <<EOF
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-gateway
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStartPre=/usr/bin/mkdir -p ${gateway_logdir}
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e DBTOKEN_URL \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_FEATURES \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 80:8080 \
  -p 8081:8081 \
  -p 443:8443 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  -v ${gateway_logdir}:/ctr.log:z \
  \$RPIMAGE \
  gateway
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent

mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

echo "configuring mdsd and mdm services"
for var in "mdsd" "mdm"; do
cat >/etc/systemd/system/download-$var-credentials.service <<EOF
[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var
EOF

cat >/etc/systemd/system/download-$var-credentials.timer <<EOF
[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target
EOF
done

cat >/usr/local/bin/download-credentials.sh <<EOF
#!/bin/bash
set -eu

COMPONENT="\$1"
echo "Download \$COMPONENT credentials"

TEMP_DIR=\$(mktemp -d)
export AZURE_CONFIG_DIR=\$(mktemp -d)

echo "Logging into Azure..."
RETRIES=3
while [ "\$RETRIES" -gt 0 ]; do
    if az login -i --allow-no-subscriptions
    then
        echo "az login successful"
        break
    else
        echo "az login failed. Retrying..."
        let RETRIES-=1
        sleep 5
    fi
done

trap "cleanup" EXIT

cleanup() {
  az logout
  [[ "\$TEMP_DIR" =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ "\$AZURE_CONFIG_DIR" =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [ "\$COMPONENT" = "mdm" ]; then
  CURRENT_CERT_FILE="/etc/mdm.pem"
elif [ "\$COMPONENT" = "mdsd" ]; then
  CURRENT_CERT_FILE="/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME="gwy-\${COMPONENT}"
NEW_CERT_FILE="\$TEMP_DIR/\$COMPONENT.pem"
for attempt in {1..5}; do
  az keyvault secret download --file \$NEW_CERT_FILE --id "https://$KEYVAULTPREFIX-gwy.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME" && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [ "\$COMPONENT" = "mdsd" ]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn="\$(openssl x509 -in "\$NEW_CERT_FILE" -noout -serial | awk -F= '{print \$2}')"
  current_cert_sn="\$(openssl x509 -in "\$CURRENT_CERT_FILE" -noout -serial | awk -F= '{print \$2}')"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != "\$current_cert_sn" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi
EOF

chmod u+x /usr/local/bin/download-credentials.sh

systemctl enable download-mdsd-credentials.timer
systemctl enable download-mdm-credentials.timer

/usr/local/bin/download-credentials.sh mdsd
/usr/local/bin/download-credentials.sh mdm
MDSDCERTIFICATESAN=$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')

cat >/etc/systemd/system/watch-mdm-credentials.service <<EOF
[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target
EOF

cat >/etc/systemd/system/watch-mdm-credentials.path <<EOF
[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target
EOF

systemctl enable watch-mdm-credentials.path
systemctl start watch-mdm-credentials.path

mkdir /etc/systemd/system/mdsd.service.d
cat >/etc/systemd/system/mdsd.service.d/override.conf <<'EOF'
[Unit]
After=network-online.target
EOF

cat >/etc/default/mdsd <<EOF
MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS="-A -d -r \$MDSD_ROLE_PREFIX"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$GATEWAYMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=gateway
export MONITORING_ROLE_INSTANCE='$(hostname)'

export MDSD_MSGPACK_SORT_COLUMNS=1
EOF

# setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
# to honour SSL_CERT_FILE any more, heaven only knows why.
mkdir -p /usr/lib/ssl/certs
csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 {*} >/dev/null
c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
cat >/etc/default/vsa-nodescan-agent.config <<EOF
{
    "Nice": 19,
    "Timeout": 10800,
    "ClientId": "",
    "TenantId": "$AZURESECPACKVSATENANTID",
    "QualysStoreBaseUrl": "$AZURESECPACKQUALYSURL",
    "ProcessTimeout": 300,
    "CommandDelay": 0
  }
EOF

echo "enabling aro services"
for service in aro-gateway auoms azsecd azsecmond mdsd mdm chronyd fluentbit; do
  systemctl enable $service.service
done

for scan in baseline clamav software; do
  /usr/local/bin/azsecd config -s $scan -d P1D
done

echo "rebooting"
restorecon -RF /var/log/*
(sleep 30; reboot) &
')))]" } } } diff --git a/pkg/deploy/assets/rp-production.json b/pkg/deploy/assets/rp-production.json index 7b80cdb2236..eec290c2170 100644 --- a/pkg/deploy/assets/rp-production.json +++ b/pkg/deploy/assets/rp-production.json @@ -516,7 +516,7 @@ "autoUpgradeMinorVersion": true, "settings": {}, "protectedSettings": { - "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','ADMINAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('adminApiClientCertCommonName')),''')\n','ARMAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armApiClientCertCommonName')),''')\n','ARMCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armClientId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','BILLINGE2ESTORAGEACCOUNTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('billingE2EStorageAccountId')),''')\n','CLUSTERMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdmAccount')),''')\n','CLUSTERMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdAccount')),''')\n','CLUSTERMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdConfigVersion')),''')\n','CLUSTERMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdNamespace')),''')\n','CLUSTERPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterParentDomainName')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','FPCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpClientId')),''')\n','FPSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpServicePrincipalId')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYRESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayResourceGroupName')),''')\n','GATEWAYSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayServicePrincipalId')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','PORTALACCESSGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalAccessGroupIds')),''')\n','PORTALCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalClientId')),''')\n','PORTALELEVATEDGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalElevatedGroupIds')),''')\n','RPFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpFeatures')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdConfigVersion')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','RPPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpParentDomainName')),''')\n','CLUSTERSINSTALLVIAHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersInstallViaHive')),''')\n','CLUSTERSADOPTBYHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersAdoptByHive')),''')\n','CLUSTERDEFAULTINSTALLERPULLSPEC=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterDefaultInstallerPullspec')),''')\n','USECHECKACCESS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('useCheckAccess')),''')\n','ADMINAPICABUNDLE=''',parameters('adminApiCaBundle'),'''\n','ARMAPICABUNDLE=''',parameters('armApiCaBundle'),'''\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

echo "setting ssh password authentication"
# We need to manually set PasswordAuthentication to true in order for the VMSS Access JIT to work
sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config
systemctl reload sshd.service

#Adding retry logic to yum commands in order to avoid stalling out on resource locks
echo "running RHUI fix"
for attempt in {1..5}; do
  yum update -y --disablerepo='*' --enablerepo='rhui-microsoft-azure*' && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "running yum update"
for attempt in {1..5}; do
  yum -y -x WALinuxAgent -x WALinuxAgent-udev update --allowerasing && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "extending partition table"
# Linux block devices are inconsistently named
# it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
physicalDisk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
growpart "$physicalDisk" 2

echo "extending filesystems"
lvextend -l +20%FREE /dev/rootvg/rootlv
xfs_growfs /

lvextend -l +100%FREE /dev/rootvg/varlv
xfs_growfs /var

echo "importing rpm repositories"
rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
rpm --import https://packages.microsoft.com/keys/microsoft.asc

for attempt in {1..5}; do
  yum -y install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "configuring logrotate"
cat >/etc/logrotate.conf <<'EOF'
# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we'll rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}
EOF

echo "configuring yum repository and running yum update"
cat >/etc/yum.repos.d/azure.repo <<'EOF'
[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no
EOF

semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?"
mkdir -p /var/log/journal

for attempt in {1..5}; do
yum -y install clamav azsec-clamav azsec-monitor azure-cli azure-mdsd azure-security podman podman-docker openssl-perl python3 && break
  # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

# https://access.redhat.com/security/cve/cve-2020-13401
echo "applying firewall rules"
cat >/etc/sysctl.d/02-disable-accept-ra.conf <<'EOF'
net.ipv6.conf.all.accept_ra=0
EOF

cat >/etc/sysctl.d/01-disable-core.conf <<'EOF'
kernel.core_pattern = |/bin/true
EOF
sysctl --system

firewall-cmd --add-port=443/tcp --permanent
firewall-cmd --add-port=444/tcp --permanent
firewall-cmd --add-port=445/tcp --permanent
firewall-cmd --add-port=2222/tcp --permanent

export AZURE_CLOUD_NAME=$AZURECLOUDNAME

echo "logging into prod acr"
az login -i --allow-no-subscriptions

# Suppress emulation output for podman instead of docker for az acr compatability
mkdir -p /etc/containers/
touch /etc/containers/nodocker

mkdir -p /root/.docker
REGISTRY_AUTH_FILE=/root/.docker/config.json az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
docker pull "$MDMIMAGE"
docker pull "$RPIMAGE"
docker pull "$FLUENTBITIMAGE"

az logout

echo "configuring fluentbit service"
mkdir -p /etc/fluentbit/
mkdir -p /var/lib/fluent

cat >/etc/fluentbit/fluentbit.conf <<'EOF'
[INPUT]
	Name systemd
	Tag journald
	Systemd_Filter _COMM=aro
	DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND asyncqos asyncqos true

[FILTER]
	Name modify
	Match asyncqos
	Remove CLIENT_PRINCIPAL_NAME
	Remove FILE
	Remove COMPONENT

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND ifxaudit ifxaudit false

[OUTPUT]
	Name forward
	Match *
	Port 29230
EOF

echo "FLUENTBITIMAGE=$FLUENTBITIMAGE" >/etc/sysconfig/fluentbit

cat >/etc/systemd/system/fluentbit.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

mkdir /etc/aro-rp
base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem
if [[ -n "$ARMAPICABUNDLE" ]]; then
  base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem
fi
chown -R 1000:1000 /etc/aro-rp

echo "configuring mdm service"
cat >/etc/sysconfig/mdm <<EOF
MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=rp
MDMSOURCEROLEINSTANCE='$(hostname)'
EOF

mkdir /var/etw
cat >/etc/systemd/system/mdm.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring aro-rp service"
cat >/etc/sysconfig/aro-rp <<EOF
ACR_RESOURCE_ID='$ACRRESOURCEID'
ADMIN_API_CLIENT_CERT_COMMON_NAME='$ADMINAPICLIENTCERTCOMMONNAME'
ARM_API_CLIENT_CERT_COMMON_NAME='$ARMAPICLIENTCERTCOMMONNAME'
AZURE_ARM_CLIENT_ID='$ARMCLIENTID'
AZURE_FP_CLIENT_ID='$FPCLIENTID'
AZURE_FP_SERVICE_PRINCIPAL_ID='$FPSERVICEPRINCIPALID'
BILLING_E2E_STORAGE_ACCOUNT_ID='$BILLINGE2ESTORAGEACCOUNTID'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=RP
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=RP
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
RP_FEATURES='$RPFEATURES'
RPIMAGE='$RPIMAGE'
ARO_INSTALL_VIA_HIVE='$CLUSTERSINSTALLVIAHIVE'
ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC='$CLUSTERDEFAULTINSTALLERPULLSPEC'
ARO_ADOPT_BY_HIVE='$CLUSTERSADOPTBYHIVE'
USE_CHECKACCESS='$USECHECKACCESS'
EOF

cat >/etc/systemd/system/aro-rp.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-rp
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e ADMIN_API_CLIENT_CERT_COMMON_NAME \
  -e ARM_API_CLIENT_CERT_COMMON_NAME \
  -e AZURE_ARM_CLIENT_ID \
  -e AZURE_FP_CLIENT_ID \
  -e BILLING_E2E_STORAGE_ACCOUNT_ID \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e CLUSTER_MDSD_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e DOMAIN_NAME \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e MDSD_ENVIRONMENT \
  -e RP_FEATURES \
  -e ARO_INSTALL_VIA_HIVE \
  -e ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC \
  -e ARO_ADOPT_BY_HIVE \
  -e USE_CHECKACCESS \
  -m 2g \
  -p 443:8443 \
  -v /etc/aro-rp:/etc/aro-rp \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  rp
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring aro-dbtoken service"
cat >/etc/sysconfig/aro-dbtoken <<EOF
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=DBToken
RPIMAGE='$RPIMAGE'
EOF

cat >/etc/systemd/system/aro-dbtoken.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-dbtoken
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 445:8445 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  dbtoken
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

# DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE
# are not used, but can't easily be refactored out. Should be revisited in the future.
echo "configuring aro-monitor service"
cat >/etc/sysconfig/aro-monitor <<EOF
AZURE_FP_CLIENT_ID='$FPCLIENTID'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=BBM
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=BBM
RPIMAGE='$RPIMAGE'
EOF

cat >/etc/systemd/system/aro-monitor.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-monitor
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_FP_CLIENT_ID \
  -e DOMAIN_NAME \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e MDSD_ENVIRONMENT \
  -e CLUSTER_MDSD_NAMESPACE \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2.5g \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  monitor
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring aro-portal service"
cat >/etc/sysconfig/aro-portal <<EOF
AZURE_PORTAL_ACCESS_GROUP_IDS='$PORTALACCESSGROUPIDS'
AZURE_PORTAL_CLIENT_ID='$PORTALCLIENTID'
AZURE_PORTAL_ELEVATED_GROUP_IDS='$PORTALELEVATEDGROUPIDS'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Portal
PORTAL_HOSTNAME='$LOCATION.admin.$RPPARENTDOMAINNAME'
RPIMAGE='$RPIMAGE'
EOF

cat >/etc/systemd/system/aro-portal.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target
StartLimitInterval=0

[Service]
EnvironmentFile=/etc/sysconfig/aro-portal
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_PORTAL_ACCESS_GROUP_IDS \
  -e AZURE_PORTAL_CLIENT_ID \
  -e AZURE_PORTAL_ELEVATED_GROUP_IDS \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e PORTAL_HOSTNAME \
  -m 2g \
  -p 444:8444 \
  -p 2222:2222 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  portal
Restart=always
RestartSec=1

[Install]
WantedBy=multi-user.target
EOF

echo "configuring mdsd and mdm services"
chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent

mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

for var in "mdsd" "mdm"; do
cat >/etc/systemd/system/download-$var-credentials.service <<EOF
[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var
EOF

cat >/etc/systemd/system/download-$var-credentials.timer <<EOF
[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target
EOF
done

cat >/usr/local/bin/download-credentials.sh <<EOF
#!/bin/bash
set -eu

COMPONENT="\$1"
echo "Download \$COMPONENT credentials"

TEMP_DIR=\$(mktemp -d)
export AZURE_CONFIG_DIR=\$(mktemp -d)

echo "Logging into Azure..."
RETRIES=3
while [ "\$RETRIES" -gt 0 ]; do
    if az login -i --allow-no-subscriptions
    then
        echo "az login successful"
        break
    else
        echo "az login failed. Retrying..."
        let RETRIES-=1
        sleep 5
    fi
done

trap "cleanup" EXIT

cleanup() {
  az logout
  [[ "\$TEMP_DIR" =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ "\$AZURE_CONFIG_DIR" =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [ "\$COMPONENT" = "mdm" ]; then
  CURRENT_CERT_FILE="/etc/mdm.pem"
elif [ "\$COMPONENT" = "mdsd" ]; then
  CURRENT_CERT_FILE="/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME="rp-\${COMPONENT}"
NEW_CERT_FILE="\$TEMP_DIR/\$COMPONENT.pem"
for attempt in {1..5}; do
  az keyvault secret download --file \$NEW_CERT_FILE --id "https://$KEYVAULTPREFIX-svc.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME" && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [ "\$COMPONENT" = "mdsd" ]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn="\$(openssl x509 -in "\$NEW_CERT_FILE" -noout -serial | awk -F= '{print \$2}')"
  current_cert_sn="\$(openssl x509 -in "\$CURRENT_CERT_FILE" -noout -serial | awk -F= '{print \$2}')"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != "\$current_cert_sn" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi
EOF

chmod u+x /usr/local/bin/download-credentials.sh

systemctl enable download-mdsd-credentials.timer
systemctl enable download-mdm-credentials.timer

/usr/local/bin/download-credentials.sh mdsd
/usr/local/bin/download-credentials.sh mdm
MDSDCERTIFICATESAN=$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')

cat >/etc/systemd/system/watch-mdm-credentials.service <<EOF
[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target
EOF

cat >/etc/systemd/system/watch-mdm-credentials.path <<EOF
[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target
EOF

systemctl enable watch-mdm-credentials.path
systemctl start watch-mdm-credentials.path

mkdir /etc/systemd/system/mdsd.service.d
cat >/etc/systemd/system/mdsd.service.d/override.conf <<'EOF'
[Unit]
After=network-online.target
EOF

cat >/etc/default/mdsd <<EOF
MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS="-A -d -r \$MDSD_ROLE_PREFIX"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$RPMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=rp
export MONITORING_ROLE_INSTANCE='$(hostname)'

export MDSD_MSGPACK_SORT_COLUMNS=1
EOF

# setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
# to honour SSL_CERT_FILE any more, heaven only knows why.
mkdir -p /usr/lib/ssl/certs
csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 {*} >/dev/null
c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
cat >/etc/default/vsa-nodescan-agent.config <<EOF
{
    "Nice": 19,
    "Timeout": 10800,
    "ClientId": "",
    "TenantId": "$AZURESECPACKVSATENANTID",
    "QualysStoreBaseUrl": "$AZURESECPACKQUALYSURL",
    "ProcessTimeout": 300,
    "CommandDelay": 0
  }
EOF

echo "enabling aro services"
for service in aro-dbtoken aro-monitor aro-portal aro-rp auoms azsecd azsecmond mdsd mdm chronyd fluentbit; do
  systemctl enable $service.service
done

for scan in baseline clamav software; do
  /usr/local/bin/azsecd config -s $scan -d P1D
done

echo "rebooting"
restorecon -RF /var/log/*
(sleep 30; reboot) &
')))]" + "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','ADMINAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('adminApiClientCertCommonName')),''')\n','ARMAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armApiClientCertCommonName')),''')\n','ARMCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armClientId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','BILLINGE2ESTORAGEACCOUNTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('billingE2EStorageAccountId')),''')\n','CLUSTERMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdmAccount')),''')\n','CLUSTERMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdAccount')),''')\n','CLUSTERMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdConfigVersion')),''')\n','CLUSTERMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdNamespace')),''')\n','CLUSTERPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterParentDomainName')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','FPCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpClientId')),''')\n','FPSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpServicePrincipalId')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYRESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayResourceGroupName')),''')\n','GATEWAYSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayServicePrincipalId')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','PORTALACCESSGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalAccessGroupIds')),''')\n','PORTALCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalClientId')),''')\n','PORTALELEVATEDGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalElevatedGroupIds')),''')\n','RPFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpFeatures')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdConfigVersion')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','RPPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpParentDomainName')),''')\n','CLUSTERSINSTALLVIAHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersInstallViaHive')),''')\n','CLUSTERSADOPTBYHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersAdoptByHive')),''')\n','CLUSTERDEFAULTINSTALLERPULLSPEC=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterDefaultInstallerPullspec')),''')\n','USECHECKACCESS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('useCheckAccess')),''')\n','ADMINAPICABUNDLE=''',parameters('adminApiCaBundle'),'''\n','ARMAPICABUNDLE=''',parameters('armApiCaBundle'),'''\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

set -o errexit \
    -o nounset

trap 'catch' ERR

main() {
    configure_sshd
    configure_and_install_dnf_pkgs_repos
    configure_disk_partitions
    configure_logrotate
    configure_selinux

    mkdir -p /var/log/journal
    mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

    configure_firewalld_rules
    pull_container_images
    configure_system_services
    reboot_vm
}

# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work
configure_sshd() {
    log "setting ssh password authentication"
    sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config

    systemctl reload sshd.service
    systemctl is-active --quiet sshd || abort "sshd failed to reload"
}

# configure_and_install_dnf_pkgs_repos
configure_and_install_dnf_pkgs_repos() {
    configure_rhui_repo
    create_azure_rpm_repos
    dnf_update_pkgs
    dnf_install_pkgs
}

# configure_rhui_repo
configure_rhui_repo() {
    log "running RHUI package updates"
    #Adding retry logic to yum commands in order to avoid stalling out on resource locks
    for attempt in {1..5}; do
        dnf update \
            -y \
            --disablerepo='*' \
            --enablerepo='rhui-microsoft-azure*' \
            && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep 10
        else
            abort "failed to run dnf update"
        fi
    done
}

# dnf_update_pkgs
dnf_update_pkgs() {
    log "running dnf update"
    for attempt in {1..5}; do
        dnf -y \
            -x WALinuxAgent \
            -x WALinuxAgent-udev \
            update --allowerasing \
            && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep 10
        else
            return 1
        fi
    done
}

# dnf_install_pkgs
dnf_install_pkgs() {
    log "importing rpm repositories"
    rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
    rpm --import https://packages.microsoft.com/keys/microsoft.asc

    for attempt in {1..5}; do
        dnf -y \
            install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm \
            && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep 10
        else
            return 1
        fi
    done

    for attempt in {1..5}; do
        dnf -y \
            install \
            clamav \
            azsec-clamav \
            azsec-monitor \
            azure-cli \
            azure-mdsd \
            azure-security \
            podman \
            podman-docker \
            openssl-perl \
            python3 \
            && break
        # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
        if [[ ${attempt} -lt 5 ]]; then
            sleep 10
        else
            abort "failed to install required packages"
        fi
    done
}

# configure_disk_partitions
configure_disk_partitions() {
    log "extending partition table"
    # Linux block devices are inconsistently named
    # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
    physicalDisk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
    growpart "$physicalDisk" 2

    log "extending filesystems"
    log "extending root lvm"
    lvextend -l +20%FREE /dev/rootvg/rootlv
    log "growing root filesystem"
    xfs_growfs /

    log "extending var lvm"
    lvextend -l +100%FREE /dev/rootvg/varlv
    log "growing var filesystem"
    xfs_growfs /var
}

# configure_logrotate clobbers /etc/logrotate.conf
configure_logrotate() {
    local -r logrotate_conf_filename='/etc/logrotate.conf'
    local -r logrotate_conf_file='# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we will rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}'

    write_file logrotate_conf_filename logrotate_conf_file true
}

# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file
create_azure_rpm_repos() {
    local -r azure_repo_filename='/etc/yum.repos.d/azure.repo'
    local -r azure_repo_file='[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no'

    write_file azure_repo_filename azure_repo_file
}

# configure_selinux
configure_selinux() {
    local -r relabel="${1:-false}"

    already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined"
    semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error"
    chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent

    if "$relabel"; then
        restorecon -RF /var/log/* || log "$already_defined_ignore_error"
    fi
}

# configure_firewalld_rules
configure_firewalld_rules() {
    # https://access.redhat.com/security/cve/cve-2020-13401
    local -r prefix="/etc/sysctl.d"
    local -r diable_accept_ra_conf="$prefix/02-disable-accept-ra.conf"
    log "Writing $diable_accept_ra_conf"
cat >"$diable_accept_ra_conf" <<'EOF'
net.ipv6.conf.all.accept_ra=0
EOF

    local -r disable_core_filename="$prefix/01-disable-core.conf"
    local -r disable_core_file="kernel.core_pattern = |/bin/true
    "
    write_file disable_core_filename disable_core_file

    sysctl --system

    enable_ports=(
        "443/tcp"
        "444/tcp"
        "445/tcp"
        "2222/tcp"
    )
    log "Enabling ports ${enable_ports[*]} on default firewalld zone"
    # shellcheck disable=SC2068
    for port in ${enable_ports[@]}; do
        log "Enabling port $port now"
        firewall-cmd "--add-port=$port"
    done

    firewall-cmd --runtime-to-permanent
}

# pull_container_images
pull_container_images() {
    echo "logging into prod acr"
    az login -i --allow-no-subscriptions

    # Suppress emulation output for podman instead of docker for az acr compatability
    mkdir -p /etc/containers/
    touch /etc/containers/nodocker

    mkdir -p /root/.docker
    local -r REGISTRY_AUTH_FILE="/root/.docker/config.json"
    
    az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

    MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
    docker pull "$MDMIMAGE"
    docker pull "$RPIMAGE"
    docker pull "$FLUENTBITIMAGE"

    az logout
}

# configure_system_services creates, configures, and enables the following systemd services and timers
# services
#   fluentbit
#   mdm
#   mdsd
#   arp-rp
#   aro-dbtoken
#   aro-monitor
#   aro-portal
configure_system_services() {
    configure_service_fluentbit
    configure_service_mdm
    configure_timers_mdm_mdsd
    configure_service_aro_rp
    configure_service_aro_dbtoken
    configure_service_aro_monitor
    configure_service_aro_portal
    configure_service_mdsd
}

# enable_aro_services enables all services required for aro rp
enable_aro_services() {
    local -ra aro_services=(
        "aro-dbtoken"
        "aro-monitor"
        "aro-portal"
        "aro-rp"
        "auoms"
        "azsecd"
        "azsecmond"
        "mdsd"
        "mdm"
        "chronyd"
        "fluentbit"
    )
    log "enabling aro services ${aro_services[*]}"
    # shellcheck disable=SC2068
    for service in ${aro_services[@]}; do
        log "Enabling $service now"
        systemctl enable "$service.service"
    done
}

# configure_service_fluentbit
configure_service_fluentbit() {
    log "configuring fluentbit service"
    mkdir -p /etc/fluentbit/
    mkdir -p /var/lib/fluent

    local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf'
    local -r fluentbit_conf_file="[INPUT]
Name systemd
Tag journald
Systemd_Filter _COMM=aro
DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND asyncqos asyncqos true

[FILTER]
	Name modify
	Match asyncqos
	Remove CLIENT_PRINCIPAL_NAME
	Remove FILE
	Remove COMPONENT

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND ifxaudit ifxaudit false

[OUTPUT]
	Name forward
	Match *
	Port 29230"

    write_file fluentbit_conf_filename fluentbit_conf_file

    local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit'
    local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE"

    write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file

    local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service'

    local -r fluentbit_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file fluentbit_conf_filename fluentbit_conf_file
}

# configure_certs
configure_certs() {
    mkdir /etc/aro-rp
    base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem
    if [[ -n "$ARMAPICABUNDLE" ]]; then
    base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem
    fi
    chown -R 1000:1000 /etc/aro-rp

    # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
    # to honour SSL_CERT_FILE any more, heaven only knows why.
    mkdir -p /usr/lib/ssl/certs
    csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null
    c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
    local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config"
    local -r nodescan_agent_file="{
    \"Nice\": 19,
    \"Timeout\": 10800,
    \"ClientId\": \"\",
    \"TenantId\": $AZURESECPACKVSATENANTID,
    \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL,
    \"ProcessTimeout\": 300,
    \"CommandDelay\": 0
  }"

    write_file nodescan_agent_filename nodescan_agent_file
}

# configure_service_mdm
configure_service_mdm() {
    log "configuring mdm service"

    local -r sysconfig_mdm_filename="/etc/sysconfig/mdm"
    local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=rp
MDMSOURCEROLEINSTANCE=\"$(hostname)\""

    write_file sysconfig_mdm_filename sysconfig_mdm_file

    mkdir -p /var/etw
    local -r mdm_service_filename="/etc/systemd/system/mdm.service"
    local -r mdm_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file mdm_service_filename mdm_service_file
}

# configure_timers_mdm_mdsd
configure_timers_mdm_mdsd() {
    for var in "mdsd" "mdm"; do
        local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service"
        local download_creds_service_file="[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var"

        write_file download_creds_service_filename download_creds_service_file

        local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer"
        local download_creds_timer_file="[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target"

        write_file download_creds_timer_filename download_creds_timer_file
    done

    local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh"
    local -r download_creds_script_file="#!/bin/bash
set -eu

COMPONENT=\$1
echo \"Download \$COMPONENT credentials\"

TEMP_DIR=\"\$(mktemp -d)\"
export AZURE_CONFIG_DIR=\"\$(mktemp -d)\"

echo \"Logging into Azure...\"
RETRIES=3
while [[ \$RETRIES -gt 0 ]]; do
    if az login -i --allow-no-subscriptions
    then
        echo \"az login successful\"
        break
    else
        echo \"az login failed. Retrying...\"
        let RETRIES-=1
        sleep 5
    fi
done

trap \"cleanup\" EXIT

cleanup() {
  az logout
  [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [[ \$COMPONENT = \"mdm\" ]]; then
  CURRENT_CERT_FILE=\"/etc/mdm.pem\"
elif [[ \$COMPONENT\ = \"mdsd\" ]]; then
  CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME=\"rp-\${COMPONENT}\"
NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\"
for attempt in {1..5}; do
  az keyvault \
    secret \
    download \
    --file \"\$NEW_CERT_FILE\" \
    --id \"https://$KEYVAULTPREFIX-svc.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \
    && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [[ \$COMPONENT = \"mdsd\" ]]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi"

    write_file download_creds_script_filename download_creds_script_file

    chmod u+x /usr/local/bin/download-credentials.sh

    systemctl enable download-mdsd-credentials.timer
    systemctl enable download-mdm-credentials.timer

    /usr/local/bin/download-credentials.sh mdsd
    /usr/local/bin/download-credentials.sh mdm

    local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')"
    local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service"
    local -r watch_mdm_creds_service_file="[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target"

    write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file

    local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path'
    local -r watch_mdm_creds_path_file='[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target'

    write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file

    local -r watch_mdm_creds='watch-mdm-credentials.path'
    systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds"
    systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds"
}

# configure_service_aro_rp
configure_service_aro_rp() {
    local -r aro_rp_conf_filename='/etc/sysconfig/aro-rp'
    local -r aro_rp_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID'
ADMIN_API_CLIENT_CERT_COMMON_NAME='$ADMINAPICLIENTCERTCOMMONNAME'
ARM_API_CLIENT_CERT_COMMON_NAME='$ARMAPICLIENTCERTCOMMONNAME'
AZURE_ARM_CLIENT_ID='$ARMCLIENTID'
AZURE_FP_CLIENT_ID='$FPCLIENTID'
AZURE_FP_SERVICE_PRINCIPAL_ID='$FPSERVICEPRINCIPALID'
BILLING_E2E_STORAGE_ACCOUNT_ID='$BILLINGE2ESTORAGEACCOUNTID'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=RP
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=RP
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
RP_FEATURES='$RPFEATURES'
RPIMAGE='$RPIMAGE'
ARO_INSTALL_VIA_HIVE='$CLUSTERSINSTALLVIAHIVE'
ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC='$CLUSTERDEFAULTINSTALLERPULLSPEC'
ARO_ADOPT_BY_HIVE='$CLUSTERSADOPTBYHIVE'
USE_CHECKACCESS='$USECHECKACCESS'"

    write_file aro_rp_conf_filename aro_rp_conf_file

    local -r aro_rp_service_filename='/etc/systemd/system/aro-rp.service'
    local -r aro_rp_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-rp
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e ADMIN_API_CLIENT_CERT_COMMON_NAME \
  -e ARM_API_CLIENT_CERT_COMMON_NAME \
  -e AZURE_ARM_CLIENT_ID \
  -e AZURE_FP_CLIENT_ID \
  -e BILLING_E2E_STORAGE_ACCOUNT_ID \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e CLUSTER_MDSD_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e DOMAIN_NAME \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e MDSD_ENVIRONMENT \
  -e RP_FEATURES \
  -e ARO_INSTALL_VIA_HIVE \
  -e ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC \
  -e ARO_ADOPT_BY_HIVE \
  -e USE_CHECKACCESS \
  -m 2g \
  -p 443:8443 \
  -v /etc/aro-rp:/etc/aro-rp \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  rp
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_rp_service_filename aro_rp_conf_file
}

# configure_service_aro_dbtoken
configure_service_aro_dbtoken() {
    local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken'
    local -r aro_dbtoken_service_conf_file="DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=DBToken
RPIMAGE='$RPIMAGE'"

    write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file

    local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service'
    local -r aro_dbtoken_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-dbtoken
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 445:8445 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  dbtoken
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_dbtoken_service_filename aro_dbtoken_service_file
}

# configure_service_aro_monitor
configure_service_aro_monitor() {
    log "configuring aro-monitor service"
    # DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE
    # are not used, but can't easily be refactored out. Should be revisited in the future.
    local -r aro_monitor_service_conf_filename='/etc/sysconfig/aro-monitor'
    local -r aro_monitor_service_conf_file="AZURE_FP_CLIENT_ID='$FPCLIENTID'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=BBM
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=BBM
RPIMAGE='$RPIMAGE'"

    write_file aro_monitor_service_conf_filename aro_monitor_service_conf_file

    local -r aro_monitor_service_filename='/etc/systemd/system/aro-monitor.service'
    local -r aro_monitor_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-monitor
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_FP_CLIENT_ID \
  -e DOMAIN_NAME \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e MDSD_ENVIRONMENT \
  -e CLUSTER_MDSD_NAMESPACE \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2.5g \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  monitor
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_monitor_service_filename aro_monitor_service_file
}

# configure_service_aro_portal
configure_service_aro_portal() {
    local -r aro_portal_service_conf_filename='/etc/sysconfig/aro-portal'
    local -r aro_portal_service_conf_file="AZURE_PORTAL_ACCESS_GROUP_IDS='$PORTALACCESSGROUPIDS'
AZURE_PORTAL_CLIENT_ID='$PORTALCLIENTID'
AZURE_PORTAL_ELEVATED_GROUP_IDS='$PORTALELEVATEDGROUPIDS'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Portal
PORTAL_HOSTNAME='$LOCATION.admin.$RPPARENTDOMAINNAME'
RPIMAGE='$RPIMAGE'"

    write_file aro_portal_service_conf_filename aro_portal_service_conf_file

    local -r aro_portal_service_filename='/etc/systemd/system/aro-portal.service'
    local -r aro_portal_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitInterval=0

[Service]
EnvironmentFile=/etc/sysconfig/aro-portal
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_PORTAL_ACCESS_GROUP_IDS \
  -e AZURE_PORTAL_CLIENT_ID \
  -e AZURE_PORTAL_ELEVATED_GROUP_IDS \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e PORTAL_HOSTNAME \
  -m 2g \
  -p 444:8444 \
  -p 2222:2222 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  portal
Restart=always
RestartSec=1

[Install]
WantedBy=multi-user.target"

    write_file aro_portal_service_conf_filename aro_portal_service_conf_file
}

# configure_service_mdsd
configure_service_mdsd() {
    local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d"
    mkdir "$mdsd_service_dir"

    local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf"
    local -r mdsd_override_conf_file="[Unit]
After=network-online.target"

    write_file mdsd_override_conf_filename mdsd_override_conf_file

    local -r default_mdsd_filename="/etc/default/mdsd"
    local -r default_mdsd_file="MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS=\"-A -d -r \$MDSD_ROLE_PREFIX\"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$RPMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=rp
export MONITORING_ROLE_INSTANCE=\"$(hostname)\"

export MDSD_MSGPACK_SORT_COLUMNS=1\""

    write_file default_mdsd_filename default_mdsd_file

}

# run_azsecd_config_scan
run_azsecd_config_scan() {
    local -ar configs=(
        "baseline"
        "clamav"
        "software"
    )

    log "Scanning configuration files ${configs[*]}"
    # shellcheck disable=SC2068
    for scan in ${configs[@]}; do
        log "Scanning config file $scan now"
        /usr/local/bin/azsecd config -s "$scan" -d P1D
    done
}

# write_file
# Args
# 1) filename - string
# 2) file_contents - string
# 3) clobber - boolean; optional - defaults to false
write_file() {
    local -n filename="$1"
    local -n file_contents="$2"
    local -r clobber="${3:-false}"

    if $clobber; then
        log "Overwriting file $filename"
        echo "$file_contents" > "$filename"
    else
        log "Appending to $filename"
        echo "$file_contents" >> "$filename"
    fi
}

# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots
reboot_vm() {
    configure_selinux "true"
    (sleep 30 && log "rebooting vm now"; reboot) &
}

# log is a wrapper for echo that includes the function name
log() {
    local -r msg="${1:-"log message is empty"}"
    local -r stack_level="${2:-1}"
    echo "${FUNCNAME[${stack_level}]}: ${msg}"
}

# abort is a wrapper for log that exits with an error code
abort() {
    local -ri origin_stacklevel=2
    log "${1}" "$origin_stacklevel"
    exit 1
}

export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}"

main
')))]" } } } diff --git a/pkg/deploy/generator/scripts/gatewayVMSS.sh b/pkg/deploy/generator/scripts/gatewayVMSS.sh index 4034eed3675..613adc8d5e3 100644 --- a/pkg/deploy/generator/scripts/gatewayVMSS.sh +++ b/pkg/deploy/generator/scripts/gatewayVMSS.sh @@ -148,7 +148,8 @@ mkdir -p /etc/containers/ touch /etc/containers/nodocker mkdir -p /root/.docker -REGISTRY_AUTH_FILE=/root/.docker/config.json az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" +REGISTRY_AUTH_FILE="/root/.docker/config.json" +az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" docker pull "$MDMIMAGE" diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 0677589931f..a2704b10406 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -1,7 +1,7 @@ #!/bin/bash set -o errexit \ - -o nounset \ + -o nounset trap 'catch' ERR @@ -11,9 +11,10 @@ main() { configure_disk_partitions configure_logrotate configure_selinux - journal_dir="/var/log/journal" - mkdir -p "$journal_dir" + + mkdir -p /var/log/journal mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store + configure_firewalld_rules pull_container_images configure_system_services @@ -134,10 +135,8 @@ configure_disk_partitions() { # configure_logrotate clobbers /etc/logrotate.conf configure_logrotate() { - local logrotate_conf_file="/etc/logrotate.conf" - log "Writing over $logrotate_conf_file" -cat >"$logrotate_conf_file" <<'EOF' -# see "man logrotate" for details + local -r logrotate_conf_filename='/etc/logrotate.conf' + local -r logrotate_conf_file='# see "man logrotate" for details # rotate log files weekly weekly @@ -156,7 +155,7 @@ compress # RPM packages drop log rotation information into this directory include /etc/logrotate.d -# no packages own wtmp and btmp -- we'll rotate them here +# no packages own wtmp and btmp -- we will rotate them here /var/log/wtmp { monthly create 0664 root utmp @@ -169,16 +168,15 @@ include /etc/logrotate.d monthly create 0600 root utmp rotate 1 -} -EOF +}' + + write_file logrotate_conf_filename logrotate_conf_file true } # create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file create_azure_rpm_repos() { - local azure_repo_file="/etc/yum.repos.d/azure.repo" - log "Writing $azure_repo_file" -cat >"$azure_repo_file" <<'EOF' -[azure-cli] + local -r azure_repo_filename='/etc/yum.repos.d/azure.repo' + local -r azure_repo_file='[azure-cli] name=azure-cli baseurl=https://packages.microsoft.com/yumrepos/azure-cli enabled=yes @@ -188,8 +186,9 @@ gpgcheck=yes name=azurecore baseurl=https://packages.microsoft.com/yumrepos/azurecore enabled=yes -gpgcheck=no -EOF +gpgcheck=no' + + write_file azure_repo_filename azure_repo_file } # configure_selinux @@ -215,11 +214,11 @@ cat >"$diable_accept_ra_conf" <<'EOF' net.ipv6.conf.all.accept_ra=0 EOF - local -r disable_core="$prefix/01-disable-core.conf" - log "Writing $disable_core" -cat >"$disable_core" <<'EOF' -kernel.core_pattern = |/bin/true -EOF + local -r disable_core_filename="$prefix/01-disable-core.conf" + local -r disable_core_file="kernel.core_pattern = |/bin/true + " + write_file disable_core_filename disable_core_file + sysctl --system enable_ports=( @@ -248,7 +247,9 @@ pull_container_images() { touch /etc/containers/nodocker mkdir -p /root/.docker - REGISTRY_AUTH_FILE=/root/.docker/config.json az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" + local -r REGISTRY_AUTH_FILE="/root/.docker/config.json" + + az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" docker pull "$MDMIMAGE" @@ -307,12 +308,12 @@ configure_service_fluentbit() { mkdir -p /etc/fluentbit/ mkdir -p /var/lib/fluent -cat >/etc/fluentbit/fluentbit.conf <<'EOF' -[INPUT] - Name systemd - Tag journald - Systemd_Filter _COMM=aro - DB /var/lib/fluent/journaldb + local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf' + local -r fluentbit_conf_file="[INPUT] +Name systemd +Tag journald +Systemd_Filter _COMM=aro +DB /var/lib/fluent/journaldb [FILTER] Name modify @@ -340,17 +341,18 @@ cat >/etc/fluentbit/fluentbit.conf <<'EOF' [OUTPUT] Name forward Match * - Port 29230 -EOF + Port 29230" + + write_file fluentbit_conf_filename fluentbit_conf_file + + local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit' + local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE" + + write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file - local -r sysconfig_fluentbit="/etc/sysconfig/fluentbit" - log "Writing value FLUENTBITIMAGE=$FLUENTBITIMAGE to $sysconfig_fluentbit" - echo "FLUENTBITIMAGE=$FLUENTBITIMAGE" >"$sysconfig_fluentbit" + local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service' - fluentbit_service_file="/etc/systemd/system/fluentbit.service" - log "Writing $fluentbit_service_file now" -cat >"$fluentbit_service_file" <<'EOF' -[Unit] + local -r fluentbit_service_file="[Unit] After=network-online.target Wants=network-online.target StartLimitIntervalSec=0 @@ -380,8 +382,9 @@ RestartSec=5 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" + + write_file fluentbit_conf_filename fluentbit_conf_file } # configure_certs @@ -396,45 +399,41 @@ configure_certs() { # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not # to honour SSL_CERT_FILE any more, heaven only knows why. mkdir -p /usr/lib/ssl/certs - csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 {*} >/dev/null + csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null c_rehash /usr/lib/ssl/certs # we leave clientId blank as long as only 1 managed identity assigned to vmss # if we have more than 1, we will need to populate with clientId used for off-node scanning - nodescan_agent_file="/etc/default/vsa-nodescan-agent.config" - log "Writing $nodescan_agent_file" -cat >"$nodescan_agent_file" <"$sysconfig_mdm_file" <"$mdm_service_file"<<'EOF' -[Unit] + local -r mdm_service_filename="/etc/systemd/system/mdm.service" + local -r mdm_service_file="[Unit] After=network-online.target Wants=network-online.target @@ -465,28 +464,26 @@ RestartSec=1 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" + + write_file mdm_service_filename mdm_service_file } # configure_timers_mdm_mdsd configure_timers_mdm_mdsd() { for var in "mdsd" "mdm"; do - download_creds_service_file="/etc/systemd/system/download-$var-credentials.service" - log "Writing $download_creds_service_file" -cat >"$download_creds_service_file" <"$download_creds_timer_file"<"$download_creds_script_file" <"$watch_mdm_creds_service_file" <"$watch_mdm_creds_path_file" <"$arp_rp_config_file"<"$aro_rp_service_file" <<'EOF' -[Unit] + local -r aro_rp_service_filename='/etc/systemd/system/aro-rp.service' + local -r aro_rp_service_file="[Unit] After=network-online.target Wants=network-online.target @@ -694,28 +690,26 @@ RestartSec=1 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" + + write_file aro_rp_service_filename aro_rp_conf_file } # configure_service_aro_dbtoken configure_service_aro_dbtoken() { - local -r aro_dbtoken_service_config_file="/etc/sysconfig/aro-dbtoken" - log "Writing $aro_dbtoken_service_file" -cat >"$aro_dbtoken_service_file" <"$aro_dbtoken_service_config_file" <<'EOF' -[Unit] + local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service' + local -r aro_dbtoken_service_file="[Unit] After=network-online.target Wants=network-online.target @@ -746,18 +740,18 @@ RestartSec=1 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" + + write_file aro_dbtoken_service_filename aro_dbtoken_service_file } # configure_service_aro_monitor configure_service_aro_monitor() { - local -r aro_monitor_service_config="/etc/sysconfig/aro-monitor" log "configuring aro-monitor service" -# DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE -# are not used, but can't easily be refactored out. Should be revisited in the future. -cat >"$aro_monitor_service_config" <"$aro_monitor_service_file" <<'EOF' -[Unit] + local -r aro_monitor_service_filename='/etc/systemd/system/aro-monitor.service' + local -r aro_monitor_service_file="[Unit] After=network-online.target Wants=network-online.target @@ -813,16 +806,15 @@ RestartSec=1 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" + + write_file aro_monitor_service_filename aro_monitor_service_file } # configure_service_aro_portal configure_service_aro_portal() { - local -r aro_portal_service_config="/etc/sysconfig/aro-portal" - log "Writing $aro_portal_service_config" -cat >"$aro_portal_service_config" <"$aro_portal_service_file" <<'EOF' -[Unit] + write_file aro_portal_service_conf_filename aro_portal_service_conf_file + + local -r aro_portal_service_filename='/etc/systemd/system/aro-portal.service' + local -r aro_portal_service_file="[Unit] After=network-online.target Wants=network-online.target StartLimitInterval=0 @@ -868,27 +859,25 @@ Restart=always RestartSec=1 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" + + write_file aro_portal_service_conf_filename aro_portal_service_conf_file } # configure_service_mdsd configure_service_mdsd() { local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d" - log "Creating $mdsd_service_dir" mkdir "$mdsd_service_dir" - local -r mdsd_override_conf="$mdsd_service_dir/override.conf" - log "Writing $mdsd_override_conf" -cat >"$mdsd_override_conf" <<'EOF' -[Unit] -After=network-online.target -EOF - default_mdsd_file="/etc/default/mdsd" - log "Writing $default_mdsd_file" -cat >"$default_mdsd_file" < "$filename" + else + log "Appending to $filename" + echo "$file_contents" >> "$filename" + fi +} + # reboot_vm restores all selinux file contexts, waits 30 seconds then reboots reboot_vm() { configure_selinux "true" From 1e35003594dfdafba999fbb614af6b2bd3ef5419 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Thu, 11 Apr 2024 14:39:53 -0400 Subject: [PATCH 05/38] move packages to install and rpm keys to import into arrays This will make adding new packages and keys easier --- pkg/deploy/generator/scripts/rpVMSS.sh | 53 +++++++++++++++----------- 1 file changed, 31 insertions(+), 22 deletions(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index a2704b10406..45c11634ad5 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -58,8 +58,8 @@ configure_rhui_repo() { # dnf_update_pkgs dnf_update_pkgs() { - log "running dnf update" for attempt in {1..5}; do + log "running dnf update attempt #${attempt}" dnf -y \ -x WALinuxAgent \ -x WALinuxAgent-udev \ @@ -68,47 +68,56 @@ dnf_update_pkgs() { if [[ ${attempt} -lt 5 ]]; then sleep 10 else - return 1 + abort "Failed to update packages after ${attempt} attempts" fi done } # dnf_install_pkgs dnf_install_pkgs() { - log "importing rpm repositories" - rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 - rpm --import https://packages.microsoft.com/keys/microsoft.asc + local -ra repo_keys=( + https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 + https://packages.microsoft.com/keys/microsoft.asc + ) + # shellcheck disable=SC2068 for attempt in {1..5}; do - dnf -y \ - install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm \ - && break + for key in ${repo_keys[@]}; do + log "importing rpm repository key $key attempt #$attempt" + rpm --import "$key" + done if [[ ${attempt} -lt 5 ]]; then sleep 10 else - return 1 + abort "Failed to import rpm repository key $key after $attempt attempts" fi done + local -ra install_pkgs=( + install + clamav + azsec-clamav + azsec-monitor + azure-cli + azure-mdsd + azure-security + podman + podman-docker + openssl-perl + # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 + python3 + https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm + ) + for attempt in {1..5}; do + log "Installing packages ${install_pkgs[*]} attempt #$attempt" dnf -y \ - install \ - clamav \ - azsec-clamav \ - azsec-monitor \ - azure-cli \ - azure-mdsd \ - azure-security \ - podman \ - podman-docker \ - openssl-perl \ - python3 \ + "${install_pkgs[@]}" \ && break - # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 if [[ ${attempt} -lt 5 ]]; then sleep 10 else - abort "failed to install required packages" + abort "Failed to install packages ${install_pkgs[*]} after $attempt attempts" fi done } From eb62848828bd95874737673b41687b9f61a3e607 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Thu, 11 Apr 2024 15:50:31 -0400 Subject: [PATCH 06/38] Add retry loop for rpm repo key imports, remove erroneous package from install_pkgs array --- pkg/deploy/generator/scripts/rpVMSS.sh | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 45c11634ad5..8eaecbb8d69 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -84,7 +84,10 @@ dnf_install_pkgs() { for attempt in {1..5}; do for key in ${repo_keys[@]}; do log "importing rpm repository key $key attempt #$attempt" - rpm --import "$key" + rpm --import \ + -v \ + "$key" \ + && break done if [[ ${attempt} -lt 5 ]]; then sleep 10 @@ -94,7 +97,6 @@ dnf_install_pkgs() { done local -ra install_pkgs=( - install clamav azsec-clamav azsec-monitor @@ -111,7 +113,8 @@ dnf_install_pkgs() { for attempt in {1..5}; do log "Installing packages ${install_pkgs[*]} attempt #$attempt" - dnf -y \ + dnf install \ + -y \ "${install_pkgs[@]}" \ && break if [[ ${attempt} -lt 5 ]]; then From 104bb2ec980861f9126a23d9b4234b13d69c1835 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Thu, 11 Apr 2024 16:40:20 -0400 Subject: [PATCH 07/38] Pass dnf packages and rpm keys to function calls via nameref to allow reuse Editing the packages and keys passed will allow for easier modification later. This also allows for function reuse. --- pkg/deploy/generator/scripts/rpVMSS.sh | 132 ++++++++++++++----------- 1 file changed, 74 insertions(+), 58 deletions(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 8eaecbb8d69..c08656c2995 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -35,7 +35,34 @@ configure_and_install_dnf_pkgs_repos() { configure_rhui_repo create_azure_rpm_repos dnf_update_pkgs - dnf_install_pkgs + + local -ra rpm_keys=( + https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 + https://packages.microsoft.com/keys/microsoft.asc + ) + + rpm_import_keys rpm_keys + + local -ra repo_rpm_pkgs=( + https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm + ) + + local -ra install_pkgs=( + clamav + azsec-clamav + azsec-monitor + azure-cli + azure-mdsd + azure-security + podman + podman-docker + openssl-perl + # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 + python3 + ) + + dnf_install_pkgs repo_rpm_pkgs + dnf_install_pkgs install_pkgs } # configure_rhui_repo @@ -75,54 +102,43 @@ dnf_update_pkgs() { # dnf_install_pkgs dnf_install_pkgs() { - local -ra repo_keys=( - https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 - https://packages.microsoft.com/keys/microsoft.asc - ) + local -n pkgs="$1" + for attempt in {1..5}; do + log "Installing packages ${pkgs[*]} attempt #$attempt" + dnf -y \ + install \ + "${install_pkgs[@]}" \ + && break + if [[ ${attempt} -lt 5 ]]; then + sleep 10 + else + abort "Failed to install packages ${pkgs[*]} after $attempt attempts" + fi + done +} +# rpm_import_keys +rpm_import_keys() { + local -n keys="$1" # shellcheck disable=SC2068 - for attempt in {1..5}; do - for key in ${repo_keys[@]}; do + for key in ${keys[@]}; do + if [ ${#keys[@]} -eq 0 ]; then + break + fi + for attempt in {1..5}; do log "importing rpm repository key $key attempt #$attempt" rpm --import \ -v \ "$key" \ + && unset key \ && break done - if [[ ${attempt} -lt 5 ]]; then + if [ -z ${key+x} ] && [[ ${attempt} -lt 5 ]]; then sleep 10 else abort "Failed to import rpm repository key $key after $attempt attempts" fi done - - local -ra install_pkgs=( - clamav - azsec-clamav - azsec-monitor - azure-cli - azure-mdsd - azure-security - podman - podman-docker - openssl-perl - # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 - python3 - https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm - ) - - for attempt in {1..5}; do - log "Installing packages ${install_pkgs[*]} attempt #$attempt" - dnf install \ - -y \ - "${install_pkgs[@]}" \ - && break - if [[ ${attempt} -lt 5 ]]; then - sleep 10 - else - abort "Failed to install packages ${install_pkgs[*]} after $attempt attempts" - fi - done } # configure_disk_partitions @@ -229,7 +245,7 @@ EOF local -r disable_core_filename="$prefix/01-disable-core.conf" local -r disable_core_file="kernel.core_pattern = |/bin/true " - write_file disable_core_filename disable_core_file + write_file disable_core_filename disable_core_file true sysctl --system @@ -355,12 +371,12 @@ DB /var/lib/fluent/journaldb Match * Port 29230" - write_file fluentbit_conf_filename fluentbit_conf_file + write_file fluentbit_conf_filename fluentbit_conf_file true local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit' local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE" - write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file + write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service' @@ -396,7 +412,7 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target" - write_file fluentbit_conf_filename fluentbit_conf_file + write_file fluentbit_conf_filename fluentbit_conf_file true } # configure_certs @@ -427,7 +443,7 @@ configure_certs() { \"CommandDelay\": 0 }" - write_file nodescan_agent_filename nodescan_agent_file + write_file nodescan_agent_filename nodescan_agent_file true } # configure_service_mdm @@ -441,7 +457,7 @@ MDMSOURCEENVIRONMENT='$LOCATION' MDMSOURCEROLE=rp MDMSOURCEROLEINSTANCE=\"$(hostname)\"" - write_file sysconfig_mdm_filename sysconfig_mdm_file + write_file sysconfig_mdm_filename sysconfig_mdm_file true mkdir -p /var/etw local -r mdm_service_filename="/etc/systemd/system/mdm.service" @@ -478,7 +494,7 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target" - write_file mdm_service_filename mdm_service_file + write_file mdm_service_filename mdm_service_file true } # configure_timers_mdm_mdsd @@ -492,7 +508,7 @@ Description=Periodic $var credentials refresh Type=oneshot ExecStart=/usr/local/bin/download-credentials.sh $var" - write_file download_creds_service_filename download_creds_service_file + write_file download_creds_service_filename download_creds_service_file true local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer" local download_creds_timer_file="[Unit] @@ -508,7 +524,7 @@ AccuracySec=5s [Install] WantedBy=timers.target" - write_file download_creds_timer_filename download_creds_timer_file + write_file download_creds_timer_filename download_creds_timer_file true done local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh" @@ -581,7 +597,7 @@ else echo Failed to refresh certificate for \$COMPONENT && exit 1 fi" - write_file download_creds_script_filename download_creds_script_file + write_file download_creds_script_filename download_creds_script_file true chmod u+x /usr/local/bin/download-credentials.sh @@ -603,7 +619,7 @@ ExecStart=/usr/bin/systemctl restart mdm.service [Install] WantedBy=multi-user.target" - write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file + write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file true local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path' local -r watch_mdm_creds_path_file='[Path] @@ -612,7 +628,7 @@ PathModified=/etc/mdm.pem [Install] WantedBy=multi-user.target' - write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file + write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file true local -r watch_mdm_creds='watch-mdm-credentials.path' systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds" @@ -649,7 +665,7 @@ ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC='$CLUSTERDEFAULTINSTALLERPULLSPEC' ARO_ADOPT_BY_HIVE='$CLUSTERSADOPTBYHIVE' USE_CHECKACCESS='$USECHECKACCESS'" - write_file aro_rp_conf_filename aro_rp_conf_file + write_file aro_rp_conf_filename aro_rp_conf_file true local -r aro_rp_service_filename='/etc/systemd/system/aro-rp.service' local -r aro_rp_service_file="[Unit] @@ -704,7 +720,7 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target" - write_file aro_rp_service_filename aro_rp_conf_file + write_file aro_rp_service_filename aro_rp_conf_file true } # configure_service_aro_dbtoken @@ -718,7 +734,7 @@ MDM_ACCOUNT='$RPMDMACCOUNT' MDM_NAMESPACE=DBToken RPIMAGE='$RPIMAGE'" - write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file + write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file true local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service' local -r aro_dbtoken_service_file="[Unit] @@ -754,7 +770,7 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target" - write_file aro_dbtoken_service_filename aro_dbtoken_service_file + write_file aro_dbtoken_service_filename aro_dbtoken_service_file true } # configure_service_aro_monitor @@ -779,7 +795,7 @@ MDM_ACCOUNT='$RPMDMACCOUNT' MDM_NAMESPACE=BBM RPIMAGE='$RPIMAGE'" - write_file aro_monitor_service_conf_filename aro_monitor_service_conf_file + write_file aro_monitor_service_conf_filename aro_monitor_service_conf_file true local -r aro_monitor_service_filename='/etc/systemd/system/aro-monitor.service' local -r aro_monitor_service_file="[Unit] @@ -820,7 +836,7 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target" - write_file aro_monitor_service_filename aro_monitor_service_file + write_file aro_monitor_service_filename aro_monitor_service_file true } # configure_service_aro_portal @@ -836,7 +852,7 @@ MDM_NAMESPACE=Portal PORTAL_HOSTNAME='$LOCATION.admin.$RPPARENTDOMAINNAME' RPIMAGE='$RPIMAGE'" - write_file aro_portal_service_conf_filename aro_portal_service_conf_file + write_file aro_portal_service_conf_filename aro_portal_service_conf_file true local -r aro_portal_service_filename='/etc/systemd/system/aro-portal.service' local -r aro_portal_service_file="[Unit] @@ -873,7 +889,7 @@ RestartSec=1 [Install] WantedBy=multi-user.target" - write_file aro_portal_service_conf_filename aro_portal_service_conf_file + write_file aro_portal_service_conf_filename aro_portal_service_conf_file true } # configure_service_mdsd @@ -885,7 +901,7 @@ configure_service_mdsd() { local -r mdsd_override_conf_file="[Unit] After=network-online.target" - write_file mdsd_override_conf_filename mdsd_override_conf_file + write_file mdsd_override_conf_filename mdsd_override_conf_file true local -r default_mdsd_filename="/etc/default/mdsd" local -r default_mdsd_file="MDSD_ROLE_PREFIX=/var/run/mdsd/default @@ -906,7 +922,7 @@ export MONITORING_ROLE_INSTANCE=\"$(hostname)\" export MDSD_MSGPACK_SORT_COLUMNS=1\"" - write_file default_mdsd_filename default_mdsd_file + write_file default_mdsd_filename default_mdsd_file true } From 3643a06648d448f76ac6f90c9e54eacf49e7895f Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Fri, 12 Apr 2024 07:44:34 -0400 Subject: [PATCH 08/38] Add wait for all rpm related transactions to avoid rpm database corruption Add starting log message for each function call rpm database corruption has been seen in testing, and Prod deployments due to concurrent rpm database operations between rpm and dnf. wait is needed due to this. remove ERR trap, we aren't attempting to trap any specific errors yet. --- pkg/deploy/generator/scripts/rpVMSS.sh | 93 ++++++++++++++++++++------ 1 file changed, 74 insertions(+), 19 deletions(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index c08656c2995..e2ba4c71ee7 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -3,8 +3,6 @@ set -o errexit \ -o nounset -trap 'catch' ERR - main() { configure_sshd configure_and_install_dnf_pkgs_repos @@ -23,6 +21,7 @@ main() { # We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work configure_sshd() { + log "starting" log "setting ssh password authentication" sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config @@ -32,9 +31,16 @@ configure_sshd() { # configure_and_install_dnf_pkgs_repos configure_and_install_dnf_pkgs_repos() { + log "starting" configure_rhui_repo create_azure_rpm_repos - dnf_update_pkgs + + local -ar exclude_pkgs=( + "-x WALinuxAgent" + "-x WALinuxAgent-udev" + ) + + dnf_update_pkgs exclude_pkgs local -ra rpm_keys=( https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 @@ -67,35 +73,44 @@ configure_and_install_dnf_pkgs_repos() { # configure_rhui_repo configure_rhui_repo() { + log "starting" log "running RHUI package updates" + #Adding retry logic to yum commands in order to avoid stalling out on resource locks for attempt in {1..5}; do + log "attempt #${attempt} - running dnf update" dnf update \ -y \ --disablerepo='*' \ - --enablerepo='rhui-microsoft-azure*' \ - && break + --enablerepo='rhui-microsoft-azure*' & + + wait $! && break if [[ ${attempt} -lt 5 ]]; then sleep 10 else - abort "failed to run dnf update" + abort "attempt #${attempt} - Failed to update packages" fi done } # dnf_update_pkgs dnf_update_pkgs() { + local -n excludes="$1" + log "starting" + for attempt in {1..5}; do - log "running dnf update attempt #${attempt}" + log "attempt #${attempt} - running dnf update" + # shellcheck disable=SC2068 dnf -y \ - -x WALinuxAgent \ - -x WALinuxAgent-udev \ - update --allowerasing \ - && break + ${excludes[@]} \ + update \ + --allowerasing & + + wait $! && break if [[ ${attempt} -lt 5 ]]; then sleep 10 else - abort "Failed to update packages after ${attempt} attempts" + abort "attempt #${attempt} - Failed to update packages" fi done } @@ -103,16 +118,19 @@ dnf_update_pkgs() { # dnf_install_pkgs dnf_install_pkgs() { local -n pkgs="$1" + log "starting" + for attempt in {1..5}; do - log "Installing packages ${pkgs[*]} attempt #$attempt" + log "attempt #$attempt - Installing packages ${pkgs[*]}" dnf -y \ install \ - "${install_pkgs[@]}" \ - && break + "${pkgs[@]}" & + + wait $! && break if [[ ${attempt} -lt 5 ]]; then sleep 10 else - abort "Failed to install packages ${pkgs[*]} after $attempt attempts" + abort "attempt #${attempt} - Failed to install packages ${pkgs[*]}" fi done } @@ -120,13 +138,15 @@ dnf_install_pkgs() { # rpm_import_keys rpm_import_keys() { local -n keys="$1" + log "starting" + # shellcheck disable=SC2068 for key in ${keys[@]}; do if [ ${#keys[@]} -eq 0 ]; then break fi for attempt in {1..5}; do - log "importing rpm repository key $key attempt #$attempt" + log "attempt #$attempt - importing rpm repository key $key" rpm --import \ -v \ "$key" \ @@ -136,14 +156,16 @@ rpm_import_keys() { if [ -z ${key+x} ] && [[ ${attempt} -lt 5 ]]; then sleep 10 else - abort "Failed to import rpm repository key $key after $attempt attempts" + abort "attempt #${attempt} - Failed to import rpm repository key $key" fi done } # configure_disk_partitions configure_disk_partitions() { + log "starting" log "extending partition table" + # Linux block devices are inconsistently named # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here physicalDisk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" @@ -163,6 +185,8 @@ configure_disk_partitions() { # configure_logrotate clobbers /etc/logrotate.conf configure_logrotate() { + log "starting" + local -r logrotate_conf_filename='/etc/logrotate.conf' local -r logrotate_conf_file='# see "man logrotate" for details # rotate log files weekly @@ -203,6 +227,8 @@ include /etc/logrotate.d # create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file create_azure_rpm_repos() { + log "starting" + local -r azure_repo_filename='/etc/yum.repos.d/azure.repo' local -r azure_repo_file='[azure-cli] name=azure-cli @@ -216,11 +242,13 @@ baseurl=https://packages.microsoft.com/yumrepos/azurecore enabled=yes gpgcheck=no' - write_file azure_repo_filename azure_repo_file + write_file azure_repo_filename azure_repo_file true } # configure_selinux configure_selinux() { + log "starting" + local -r relabel="${1:-false}" already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined" @@ -234,6 +262,8 @@ configure_selinux() { # configure_firewalld_rules configure_firewalld_rules() { + log "starting" + # https://access.redhat.com/security/cve/cve-2020-13401 local -r prefix="/etc/sysctl.d" local -r diable_accept_ra_conf="$prefix/02-disable-accept-ra.conf" @@ -267,6 +297,8 @@ EOF # pull_container_images pull_container_images() { + log "starting" + echo "logging into prod acr" az login -i --allow-no-subscriptions @@ -309,6 +341,8 @@ configure_system_services() { # enable_aro_services enables all services required for aro rp enable_aro_services() { + log "starting" + local -ra aro_services=( "aro-dbtoken" "aro-monitor" @@ -332,7 +366,9 @@ enable_aro_services() { # configure_service_fluentbit configure_service_fluentbit() { + log "starting" log "configuring fluentbit service" + mkdir -p /etc/fluentbit/ mkdir -p /var/lib/fluent @@ -417,6 +453,8 @@ WantedBy=multi-user.target" # configure_certs configure_certs() { + log "starting" + mkdir /etc/aro-rp base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem if [[ -n "$ARMAPICABUNDLE" ]]; then @@ -448,6 +486,7 @@ configure_certs() { # configure_service_mdm configure_service_mdm() { + log "starting" log "configuring mdm service" local -r sysconfig_mdm_filename="/etc/sysconfig/mdm" @@ -499,6 +538,8 @@ WantedBy=multi-user.target" # configure_timers_mdm_mdsd configure_timers_mdm_mdsd() { + log "starting" + for var in "mdsd" "mdm"; do local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service" local download_creds_service_file="[Unit] @@ -637,6 +678,8 @@ WantedBy=multi-user.target' # configure_service_aro_rp configure_service_aro_rp() { + log "starting" + local -r aro_rp_conf_filename='/etc/sysconfig/aro-rp' local -r aro_rp_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID' ADMIN_API_CLIENT_CERT_COMMON_NAME='$ADMINAPICLIENTCERTCOMMONNAME' @@ -725,6 +768,8 @@ WantedBy=multi-user.target" # configure_service_aro_dbtoken configure_service_aro_dbtoken() { + log "starting" + local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken' local -r aro_dbtoken_service_conf_file="DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME' AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID' @@ -775,7 +820,9 @@ WantedBy=multi-user.target" # configure_service_aro_monitor configure_service_aro_monitor() { + log "starting" log "configuring aro-monitor service" + # DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE # are not used, but can't easily be refactored out. Should be revisited in the future. local -r aro_monitor_service_conf_filename='/etc/sysconfig/aro-monitor' @@ -841,6 +888,8 @@ WantedBy=multi-user.target" # configure_service_aro_portal configure_service_aro_portal() { + log "starting" + local -r aro_portal_service_conf_filename='/etc/sysconfig/aro-portal' local -r aro_portal_service_conf_file="AZURE_PORTAL_ACCESS_GROUP_IDS='$PORTALACCESSGROUPIDS' AZURE_PORTAL_CLIENT_ID='$PORTALCLIENTID' @@ -894,6 +943,8 @@ WantedBy=multi-user.target" # configure_service_mdsd configure_service_mdsd() { + log "starting" + local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d" mkdir "$mdsd_service_dir" @@ -928,6 +979,8 @@ export MDSD_MSGPACK_SORT_COLUMNS=1\"" # run_azsecd_config_scan run_azsecd_config_scan() { + log "starting" + local -ar configs=( "baseline" "clamav" @@ -963,6 +1016,8 @@ write_file() { # reboot_vm restores all selinux file contexts, waits 30 seconds then reboots reboot_vm() { + log "starting" + configure_selinux "true" (sleep 30 && log "rebooting vm now"; reboot) & } From 23f1a336c9034cbd08a9db9d1411e58730bc698f Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Mon, 15 Apr 2024 10:25:41 -0400 Subject: [PATCH 09/38] Increase dnf & rpm retry time to 1 minute, 5 minutes total Pass wait time as a nameref variable to allow easier modification --- pkg/deploy/generator/scripts/rpVMSS.sh | 28 +++++++++++++++++--------- 1 file changed, 18 insertions(+), 10 deletions(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index e2ba4c71ee7..dc536ba6f5c 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -32,8 +32,11 @@ configure_sshd() { # configure_and_install_dnf_pkgs_repos configure_and_install_dnf_pkgs_repos() { log "starting" - configure_rhui_repo - create_azure_rpm_repos + + # transaction attempt retry time in seconds + local -ri retry_wait_time=60 + configure_rhui_repo retry_wait_time + create_azure_rpm_repos retry_wait_time local -ar exclude_pkgs=( "-x WALinuxAgent" @@ -67,12 +70,13 @@ configure_and_install_dnf_pkgs_repos() { python3 ) - dnf_install_pkgs repo_rpm_pkgs - dnf_install_pkgs install_pkgs + dnf_install_pkgs repo_rpm_pkgs retry_wait_time + dnf_install_pkgs install_pkgs retry_wait_time } # configure_rhui_repo configure_rhui_repo() { + local -n wait_time="$1" log "starting" log "running RHUI package updates" @@ -86,7 +90,7 @@ configure_rhui_repo() { wait $! && break if [[ ${attempt} -lt 5 ]]; then - sleep 10 + sleep "$wait_time" else abort "attempt #${attempt} - Failed to update packages" fi @@ -96,6 +100,7 @@ configure_rhui_repo() { # dnf_update_pkgs dnf_update_pkgs() { local -n excludes="$1" + local -n wait_time="$2" log "starting" for attempt in {1..5}; do @@ -108,7 +113,7 @@ dnf_update_pkgs() { wait $! && break if [[ ${attempt} -lt 5 ]]; then - sleep 10 + sleep "$wait_time" else abort "attempt #${attempt} - Failed to update packages" fi @@ -118,6 +123,7 @@ dnf_update_pkgs() { # dnf_install_pkgs dnf_install_pkgs() { local -n pkgs="$1" + local -n wait_time="$2" log "starting" for attempt in {1..5}; do @@ -128,7 +134,7 @@ dnf_install_pkgs() { wait $! && break if [[ ${attempt} -lt 5 ]]; then - sleep 10 + sleep "$wait_time" else abort "attempt #${attempt} - Failed to install packages ${pkgs[*]}" fi @@ -138,6 +144,7 @@ dnf_install_pkgs() { # rpm_import_keys rpm_import_keys() { local -n keys="$1" + local -n wait_time="$2" log "starting" # shellcheck disable=SC2068 @@ -150,11 +157,12 @@ rpm_import_keys() { rpm --import \ -v \ "$key" \ - && unset key \ - && break + && unset key + + wait $! && break done if [ -z ${key+x} ] && [[ ${attempt} -lt 5 ]]; then - sleep 10 + sleep "$wait_time" else abort "attempt #${attempt} - Failed to import rpm repository key $key" fi From 0b8104f9b514e79dd53c7f9015b34e57104831a3 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Mon, 15 Apr 2024 11:54:06 -0400 Subject: [PATCH 10/38] Add parse_run_options to run individual steps for testing --- pkg/deploy/generator/scripts/rpVMSS.sh | 67 ++++++++++++++++++++++++-- 1 file changed, 64 insertions(+), 3 deletions(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index dc536ba6f5c..d854c93a5fd 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -3,7 +3,14 @@ set -o errexit \ -o nounset +if [ "${DEBUG:-false}" == true ]; then + set -x +fi + main() { + parse_run_options "$@" + + configure_sshd configure_and_install_dnf_pkgs_repos configure_disk_partitions @@ -19,6 +26,59 @@ main() { reboot_vm } +parse_run_options() { + local -a options=("$1") + if [ "${#options[@]}" -eq 0 ]; then + log "Running all steps" + return 0 + fi + + local OPTIND + + while getopts "dplsrfui" options; do + case "${options}" in + d) + log "Running step configure_disk_partitions" + configure_disk_partitions + ;; + p) + log "Running step configure_and_install_dnf_pkgs_repos" + configure_and_install_dnf_pkgs_repos + ;; + l) + log "Running configure_logrotate" + configure_logrotate + ;; + s) + log "Running configure_selinux" + configure_selinux + ;; + r) + log "Running configure_sshd" + configure_sshd + ;; + f) + log "Running configure_firewalld_rules" + configure_firewalld_rules + ;; + u) + log "Running pull_container_images & configure_system_services" + pull_container_images + configure_system_services + ;; + i) + log "Running pull_container_images" + pull_container_images + ;; + *) + abort "Unkown option" + ;; + esac + done + + exit 0 +} + # We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work configure_sshd() { log "starting" @@ -43,14 +103,14 @@ configure_and_install_dnf_pkgs_repos() { "-x WALinuxAgent-udev" ) - dnf_update_pkgs exclude_pkgs + dnf_update_pkgs exclude_pkgs retry_wait_time local -ra rpm_keys=( https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 https://packages.microsoft.com/keys/microsoft.asc ) - rpm_import_keys rpm_keys + rpm_import_keys rpm_keys retry_wait_time local -ra repo_rpm_pkgs=( https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm @@ -1041,9 +1101,10 @@ log() { abort() { local -ri origin_stacklevel=2 log "${1}" "$origin_stacklevel" + log "Exiting" exit 1 } export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}" -main +main "$@" From fd6b96e4a5a55c3713fb5d93fc0e44ce07d300b1 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Mon, 15 Apr 2024 12:17:06 -0400 Subject: [PATCH 11/38] Add usage statement --- pkg/deploy/generator/scripts/rpVMSS.sh | 20 +++++++++++++++++++- 1 file changed, 19 insertions(+), 1 deletion(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index d854c93a5fd..4965a17393a 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -26,6 +26,23 @@ main() { reboot_vm } +usage() { + log "$(basename "$0") [-dplsrfui] + -d Configure Disk Partitions + -p Configure rpm repositories, import required rpm keys, update & install packages with dnf + -l Configure logrotate.conf + -s Make selinux modifications required for ARO RP + -r Configure sshd - Allow password authenticaiton + -f Configure firewalld default zone rules + -u Pull container images and configure systemd unit files for ARO RP + -i Pull container images + " +} + +# parse_run_options takes all arguements passed to main and parses them +# allowing individual step(s) to be ran, rather than all steps +# +# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline parse_run_options() { local -a options=("$1") if [ "${#options[@]}" -eq 0 ]; then @@ -71,7 +88,8 @@ parse_run_options() { pull_container_images ;; *) - abort "Unkown option" + usage + abort "Unkown option provided" ;; esac done From 051f6335e7b33d78e74f9fa3ccc682446eef51b3 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Mon, 15 Apr 2024 14:18:34 -0400 Subject: [PATCH 12/38] Add az login -i comment found in gatewayVMSS.sh, change variable syntex to snake case for consistency --- pkg/deploy/generator/scripts/rpVMSS.sh | 11 +++++++++-- 1 file changed, 9 insertions(+), 2 deletions(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 4965a17393a..2198ae2103c 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -254,8 +254,8 @@ configure_disk_partitions() { # Linux block devices are inconsistently named # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here - physicalDisk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" - growpart "$physicalDisk" 2 + physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" + growpart "$physical_disk" 2 log "extending filesystems" log "extending root lvm" @@ -386,6 +386,13 @@ pull_container_images() { log "starting" echo "logging into prod acr" + + # The managed identity that the VM runs as only has a single roleassignment. + # This role assignment is ACRPull which is not necessarily present in the + # subscription we're deploying into. If the identity does not have any + # role assignments scoped on the subscription we're deploying into, it will + # not show on az login -i, which is why the below line is commented. + # az account set -s "$SUBSCRIPTIONID" az login -i --allow-no-subscriptions # Suppress emulation output for podman instead of docker for az acr compatability From 15f71f9d42e6898a100a6115fcc0e851f75a01d3 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Mon, 15 Apr 2024 14:19:49 -0400 Subject: [PATCH 13/38] Port changes made in rpVMSS.sh to gatewayVMSS.sh Make gateway log directory to be passed in to functions where it is needed, this allows the value to be set in one location. Move retry steps into a single retry function call This is to reduce code duplication Move configure_fiewall_rules file creation to use write_file Correct accept_ra_conf variable name spelling --- pkg/deploy/generator/scripts/gatewayVMSS.sh | 1028 ++++++++++++++----- pkg/deploy/generator/scripts/rpVMSS.sh | 112 +- 2 files changed, 814 insertions(+), 326 deletions(-) diff --git a/pkg/deploy/generator/scripts/gatewayVMSS.sh b/pkg/deploy/generator/scripts/gatewayVMSS.sh index 613adc8d5e3..3751446891e 100644 --- a/pkg/deploy/generator/scripts/gatewayVMSS.sh +++ b/pkg/deploy/generator/scripts/gatewayVMSS.sh @@ -1,52 +1,276 @@ #!/bin/bash -echo "setting ssh password authentication" -# We need to manually set PasswordAuthentication to true in order for the VMSS Access JIT to work -sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config -systemctl reload sshd.service +set -o errexit \ + -o nounset -#Adding retry logic to yum commands in order to avoid stalling out on resource locks -echo "running RHUI fix" -for attempt in {1..5}; do - yum update -y --disablerepo='*' --enablerepo='rhui-microsoft-azure*' && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +if [ "${DEBUG:-false}" == true ]; then + set -x +fi -echo "running yum update" -for attempt in {1..5}; do - yum -y -x WALinuxAgent -x WALinuxAgent-udev update --allowerasing && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +main() { + local -r gateway_logdir='/var/log/aro-gateway' + parse_run_options "$@" gateway_logdir -echo "extending partition table" -# Linux block devices are inconsistently named -# it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here -physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" -growpart "$physical_disk" 2 -echo "extending filesystems" -lvextend -l +20%FREE /dev/rootvg/rootlv -xfs_growfs / + configure_sshd + configure_and_install_dnf_pkgs_repos + configure_disk_partitions + configure_logrotate gateway_logdir + configure_selinux -lvextend -l +100%FREE /dev/rootvg/varlv -xfs_growfs /var + mkdir -p /var/log/journal + mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store -rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 -rpm --import https://packages.microsoft.com/keys/microsoft.asc + configure_firewalld_rules + pull_container_images + configure_system_services gateway_logdir + reboot_vm +} -for attempt in {1..5}; do - yum -y install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +usage() { + log "$(basename "$0") [-dplsrfui] + -d Configure Disk Partitions + -p Configure rpm repositories, import required rpm keys, update & install packages with dnf + -l Configure logrotate.conf + -s Make selinux modifications required for ARO RP + -r Configure sshd - Allow password authenticaiton + -f Configure firewalld default zone rules + -u Pull container images and configure systemd unit files for ARO RP + -i Pull container images + " +} + +# parse_run_options takes all arguements passed to main and parses them +# allowing individual step(s) to be ran, rather than all steps +# +# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline +parse_run_options() { + local -a options=("$1") + if [ "${#options[@]}" -eq 0 ]; then + log "Running all steps" + return 0 + fi + + local OPTIND + + while getopts "dplsrfui" options; do + case "${options}" in + d) + log "Running step configure_disk_partitions" + configure_disk_partitions + ;; + p) + log "Running step configure_and_install_dnf_pkgs_repos" + configure_and_install_dnf_pkgs_repos + ;; + l) + log "Running configure_logrotate" + configure_logrotate "$2" + ;; + s) + log "Running configure_selinux" + configure_selinux + ;; + r) + log "Running configure_sshd" + configure_sshd + ;; + f) + log "Running configure_firewalld_rules" + configure_firewalld_rules + ;; + u) + log "Running pull_container_images & configure_system_services" + configure_system_services "$2" + ;; + i) + log "Running pull_container_images" + pull_container_images + ;; + *) + usage + abort "Unkown option provided" + ;; + esac + done + + exit 0 +} + +# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work +configure_sshd() { + log "starting" + log "setting ssh password authentication" + sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config + + systemctl reload sshd.service + systemctl is-active --quiet sshd || abort "sshd failed to reload" +} + +# configure_and_install_dnf_pkgs_repos +configure_and_install_dnf_pkgs_repos() { + log "starting" + + # transaction attempt retry time in seconds + local -ri retry_wait_time=60 + configure_rhui_repo retry_wait_time + create_azure_rpm_repos retry_wait_time + + local -ar exclude_pkgs=( + "-x WALinuxAgent" + "-x WALinuxAgent-udev" + ) + + dnf_update_pkgs exclude_pkgs retry_wait_time + + local -ra rpm_keys=( + https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 + https://packages.microsoft.com/keys/microsoft.asc + ) + + rpm_import_keys rpm_keys retry_wait_time + + local -ra repo_rpm_pkgs=( + https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm + ) + + local -ra install_pkgs=( + clamav + azsec-clamav + azsec-monitor + azure-cli + azure-mdsd + azure-security + podman + podman-docker + openssl-perl + # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 + python3 + ) + + dnf_install_pkgs repo_rpm_pkgs retry_wait_time + dnf_install_pkgs install_pkgs retry_wait_time +} + +# configure_rhui_repo +configure_rhui_repo() { + log "starting" + + local -ra cmd=( + dnf + update + -y + --disablerepo='*' + --enablerepo='rhui-microsoft-azure*' + ) + + log "running RHUI package updates" + retry cmd "$1" +} + +# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks +retry() { + local -n cmd_retry="$1" + local -n wait_time="$2" + + for attempt in {1..5}; do + log "attempt #${attempt} - ${FUNCNAME[2]}" + ${cmd_retry[@]} & + + wait $! && break + if [[ ${attempt} -lt 5 ]]; then + sleep "$wait_time" + else + abort "attempt #${attempt} - Failed to update packages" + fi + done +} + +# dnf_update_pkgs +dnf_update_pkgs() { + local -n excludes="$1" + log "starting" + + local -ra cmd=( + dnf + -y + ${excludes[@]} + update + --allowerasing + ) + + log "Updating all packages" + retry cmd "$2" +} + +# dnf_install_pkgs +dnf_install_pkgs() { + local -n pkgs="$1" + log "starting" + + local -ra cmd=( + dnf + -y + install + ${pkgs[@]} + ) + + log "Attempting to install packages: ${pkgs[*]}" + retry cmd "$2" +} + +# rpm_import_keys +rpm_import_keys() { + local -n keys="$1" + log "starting" + + + # shellcheck disable=SC2068 + for key in ${keys[@]}; do + if [ ${#keys[@]} -eq 0 ]; then + break + fi + local -a cmd=( + rpm + --import + -v + "$key" + ) + + log "attempt #$attempt - importing rpm repository key $key" + retry cmd "$2" && unset key + done +} -echo "configuring logrotate" +# configure_disk_partitions +configure_disk_partitions() { + log "starting" + log "extending partition table" + + # Linux block devices are inconsistently named + # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here + physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" + growpart "$physical_disk" 2 + + log "extending filesystems" + log "extending root lvm" + lvextend -l +20%FREE /dev/rootvg/rootlv + log "growing root filesystem" + xfs_growfs / + + log "extending var lvm" + lvextend -l +100%FREE /dev/rootvg/varlv + log "growing var filesystem" + xfs_growfs /var +} -# gateway_logdir is a readonly variable that specifies the host path mount point for the gateway container log file -# for the purpose of rotating the gateway logs -declare -r gateway_logdir='/var/log/aro-gateway' +# configure_logrotate clobbers /etc/logrotate.conf +configure_logrotate() { + local -n log_dir="$1" + log "starting" -cat >/etc/logrotate.conf </etc/yum.repos.d/azure.repo <<'EOF' -[azure-cli] +# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file +create_azure_rpm_repos() { + log "starting" + + local -r azure_repo_filename='/etc/yum.repos.d/azure.repo' + local -r azure_repo_file='[azure-cli] name=azure-cli baseurl=https://packages.microsoft.com/yumrepos/azure-cli enabled=yes @@ -105,69 +334,144 @@ gpgcheck=yes name=azurecore baseurl=https://packages.microsoft.com/yumrepos/azurecore enabled=yes -gpgcheck=no -EOF +gpgcheck=no' -semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" -mkdir -p /var/log/journal + write_file azure_repo_filename azure_repo_file true +} -for attempt in {1..5}; do - yum -y install clamav azsec-clamav azsec-monitor azure-cli azure-mdsd azure-security podman-docker openssl-perl python3 && break - # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +# configure_selinux +configure_selinux() { + log "starting" + + local -r relabel="${1:-false}" + + already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined" + semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error" + chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent + + if "$relabel"; then + restorecon -RF /var/log/* || log "$already_defined_ignore_error" + fi +} + +# configure_firewalld_rules +configure_firewalld_rules() { + log "starting" + + # https://access.redhat.com/security/cve/cve-2020-13401 + local -r prefix="/etc/sysctl.d" + local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf" + local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0" + + write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true + + local -r disable_core_filename="$prefix/01-disable-core.conf" + local -r disable_core_file="kernel.core_pattern = |/bin/true + " + write_file disable_core_filename disable_core_file true + + sysctl --system + + enable_ports=( + "443/tcp" + "444/tcp" + "445/tcp" + "2222/tcp" + ) + log "Enabling ports ${enable_ports[*]} on default firewalld zone" + # shellcheck disable=SC2068 + for port in ${enable_ports[@]}; do + log "Enabling port $port now" + firewall-cmd "--add-port=$port" + done + + firewall-cmd --runtime-to-permanent +} + +# pull_container_images +pull_container_images() { + log "starting" + + echo "logging into prod acr" -echo "applying firewall rules" -# https://access.redhat.com/security/cve/cve-2020-13401 -cat >/etc/sysctl.d/02-disable-accept-ra.conf <<'EOF' -net.ipv6.conf.all.accept_ra=0 -EOF - -cat >/etc/sysctl.d/01-disable-core.conf <<'EOF' -kernel.core_pattern = |/bin/true -EOF -sysctl --system - -firewall-cmd --add-port=80/tcp --permanent -firewall-cmd --add-port=8081/tcp --permanent -firewall-cmd --add-port=443/tcp --permanent - -echo "logging into prod acr" -export AZURE_CLOUD_NAME=$AZURECLOUDNAME -az login -i --allow-no-subscriptions - -# The managed identity that the VM runs as only has a single roleassignment. -# This role assignment is ACRPull which is not necessarily present in the -# subscription we're deploying into. If the identity does not have any -# role assignments scoped on the subscription we're deploying into, it will -# not show on az login -i, which is why the below line is commented. -# az account set -s "$SUBSCRIPTIONID" - -# Suppress emulation output for podman instead of docker for az acr compatability -mkdir -p /etc/containers/ -touch /etc/containers/nodocker - -mkdir -p /root/.docker -REGISTRY_AUTH_FILE="/root/.docker/config.json" -az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" - -MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" -docker pull "$MDMIMAGE" -docker pull "$RPIMAGE" -docker pull "$FLUENTBITIMAGE" - -az logout - -echo "configuring fluentbit service" -mkdir -p /etc/fluentbit/ -mkdir -p /var/lib/fluent - -cat >/etc/fluentbit/fluentbit.conf <<'EOF' -[INPUT] - Name systemd - Tag journald - Systemd_Filter _COMM=aro - DB /var/lib/fluent/journaldb + # The managed identity that the VM runs as only has a single roleassignment. + # This role assignment is ACRPull which is not necessarily present in the + # subscription we're deploying into. If the identity does not have any + # role assignments scoped on the subscription we're deploying into, it will + # not show on az login -i, which is why the below line is commented. + # az account set -s "$SUBSCRIPTIONID" + az login -i --allow-no-subscriptions + + # Suppress emulation output for podman instead of docker for az acr compatability + mkdir -p /etc/containers/ + touch /etc/containers/nodocker + + mkdir -p /root/.docker + local -r REGISTRY_AUTH_FILE="/root/.docker/config.json" + + az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" + + MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" + docker pull "$MDMIMAGE" + docker pull "$RPIMAGE" + docker pull "$FLUENTBITIMAGE" + + az logout +} + +# configure_system_services creates, configures, and enables the following systemd services and timers +# services +# fluentbit +# mdm +# mdsd +# arp-rp +# aro-dbtoken +# aro-monitor +# aro-portal +configure_system_services() { + configure_service_fluentbit + configure_service_mdm + configure_timers_mdm_mdsd + configure_service_aro_gateway "$1" + configure_service_mdsd +} + +# enable_aro_services enables all services required for aro rp +enable_aro_services() { + log "starting" + + local -ra aro_services=( + aro-gateway + auoms + azsecd + azsecmond + mdsd + mdm + chronyd + fluentbit + ) + log "enabling gateway services ${aro_services[*]}" + # shellcheck disable=SC2068 + for service in ${aro_services[@]}; do + log "Enabling $service now" + systemctl enable "$service.service" + done +} + +# configure_service_fluentbit +configure_service_fluentbit() { + log "starting" + log "configuring fluentbit service" + + mkdir -p /etc/fluentbit/ + mkdir -p /var/lib/fluent + + local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf' + local -r fluentbit_conf_file="[INPUT] +Name systemd +Tag journald +Systemd_Filter _COMM=aro +DB /var/lib/fluent/journaldb [FILTER] Name modify @@ -178,13 +482,18 @@ cat >/etc/fluentbit/fluentbit.conf <<'EOF' [OUTPUT] Name forward Match * - Port 29230 -EOF + Port 29230" + + write_file fluentbit_conf_filename fluentbit_conf_file true + + local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit' + local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE" + + write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true -echo "FLUENTBITIMAGE=$FLUENTBITIMAGE" >/etc/sysconfig/fluentbit + local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service' -cat >/etc/systemd/system/fluentbit.service <<'EOF' -[Unit] + local -r fluentbit_service_file="[Unit] After=network-online.target Wants=network-online.target StartLimitIntervalSec=0 @@ -214,21 +523,61 @@ RestartSec=5 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" + + write_file fluentbit_conf_filename fluentbit_conf_file true +} + +# configure_certs +configure_certs() { + log "starting" + + mkdir /etc/aro-rp + base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem + if [[ -n "$ARMAPICABUNDLE" ]]; then + base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem + fi + chown -R 1000:1000 /etc/aro-rp + + # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not + # to honour SSL_CERT_FILE any more, heaven only knows why. + mkdir -p /usr/lib/ssl/certs + csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null + c_rehash /usr/lib/ssl/certs + +# we leave clientId blank as long as only 1 managed identity assigned to vmss +# if we have more than 1, we will need to populate with clientId used for off-node scanning + local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config" + local -r nodescan_agent_file="{ + \"Nice\": 19, + \"Timeout\": 10800, + \"ClientId\": \"\", + \"TenantId\": $AZURESECPACKVSATENANTID, + \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL, + \"ProcessTimeout\": 300, + \"CommandDelay\": 0 + }" + + write_file nodescan_agent_filename nodescan_agent_file true +} + +# configure_service_mdm +configure_service_mdm() { + log "starting" + log "configuring mdm service" -echo "configuring mdm service" -cat >/etc/sysconfig/mdm </etc/systemd/system/mdm.service <<'EOF' -[Unit] + write_file sysconfig_mdm_filename sysconfig_mdm_file true + + mkdir -p /var/etw + local -r mdm_service_filename="/etc/systemd/system/mdm.service" + local -r mdm_service_file="[Unit] After=network-online.target Wants=network-online.target @@ -259,80 +608,28 @@ RestartSec=1 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF - -echo "configuring aro-gateway service" -cat >/etc/sysconfig/aro-gateway </etc/systemd/system/aro-gateway.service </etc/systemd/system/download-$var-credentials.service </etc/systemd/system/download-$var-credentials.timer </usr/local/bin/download-credentials.sh </etc/systemd/system/watch-mdm-credentials.service </etc/systemd/system/watch-mdm-credentials.path </etc/systemd/system/mdsd.service.d/override.conf <<'EOF' -[Unit] + local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service' + local -r aro_dbtoken_service_file="[Unit] After=network-online.target -EOF +Wants=network-online.target + +[Service] +EnvironmentFile=/etc/sysconfig/aro-gateway +ExecStartPre=-/usr/bin/docker rm -f %N +ExecStartPre=/usr/bin/mkdir -p ${gateway_logdir} +ExecStart=/usr/bin/docker run \ + --hostname %H \ + --name %N \ + --rm \ + --cap-drop net_raw \ + -e ACR_RESOURCE_ID \ + -e DATABASE_ACCOUNT_NAME \ + -e AZURE_DBTOKEN_CLIENT_ID \ + -e DBTOKEN_URL \ + -e GATEWAY_DOMAINS \ + -e GATEWAY_FEATURES \ + -e MDM_ACCOUNT \ + -e MDM_NAMESPACE \ + -m 2g \ + -p 80:8080 \ + -p 8081:8081 \ + -p 443:8443 \ + -v /run/systemd/journal:/run/systemd/journal \ + -v /var/etw:/var/etw:z \ + -v ${gateway_logdir}:/ctr.log:z \ + \$RPIMAGE \ + gateway +ExecStop=/usr/bin/docker stop -t 3600 %N +TimeoutStopSec=3600 +Restart=always +RestartSec=1 +StartLimitInterval=0 + +[Install] +WantedBy=multi-user.target" + + write_file aro_dbtoken_service_filename aro_dbtoken_service_file true +} + +# configure_service_mdsd +configure_service_mdsd() { + log "starting" + + local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d" + mkdir "$mdsd_service_dir" + + local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf" + local -r mdsd_override_conf_file="[Unit] +After=network-online.target" -cat >/etc/default/mdsd </dev/null -c_rehash /usr/lib/ssl/certs + write_file default_mdsd_filename default_mdsd_file true -# we leave clientId blank as long as only 1 managed identity assigned to vmss -# if we have more than 1, we will need to populate with clientId used for off-node scanning -cat >/etc/default/vsa-nodescan-agent.config < "$filename" + else + log "Appending to $filename" + echo "$file_contents" >> "$filename" + fi +} + +# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots +reboot_vm() { + log "starting" + + configure_selinux "true" + (sleep 30 && log "rebooting vm now"; reboot) & +} + +# log is a wrapper for echo that includes the function name +log() { + local -r msg="${1:-"log message is empty"}" + local -r stack_level="${2:-1}" + echo "${FUNCNAME[${stack_level}]}: ${msg}" +} + +# abort is a wrapper for log that exits with an error code +abort() { + local -ri origin_stacklevel=2 + log "${1}" "$origin_stacklevel" + log "Exiting" + exit 1 +} + +export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}" -echo "rebooting" -restorecon -RF /var/log/* -(sleep 30; reboot) & +main "$@" diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 2198ae2103c..f978ef2e00a 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -154,19 +154,30 @@ configure_and_install_dnf_pkgs_repos() { # configure_rhui_repo configure_rhui_repo() { - local -n wait_time="$1" log "starting" + + local -ra cmd=( + dnf + update + -y + --disablerepo='*' + --enablerepo='rhui-microsoft-azure*' + ) + log "running RHUI package updates" + retry cmd "$1" +} + +# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks +retry() { + local -n cmd_retry="$1" + local -n wait_time="$2" - #Adding retry logic to yum commands in order to avoid stalling out on resource locks for attempt in {1..5}; do - log "attempt #${attempt} - running dnf update" - dnf update \ - -y \ - --disablerepo='*' \ - --enablerepo='rhui-microsoft-azure*' & + log "attempt #${attempt} - ${FUNCNAME[2]}" + ${cmd_retry[@]} & - wait $! && break + wait $! && break if [[ ${attempt} -lt 5 ]]; then sleep "$wait_time" else @@ -178,72 +189,56 @@ configure_rhui_repo() { # dnf_update_pkgs dnf_update_pkgs() { local -n excludes="$1" - local -n wait_time="$2" log "starting" - for attempt in {1..5}; do - log "attempt #${attempt} - running dnf update" - # shellcheck disable=SC2068 - dnf -y \ - ${excludes[@]} \ - update \ - --allowerasing & - - wait $! && break - if [[ ${attempt} -lt 5 ]]; then - sleep "$wait_time" - else - abort "attempt #${attempt} - Failed to update packages" - fi - done + local -ra cmd=( + dnf + -y + ${excludes[@]} + update + --allowerasing + ) + + log "Updating all packages" + retry cmd "$2" } # dnf_install_pkgs dnf_install_pkgs() { local -n pkgs="$1" - local -n wait_time="$2" log "starting" - for attempt in {1..5}; do - log "attempt #$attempt - Installing packages ${pkgs[*]}" - dnf -y \ - install \ - "${pkgs[@]}" & + local -ra cmd=( + dnf + -y + install + ${pkgs[@]} + ) - wait $! && break - if [[ ${attempt} -lt 5 ]]; then - sleep "$wait_time" - else - abort "attempt #${attempt} - Failed to install packages ${pkgs[*]}" - fi - done + log "Attempting to install packages: ${pkgs[*]}" + retry cmd "$2" } # rpm_import_keys rpm_import_keys() { local -n keys="$1" - local -n wait_time="$2" log "starting" + # shellcheck disable=SC2068 for key in ${keys[@]}; do - if [ ${#keys[@]} -eq 0 ]; then - break - fi - for attempt in {1..5}; do - log "attempt #$attempt - importing rpm repository key $key" - rpm --import \ - -v \ - "$key" \ - && unset key - - wait $! && break - done - if [ -z ${key+x} ] && [[ ${attempt} -lt 5 ]]; then - sleep "$wait_time" - else - abort "attempt #${attempt} - Failed to import rpm repository key $key" + if [ ${#keys[@]} -eq 0 ]; then + break fi + local -a cmd=( + rpm + --import + -v + "$key" + ) + + log "attempt #$attempt - importing rpm repository key $key" + retry cmd "$2" && unset key done } @@ -352,11 +347,10 @@ configure_firewalld_rules() { # https://access.redhat.com/security/cve/cve-2020-13401 local -r prefix="/etc/sysctl.d" - local -r diable_accept_ra_conf="$prefix/02-disable-accept-ra.conf" - log "Writing $diable_accept_ra_conf" -cat >"$diable_accept_ra_conf" <<'EOF' -net.ipv6.conf.all.accept_ra=0 -EOF + local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf" + local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0" + + write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true local -r disable_core_filename="$prefix/01-disable-core.conf" local -r disable_core_file="kernel.core_pattern = |/bin/true From e899ae17e575b1cac17e750161a078a18c398af7 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Mon, 15 Apr 2024 15:53:38 -0400 Subject: [PATCH 14/38] Pass usage options via nameref variable that is also used by getops Move docker file creation to more logical location --- pkg/deploy/generator/scripts/gatewayVMSS.sh | 30 ++++++++++++--------- pkg/deploy/generator/scripts/rpVMSS.sh | 26 ++++++++++-------- 2 files changed, 32 insertions(+), 24 deletions(-) diff --git a/pkg/deploy/generator/scripts/gatewayVMSS.sh b/pkg/deploy/generator/scripts/gatewayVMSS.sh index 3751446891e..64b4232309f 100644 --- a/pkg/deploy/generator/scripts/gatewayVMSS.sh +++ b/pkg/deploy/generator/scripts/gatewayVMSS.sh @@ -28,15 +28,18 @@ main() { } usage() { - log "$(basename "$0") [-dplsrfui] + local -n options="$1" + log "$(basename "$0") [$options] -d Configure Disk Partitions -p Configure rpm repositories, import required rpm keys, update & install packages with dnf -l Configure logrotate.conf -s Make selinux modifications required for ARO RP -r Configure sshd - Allow password authenticaiton -f Configure firewalld default zone rules - -u Pull container images and configure systemd unit files for ARO RP + -u Configure systemd unit files for ARO RP -i Pull container images + + Note: steps will be executed in the order that flags are provided " } @@ -45,15 +48,16 @@ usage() { # # This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline parse_run_options() { - local -a options=("$1") + # shellcheck disable=SC2206 + local -a options=(${1:-}) if [ "${#options[@]}" -eq 0 ]; then log "Running all steps" return 0 fi local OPTIND - - while getopts "dplsrfui" options; do + local -r allowed_options="dplsrfui" + while getopts ${allowed_options} options; do case "${options}" in d) log "Running step configure_disk_partitions" @@ -88,7 +92,7 @@ parse_run_options() { pull_container_images ;; *) - usage + usage allowed_options abort "Unkown option provided" ;; esac @@ -372,12 +376,12 @@ configure_firewalld_rules() { sysctl --system - enable_ports=( + local -ra enable_ports=( + "80/tcp" + "8081/tcp" "443/tcp" - "444/tcp" - "445/tcp" - "2222/tcp" ) + log "Enabling ports ${enable_ports[*]} on default firewalld zone" # shellcheck disable=SC2068 for port in ${enable_ports[@]}; do @@ -392,8 +396,6 @@ configure_firewalld_rules() { pull_container_images() { log "starting" - echo "logging into prod acr" - # The managed identity that the VM runs as only has a single roleassignment. # This role assignment is ACRPull which is not necessarily present in the # subscription we're deploying into. If the identity does not have any @@ -404,11 +406,13 @@ pull_container_images() { # Suppress emulation output for podman instead of docker for az acr compatability mkdir -p /etc/containers/ + mkdir -p /root/.docker touch /etc/containers/nodocker - mkdir -p /root/.docker + # This name is used in the case that az acr login searches for this in it's environment local -r REGISTRY_AUTH_FILE="/root/.docker/config.json" + log "logging into prod acr" az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index f978ef2e00a..3c00da1185c 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -27,15 +27,18 @@ main() { } usage() { - log "$(basename "$0") [-dplsrfui] + local -n options="$1" + log "$(basename "$0") [$options] -d Configure Disk Partitions -p Configure rpm repositories, import required rpm keys, update & install packages with dnf -l Configure logrotate.conf -s Make selinux modifications required for ARO RP -r Configure sshd - Allow password authenticaiton -f Configure firewalld default zone rules - -u Pull container images and configure systemd unit files for ARO RP + -u Configure systemd unit files for ARO RP -i Pull container images + + Note: steps will be executed in the order that flags are provided " } @@ -44,15 +47,16 @@ usage() { # # This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline parse_run_options() { - local -a options=("$1") + # shellcheck disable=SC2206 + local -a options=(${1:-}) if [ "${#options[@]}" -eq 0 ]; then log "Running all steps" return 0 fi local OPTIND - - while getopts "dplsrfui" options; do + local -r allowed_options="dplsrfui" + while getopts ${allowed_options} options; do case "${options}" in d) log "Running step configure_disk_partitions" @@ -80,7 +84,6 @@ parse_run_options() { ;; u) log "Running pull_container_images & configure_system_services" - pull_container_images configure_system_services ;; i) @@ -88,7 +91,7 @@ parse_run_options() { pull_container_images ;; *) - usage + usage allowed_options abort "Unkown option provided" ;; esac @@ -359,12 +362,13 @@ configure_firewalld_rules() { sysctl --system - enable_ports=( + local -ra enable_ports=( "443/tcp" "444/tcp" "445/tcp" "2222/tcp" ) + log "Enabling ports ${enable_ports[*]} on default firewalld zone" # shellcheck disable=SC2068 for port in ${enable_ports[@]}; do @@ -379,8 +383,6 @@ configure_firewalld_rules() { pull_container_images() { log "starting" - echo "logging into prod acr" - # The managed identity that the VM runs as only has a single roleassignment. # This role assignment is ACRPull which is not necessarily present in the # subscription we're deploying into. If the identity does not have any @@ -391,11 +393,13 @@ pull_container_images() { # Suppress emulation output for podman instead of docker for az acr compatability mkdir -p /etc/containers/ + mkdir -p /root/.docker touch /etc/containers/nodocker - mkdir -p /root/.docker + # This name is used in the case that az acr login searches for this in it's environment local -r REGISTRY_AUTH_FILE="/root/.docker/config.json" + log "logging into prod acr" az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" From df11d619c872a45a80ce83b3b25552e37164ebc0 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Mon, 15 Apr 2024 15:54:12 -0400 Subject: [PATCH 15/38] Port changes to devProxyVMSS.sh --- pkg/deploy/assets/env-development.json | 2 +- pkg/deploy/assets/gateway-production.json | 2 +- pkg/deploy/assets/rp-production.json | 2 +- pkg/deploy/generator/scripts/devProxyVMSS.sh | 440 ++++++++++++++++--- 4 files changed, 378 insertions(+), 68 deletions(-) diff --git a/pkg/deploy/assets/env-development.json b/pkg/deploy/assets/env-development.json index 10057c04528..1da1cb9fb5b 100644 --- a/pkg/deploy/assets/env-development.json +++ b/pkg/deploy/assets/env-development.json @@ -296,7 +296,7 @@ "autoUpgradeMinorVersion": true, "settings": {}, "protectedSettings": { - "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'PROXYIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImage')),''')\n','PROXYIMAGEAUTH=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImageAuth')),''')\n','PROXYCERT=''',parameters('proxyCert'),'''\n','PROXYCLIENTCERT=''',parameters('proxyClientCert'),'''\n','PROXYKEY=''',parameters('proxyKey'),'''\n','\n',base64ToString('I0FkZGluZyByZXRyeSBsb2dpYyB0byB5dW0gY29tbWFuZHMgaW4gb3JkZXIgdG8gYXZvaWQgc3RhbGxpbmcgb3V0IG9uIHJlc291cmNlIGxvY2tzCmVjaG8gInJ1bm5pbmcgUkhVSSBmaXgiCmZvciBhdHRlbXB0IGluIHsxLi41fTsgZG8KICB5dW0gdXBkYXRlIC15IC0tZGlzYWJsZXJlcG89JyonIC0tZW5hYmxlcmVwbz0ncmh1aS1taWNyb3NvZnQtYXp1cmUqJyAmJiBicmVhawogIGlmIFtbICR7YXR0ZW1wdH0gLWx0IDUgXV07IHRoZW4gc2xlZXAgMTA7IGVsc2UgZXhpdCAxOyBmaQpkb25lCgplY2hvICJydW5uaW5nIHl1bSB1cGRhdGUiCmZvciBhdHRlbXB0IGluIHsxLi41fTsgZG8KICB5dW0gLXkgLXggV0FMaW51eEFnZW50IC14IFdBTGludXhBZ2VudC11ZGV2IHVwZGF0ZSAtLWFsbG93ZXJhc2luZyAmJiBicmVhawogIGlmIFtbICR7YXR0ZW1wdH0gLWx0IDUgXV07IHRoZW4gc2xlZXAgMTA7IGVsc2UgZXhpdCAxOyBmaQpkb25lCgplY2hvICJpbnN0YWxsaW5nIHBvZG1hbi1kb2NrZXIiCmZvciBhdHRlbXB0IGluIHsxLi41fTsgZG8KICB5dW0gLXkgaW5zdGFsbCBwb2RtYW4tZG9ja2VyICYmIGJyZWFrCiAgaWYgW1sgJHthdHRlbXB0fSAtbHQgNSBdXTsgdGhlbiBzbGVlcCAxMDsgZWxzZSBleGl0IDE7IGZpCmRvbmUKCmZpcmV3YWxsLWNtZCAtLWFkZC1wb3J0PTQ0My90Y3AgLS1wZXJtYW5lbnQKCm1rZGlyIC9yb290Ly5kb2NrZXIKY2F0ID4vcm9vdC8uZG9ja2VyL2NvbmZpZy5qc29uIDw8RU9GCnsKCSJhdXRocyI6IHsKCQkiJHtQUk9YWUlNQUdFJSUvKn0iOiB7CgkJCSJhdXRoIjogIiRQUk9YWUlNQUdFQVVUSCIKCQl9Cgl9Cn0KRU9GCgpta2RpciAtcCAvZXRjL2NvbnRhaW5lcnMvCnRvdWNoIC9ldGMvY29udGFpbmVycy9ub2RvY2tlcgoKZG9ja2VyIHB1bGwgIiRQUk9YWUlNQUdFIgoKbWtkaXIgL2V0Yy9wcm94eQpiYXNlNjQgLWQgPDw8IiRQUk9YWUNFUlQiID4vZXRjL3Byb3h5L3Byb3h5LmNydApiYXNlNjQgLWQgPDw8IiRQUk9YWUtFWSIgPi9ldGMvcHJveHkvcHJveHkua2V5CmJhc2U2NCAtZCA8PDwiJFBST1hZQ0xJRU5UQ0VSVCIgPi9ldGMvcHJveHkvcHJveHktY2xpZW50LmNydApjaG93biAtUiAxMDAwOjEwMDAgL2V0Yy9wcm94eQpjaG1vZCAwNjAwIC9ldGMvcHJveHkvcHJveHkua2V5CgpjYXQgPi9ldGMvc3lzY29uZmlnL3Byb3h5IDw8RU9GClBST1hZX0lNQUdFPSckUFJPWFlJTUFHRScKRU9GCgpjYXQgPi9ldGMvc3lzdGVtZC9zeXN0ZW0vcHJveHkuc2VydmljZSA8PCdFT0YnCltVbml0XQpBZnRlcj1uZXR3b3JrLW9ubGluZS50YXJnZXQKV2FudHM9bmV0d29yay1vbmxpbmUudGFyZ2V0CgpbU2VydmljZV0KRW52aXJvbm1lbnRGaWxlPS9ldGMvc3lzY29uZmlnL3Byb3h5CkV4ZWNTdGFydFByZT0tL3Vzci9iaW4vZG9ja2VyIHJtIC1mICVuCkV4ZWNTdGFydD0vdXNyL2Jpbi9kb2NrZXIgcnVuIC0tcm0gLS1uYW1lICVuIC1wIDQ0Mzo4NDQzIC12IC9ldGMvcHJveHk6L3NlY3JldHMgJFBST1hZX0lNQUdFCkV4ZWNTdG9wPS91c3IvYmluL2RvY2tlciBzdG9wICVuClJlc3RhcnQ9YWx3YXlzClJlc3RhcnRTZWM9MQpTdGFydExpbWl0SW50ZXJ2YWw9MAoKW0luc3RhbGxdCldhbnRlZEJ5PW11bHRpLXVzZXIudGFyZ2V0CkVPRgoKc3lzdGVtY3RsIGVuYWJsZSBwcm94eS5zZXJ2aWNlCgpjYXQgPi9ldGMvY3Jvbi53ZWVrbHkvcHVsbC1pbWFnZSA8PCdFT0YnCiMhL2Jpbi9iYXNoCgpkb2NrZXIgcHVsbCAkUFJPWFlJTUFHRQpzeXN0ZW1jdGwgcmVzdGFydCBwcm94eS5zZXJ2aWNlCkVPRgpjaG1vZCAreCAvZXRjL2Nyb24ud2Vla2x5L3B1bGwtaW1hZ2UKCmNhdCA+L2V0Yy9jcm9uLndlZWtseS95dW11cGRhdGUgPDwnRU9GJwojIS9iaW4vYmFzaAoKeXVtIHVwZGF0ZSAteQpFT0YKY2htb2QgK3ggL2V0Yy9jcm9uLndlZWtseS95dW11cGRhdGUKCmNhdCA+L2V0Yy9jcm9uLmRhaWx5L3Jlc3RhcnQtcHJveHkgPDwnRU9GJwojIS9iaW4vYmFzaAoKc3lzdGVtY3RsIHJlc3RhcnQgcHJveHkuc2VydmljZQpFT0YKY2htb2QgK3ggL2V0Yy9jcm9uLmRhaWx5L3Jlc3RhcnQtcHJveHkKCigKCXNsZWVwIDMwCglyZWJvb3QKKSAmCg==')))]" + "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'PROXYIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImage')),''')\n','PROXYIMAGEAUTH=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImageAuth')),''')\n','PROXYCERT=''',parameters('proxyCert'),'''\n','PROXYCLIENTCERT=''',parameters('proxyClientCert'),'''\n','PROXYKEY=''',parameters('proxyKey'),'''\n','\n',base64ToString('#!/bin/bash

set -o errexit \
    -o nounset

if [ "${DEBUG:-false}" == true ]; then
    set -x
fi

main() {
    parse_run_options "$@"

    configure_and_install_dnf_pkgs_repos

    configure_firewalld_rules
    pull_container_images
    configure_system_services
    reboot_vm
}

usage() {
    local -n options="$1"
    log "$(basename "$0") [$options]
        -p Configure rpm repositories, import required rpm keys, update & install packages with dnf
        -f Configure firewalld default zone rules
        -u Configure systemd unit files for ARO RP
        -i Pull container images

        Note: steps will be executed in the order that flags are provided
    "
}

# parse_run_options takes all arguements passed to main and parses them
# allowing individual step(s) to be ran, rather than all steps
#
# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline
parse_run_options() {
    # shellcheck disable=SC2206
    local -a options=(${1:-})
    if [ "${#options[@]}" -eq 0 ]; then
        log "Running all steps"
        return 0
    fi

    local OPTIND
	local -r allowed_options="pfui"
    while getopts ${allowed_options} options; do
        case "${options}" in
            p)
                log "Running step configure_and_install_dnf_pkgs_repos"
                configure_and_install_dnf_pkgs_repos
                ;;
            f)
                log "Running configure_firewalld_rules"
                configure_firewalld_rules
                ;;
            u)
                log "Running pull_container_images & configure_system_services"
                configure_system_services
                ;;
            i)
                log "Running pull_container_images"
                pull_container_images 
                ;;
            *)
                usage allowed_options
                abort "Unkown option provided"
                ;;
        esac
    done
    
    exit 0
}

# configure_and_install_dnf_pkgs_repos
configure_and_install_dnf_pkgs_repos() {
    log "starting"

    # transaction attempt retry time in seconds
    local -ri retry_wait_time=60
    configure_rhui_repo retry_wait_time

    local -ar exclude_pkgs=(
        "-x WALinuxAgent"
        "-x WALinuxAgent-udev"
    )

    dnf_update_pkgs exclude_pkgs retry_wait_time

    local -ra repo_rpm_pkgs=(
        https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm
    )

    local -ra install_pkgs=(
        podman
        podman-docker
    )

    dnf_install_pkgs repo_rpm_pkgs retry_wait_time
    dnf_install_pkgs install_pkgs retry_wait_time

	local -r cron_weekly_dnf_update_filename='/etc/cron.weekly/dnfupdate'
	local -r cron_weekly_dnf_update_file="#!/bin/bash
dnf update -y"

	write_file cron_weekly_dnf_update_filename cron_weekly_dnf_update_file true
	chmod +x "$cron_weekly_dnf_update_filename"
}

# configure_rhui_repo
configure_rhui_repo() {
    log "starting"

    local -ra cmd=(
        dnf
        update
        -y
        --disablerepo='*'
        --enablerepo='rhui-microsoft-azure*'
    )

    log "running RHUI package updates"
    retry cmd "$1"
}

# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks
retry() {
    local -n cmd_retry="$1"
    local -n wait_time="$2"

    for attempt in {1..5}; do
        log "attempt #${attempt} - ${FUNCNAME[2]}"
        ${cmd_retry[@]} &

        wait $! && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep "$wait_time"
        else
            abort "attempt #${attempt} - Failed to update packages"
        fi
    done
}

# dnf_update_pkgs
dnf_update_pkgs() {
    local -n excludes="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        ${excludes[@]}
        update
        --allowerasing
    )

    log "Updating all packages"
    retry cmd "$2"
}

# dnf_install_pkgs
dnf_install_pkgs() {
    local -n pkgs="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        install
        ${pkgs[@]}
    )

    log "Attempting to install packages: ${pkgs[*]}"
    retry cmd "$2"
}

# configure_logrotate clobbers /etc/logrotate.conf
configure_logrotate() {
    log "starting"

    local -r logrotate_conf_filename='/etc/logrotate.conf'
    local -r logrotate_conf_file='# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we will rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}'

    write_file logrotate_conf_filename logrotate_conf_file true
}

# configure_firewalld_rules
configure_firewalld_rules() {
    log "starting"

    # https://access.redhat.com/security/cve/cve-2020-13401
    local -r prefix="/etc/sysctl.d"
    local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf"
    local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0"

    write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true

    local -r disable_core_filename="$prefix/01-disable-core.conf"
    local -r disable_core_file="kernel.core_pattern = |/bin/true
    "
    write_file disable_core_filename disable_core_file true

    sysctl --system

    local -ra enable_ports=(
        "443/tcp"
    )

    log "Enabling ports ${enable_ports[*]} on default firewalld zone"
    # shellcheck disable=SC2068
    for port in ${enable_ports[@]}; do
        log "Enabling port $port now"
        firewall-cmd "--add-port=$port"
    done

    firewall-cmd --runtime-to-permanent
}

# pull_container_images
pull_container_images() {
    log "starting"

    # The managed identity that the VM runs as only has a single roleassignment.
    # This role assignment is ACRPull which is not necessarily present in the
    # subscription we're deploying into.  If the identity does not have any
    # role assignments scoped on the subscription we're deploying into, it will
    # not show on az login -i, which is why the below line is commented.
    # az account set -s "$SUBSCRIPTIONID"
    az login -i --allow-no-subscriptions

    # Suppress emulation output for podman instead of docker for az acr compatability
    mkdir -p /etc/containers/
    mkdir -p /root/.docker
    touch /etc/containers/nodocker

	# This name is used in the case that az acr login searches for this in it's environment
    local -r REGISTRY_AUTH_FILE="/root/.docker/config.json"
	local -r registry_config_file="{
	"auths": {
		\"${PROXYIMAGE%%/*}\": {
			\"auth\": \"$PROXYIMAGEAUTH\"
		}
	}"

	write_file REGISTRY_AUTH_FILE registry_config_file true

    log "logging into prod acr"

    az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

    docker pull "$PROXYIMAGE"

    az logout
}

# configure_system_services creates, configures, and enables the following systemd services and timers
# services
#	proxy
configure_system_services() {
	configure_service_proxy
}

# enable_aro_services enables all services required for aro rp
enable_aro_services() {
    log "starting"

    local -ra aro_services=(
		proxy
    )
    log "enabling aro services ${aro_services[*]}"
    # shellcheck disable=SC2068
    for service in ${aro_services[@]}; do
        log "Enabling $service now"
        systemctl enable "$service.service"
    done
}

# configure_certs
configure_certs() {
    log "starting"

	base64 -d <<<"$PROXYCERT" >/etc/proxy/proxy.crt
	base64 -d <<<"$PROXYKEY" >/etc/proxy/proxy.key
	base64 -d <<<"$PROXYCLIENTCERT" >/etc/proxy/proxy-client.crt
	chown -R 1000:1000 /etc/proxy
	chmod 0600 /etc/proxy/proxy.key
}

configure_service_proxy() {
	local -r sysconfig_proxy_filename='/etc/sysconfig/proxy'
	local -r sysconfig_proxy_file="PROXY_IMAGE='$PROXYIMAGE'"

	write_file sysconfig_proxy_filename sysconfig_proxy_file true

	local -r proxy_service_filename='/etc/systemd/system/proxy.service'
	local -r proxy_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/proxy
ExecStartPre=-/usr/bin/docker rm -f %n
ExecStart=/usr/bin/docker run --rm --name %n -p 443:8443 -v /etc/proxy:/secrets $PROXY_IMAGE
ExecStop=/usr/bin/docker stop %n
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

	local -r cron_weekly_pull_image_filename='/etc/cron.weekly/pull-image'
	local -r cron_weekly_pull_image_file="#!/bin/bash
docker pull $PROXYIMAGE
systemctl restart proxy.service"
	
	write_file cron_weekly_pull_image_filename cron_weekly_pull_image_file true
	chmod +x "$cron_weekly_pull_image_filename"

	local -r cron_daily_restart_proxy_filename='/etc/cron.daily/restart-proxy'
	local -r cron_daily_restart_proxy_file="#!/bin/bash
systemctl restart proxy.service"
	
	write_file cron_daily_restart_proxy_filename cron_daily_restart_proxy_file
	chmod +x "$cron_daily_restart_proxy_filename"
}

# write_file
# Args
# 1) filename - string
# 2) file_contents - string
# 3) clobber - boolean; optional - defaults to false
write_file() {
    local -n filename="$1"
    local -n file_contents="$2"
    local -r clobber="${3:-false}"

    if $clobber; then
        log "Overwriting file $filename"
        echo "$file_contents" > "$filename"
    else
        log "Appending to $filename"
        echo "$file_contents" >> "$filename"
    fi
}

# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots
reboot_vm() {
    log "starting"

    configure_selinux "true"
    (sleep 30 && log "rebooting vm now"; reboot) &
}

# log is a wrapper for echo that includes the function name
log() {
    local -r msg="${1:-"log message is empty"}"
    local -r stack_level="${2:-1}"
    echo "${FUNCNAME[${stack_level}]}: ${msg}"
}

# abort is a wrapper for log that exits with an error code
abort() {
    local -ri origin_stacklevel=2
    log "${1}" "$origin_stacklevel"
    log "Exiting"
    exit 1
}

export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}"

main "$@"
')))]" }, "provisionAfterExtensions": [ "Microsoft.Azure.Monitor.AzureMonitorLinuxAgent", diff --git a/pkg/deploy/assets/gateway-production.json b/pkg/deploy/assets/gateway-production.json index e539ddfd02a..ecbbe148c12 100644 --- a/pkg/deploy/assets/gateway-production.json +++ b/pkg/deploy/assets/gateway-production.json @@ -309,7 +309,7 @@ "autoUpgradeMinorVersion": true, "settings": {}, "protectedSettings": { - "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','DBTOKENURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenUrl')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','GATEWAYMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayMdsdConfigVersion')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayFeatures')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

echo "setting ssh password authentication"
# We need to manually set PasswordAuthentication to true in order for the VMSS Access JIT to work
sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config
systemctl reload sshd.service

#Adding retry logic to yum commands in order to avoid stalling out on resource locks
echo "running RHUI fix"
for attempt in {1..5}; do
  yum update -y --disablerepo='*' --enablerepo='rhui-microsoft-azure*' && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "running yum update"
for attempt in {1..5}; do
  yum -y -x WALinuxAgent -x WALinuxAgent-udev update --allowerasing && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "extending partition table"
# Linux block devices are inconsistently named
# it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
growpart "$physical_disk" 2

echo "extending filesystems"
lvextend -l +20%FREE /dev/rootvg/rootlv
xfs_growfs /

lvextend -l +100%FREE /dev/rootvg/varlv
xfs_growfs /var

rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
rpm --import https://packages.microsoft.com/keys/microsoft.asc

for attempt in {1..5}; do
  yum -y install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "configuring logrotate"

# gateway_logdir is a readonly variable that specifies the host path mount point for the gateway container log file
# for the purpose of rotating the gateway logs
declare -r gateway_logdir='/var/log/aro-gateway'

cat >/etc/logrotate.conf <<EOF
# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we'll rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}

# Maximum log directory size is 100G with this configuration
# Setting limit to 100G to allow space for other logging services
# copytruncate is a critical option used to prevent logs from being shipped twice
${gateway_logdir} {
    size 20G
    rotate 5
    create 0600 root root
    copytruncate
    noolddir
    compress
}
EOF

echo "configuring yum repository and running yum update"
cat >/etc/yum.repos.d/azure.repo <<'EOF'
[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no
EOF

semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?"
mkdir -p /var/log/journal

for attempt in {1..5}; do
  yum -y install clamav azsec-clamav azsec-monitor azure-cli azure-mdsd azure-security podman-docker openssl-perl python3 && break
  # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "applying firewall rules"
# https://access.redhat.com/security/cve/cve-2020-13401
cat >/etc/sysctl.d/02-disable-accept-ra.conf <<'EOF'
net.ipv6.conf.all.accept_ra=0
EOF

cat >/etc/sysctl.d/01-disable-core.conf <<'EOF'
kernel.core_pattern = |/bin/true
EOF
sysctl --system

firewall-cmd --add-port=80/tcp --permanent
firewall-cmd --add-port=8081/tcp --permanent
firewall-cmd --add-port=443/tcp --permanent

echo "logging into prod acr"
export AZURE_CLOUD_NAME=$AZURECLOUDNAME
az login -i --allow-no-subscriptions

# The managed identity that the VM runs as only has a single roleassignment.
# This role assignment is ACRPull which is not necessarily present in the
# subscription we're deploying into.  If the identity does not have any
# role assignments scoped on the subscription we're deploying into, it will
# not show on az login -i, which is why the below line is commented.
# az account set -s "$SUBSCRIPTIONID"

# Suppress emulation output for podman instead of docker for az acr compatability
mkdir -p /etc/containers/
touch /etc/containers/nodocker

mkdir -p /root/.docker
REGISTRY_AUTH_FILE="/root/.docker/config.json"
az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
docker pull "$MDMIMAGE"
docker pull "$RPIMAGE"
docker pull "$FLUENTBITIMAGE"

az logout

echo "configuring fluentbit service"
mkdir -p /etc/fluentbit/
mkdir -p /var/lib/fluent

cat >/etc/fluentbit/fluentbit.conf <<'EOF'
[INPUT]
	Name systemd
	Tag journald
	Systemd_Filter _COMM=aro
	DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[OUTPUT]
	Name forward
	Match *
	Port 29230
EOF

echo "FLUENTBITIMAGE=$FLUENTBITIMAGE" >/etc/sysconfig/fluentbit

cat >/etc/systemd/system/fluentbit.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring mdm service"
cat >/etc/sysconfig/mdm <<EOF
MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=gateway
MDMSOURCEROLEINSTANCE='$(hostname)'
EOF

mkdir /var/etw
cat >/etc/systemd/system/mdm.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring aro-gateway service"
cat >/etc/sysconfig/aro-gateway <<EOF
ACR_RESOURCE_ID='$ACRRESOURCEID'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
DBTOKEN_URL='$DBTOKENURL'
MDM_ACCOUNT="$RPMDMACCOUNT"
MDM_NAMESPACE=Gateway
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_FEATURES='$GATEWAYFEATURES'
RPIMAGE='$RPIMAGE'
EOF

cat >/etc/systemd/system/aro-gateway.service <<EOF
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-gateway
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStartPre=/usr/bin/mkdir -p ${gateway_logdir}
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e DBTOKEN_URL \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_FEATURES \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 80:8080 \
  -p 8081:8081 \
  -p 443:8443 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  -v ${gateway_logdir}:/ctr.log:z \
  \$RPIMAGE \
  gateway
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent

mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

echo "configuring mdsd and mdm services"
for var in "mdsd" "mdm"; do
cat >/etc/systemd/system/download-$var-credentials.service <<EOF
[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var
EOF

cat >/etc/systemd/system/download-$var-credentials.timer <<EOF
[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target
EOF
done

cat >/usr/local/bin/download-credentials.sh <<EOF
#!/bin/bash
set -eu

COMPONENT="\$1"
echo "Download \$COMPONENT credentials"

TEMP_DIR=\$(mktemp -d)
export AZURE_CONFIG_DIR=\$(mktemp -d)

echo "Logging into Azure..."
RETRIES=3
while [ "\$RETRIES" -gt 0 ]; do
    if az login -i --allow-no-subscriptions
    then
        echo "az login successful"
        break
    else
        echo "az login failed. Retrying..."
        let RETRIES-=1
        sleep 5
    fi
done

trap "cleanup" EXIT

cleanup() {
  az logout
  [[ "\$TEMP_DIR" =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ "\$AZURE_CONFIG_DIR" =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [ "\$COMPONENT" = "mdm" ]; then
  CURRENT_CERT_FILE="/etc/mdm.pem"
elif [ "\$COMPONENT" = "mdsd" ]; then
  CURRENT_CERT_FILE="/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME="gwy-\${COMPONENT}"
NEW_CERT_FILE="\$TEMP_DIR/\$COMPONENT.pem"
for attempt in {1..5}; do
  az keyvault secret download --file \$NEW_CERT_FILE --id "https://$KEYVAULTPREFIX-gwy.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME" && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [ "\$COMPONENT" = "mdsd" ]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn="\$(openssl x509 -in "\$NEW_CERT_FILE" -noout -serial | awk -F= '{print \$2}')"
  current_cert_sn="\$(openssl x509 -in "\$CURRENT_CERT_FILE" -noout -serial | awk -F= '{print \$2}')"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != "\$current_cert_sn" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi
EOF

chmod u+x /usr/local/bin/download-credentials.sh

systemctl enable download-mdsd-credentials.timer
systemctl enable download-mdm-credentials.timer

/usr/local/bin/download-credentials.sh mdsd
/usr/local/bin/download-credentials.sh mdm
MDSDCERTIFICATESAN=$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')

cat >/etc/systemd/system/watch-mdm-credentials.service <<EOF
[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target
EOF

cat >/etc/systemd/system/watch-mdm-credentials.path <<EOF
[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target
EOF

systemctl enable watch-mdm-credentials.path
systemctl start watch-mdm-credentials.path

mkdir /etc/systemd/system/mdsd.service.d
cat >/etc/systemd/system/mdsd.service.d/override.conf <<'EOF'
[Unit]
After=network-online.target
EOF

cat >/etc/default/mdsd <<EOF
MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS="-A -d -r \$MDSD_ROLE_PREFIX"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$GATEWAYMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=gateway
export MONITORING_ROLE_INSTANCE='$(hostname)'

export MDSD_MSGPACK_SORT_COLUMNS=1
EOF

# setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
# to honour SSL_CERT_FILE any more, heaven only knows why.
mkdir -p /usr/lib/ssl/certs
csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 {*} >/dev/null
c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
cat >/etc/default/vsa-nodescan-agent.config <<EOF
{
    "Nice": 19,
    "Timeout": 10800,
    "ClientId": "",
    "TenantId": "$AZURESECPACKVSATENANTID",
    "QualysStoreBaseUrl": "$AZURESECPACKQUALYSURL",
    "ProcessTimeout": 300,
    "CommandDelay": 0
  }
EOF

echo "enabling aro services"
for service in aro-gateway auoms azsecd azsecmond mdsd mdm chronyd fluentbit; do
  systemctl enable $service.service
done

for scan in baseline clamav software; do
  /usr/local/bin/azsecd config -s $scan -d P1D
done

echo "rebooting"
restorecon -RF /var/log/*
(sleep 30; reboot) &
')))]" + "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','DBTOKENURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenUrl')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','GATEWAYMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayMdsdConfigVersion')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayFeatures')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

set -o errexit \
    -o nounset

if [ "${DEBUG:-false}" == true ]; then
    set -x
fi

main() {
    local -r gateway_logdir='/var/log/aro-gateway'
    parse_run_options "$@" gateway_logdir


    configure_sshd
    configure_and_install_dnf_pkgs_repos
    configure_disk_partitions
    configure_logrotate gateway_logdir
    configure_selinux

    mkdir -p /var/log/journal
    mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

    configure_firewalld_rules
    pull_container_images
    configure_system_services gateway_logdir
    reboot_vm
}

usage() {
    local -n options="$1"
    log "$(basename "$0") [$options]
        -d Configure Disk Partitions
        -p Configure rpm repositories, import required rpm keys, update & install packages with dnf
        -l Configure logrotate.conf
        -s Make selinux modifications required for ARO RP
        -r Configure sshd - Allow password authenticaiton
        -f Configure firewalld default zone rules
        -u Configure systemd unit files for ARO RP
        -i Pull container images

        Note: steps will be executed in the order that flags are provided
    "
}

# parse_run_options takes all arguements passed to main and parses them
# allowing individual step(s) to be ran, rather than all steps
#
# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline
parse_run_options() {
    # shellcheck disable=SC2206
    local -a options=(${1:-})
    if [ "${#options[@]}" -eq 0 ]; then
        log "Running all steps"
        return 0
    fi

    local OPTIND
    local -r allowed_options="dplsrfui"
    while getopts ${allowed_options} options; do
        case "${options}" in
            d)
                log "Running step configure_disk_partitions"
                configure_disk_partitions
                ;;
            p)
                log "Running step configure_and_install_dnf_pkgs_repos"
                configure_and_install_dnf_pkgs_repos
                ;;
            l)
                log "Running configure_logrotate"
                configure_logrotate "$2"
                ;;
            s)
                log "Running configure_selinux"
                configure_selinux
                ;;
            r)
                log "Running configure_sshd"
                configure_sshd
                ;;
            f)
                log "Running configure_firewalld_rules"
                configure_firewalld_rules
                ;;
            u)
                log "Running pull_container_images & configure_system_services"
                configure_system_services "$2"
                ;;
            i)
                log "Running pull_container_images"
                pull_container_images 
                ;;
            *)
                usage allowed_options
                abort "Unkown option provided"
                ;;
        esac
    done
    
    exit 0
}

# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work
configure_sshd() {
    log "starting"
    log "setting ssh password authentication"
    sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config

    systemctl reload sshd.service
    systemctl is-active --quiet sshd || abort "sshd failed to reload"
}

# configure_and_install_dnf_pkgs_repos
configure_and_install_dnf_pkgs_repos() {
    log "starting"

    # transaction attempt retry time in seconds
    local -ri retry_wait_time=60
    configure_rhui_repo retry_wait_time
    create_azure_rpm_repos retry_wait_time

    local -ar exclude_pkgs=(
        "-x WALinuxAgent"
        "-x WALinuxAgent-udev"
    )

    dnf_update_pkgs exclude_pkgs retry_wait_time

    local -ra rpm_keys=(
        https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
        https://packages.microsoft.com/keys/microsoft.asc
    )

    rpm_import_keys rpm_keys retry_wait_time

    local -ra repo_rpm_pkgs=(
        https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm
    )

    local -ra install_pkgs=(
        clamav
        azsec-clamav
        azsec-monitor
        azure-cli
        azure-mdsd
        azure-security
        podman
        podman-docker
        openssl-perl
        # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
        python3
    )

    dnf_install_pkgs repo_rpm_pkgs retry_wait_time
    dnf_install_pkgs install_pkgs retry_wait_time
}

# configure_rhui_repo
configure_rhui_repo() {
    log "starting"

    local -ra cmd=(
        dnf
        update
        -y
        --disablerepo='*'
        --enablerepo='rhui-microsoft-azure*'
    )

    log "running RHUI package updates"
    retry cmd "$1"
}

# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks
retry() {
    local -n cmd_retry="$1"
    local -n wait_time="$2"

    for attempt in {1..5}; do
        log "attempt #${attempt} - ${FUNCNAME[2]}"
        ${cmd_retry[@]} &

        wait $! && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep "$wait_time"
        else
            abort "attempt #${attempt} - Failed to update packages"
        fi
    done
}

# dnf_update_pkgs
dnf_update_pkgs() {
    local -n excludes="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        ${excludes[@]}
        update
        --allowerasing
    )

    log "Updating all packages"
    retry cmd "$2"
}

# dnf_install_pkgs
dnf_install_pkgs() {
    local -n pkgs="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        install
        ${pkgs[@]}
    )

    log "Attempting to install packages: ${pkgs[*]}"
    retry cmd "$2"
}

# rpm_import_keys
rpm_import_keys() {
    local -n keys="$1"
    log "starting"


    # shellcheck disable=SC2068
    for key in ${keys[@]}; do
        if [ ${#keys[@]} -eq 0 ]; then
            break
        fi
            local -a cmd=(
                rpm
                --import
                -v
                "$key"
            )

            log "attempt #$attempt - importing rpm repository key $key"
            retry cmd "$2" && unset key
    done
}

# configure_disk_partitions
configure_disk_partitions() {
    log "starting"
    log "extending partition table"

    # Linux block devices are inconsistently named
    # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
    physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
    growpart "$physical_disk" 2

    log "extending filesystems"
    log "extending root lvm"
    lvextend -l +20%FREE /dev/rootvg/rootlv
    log "growing root filesystem"
    xfs_growfs /

    log "extending var lvm"
    lvextend -l +100%FREE /dev/rootvg/varlv
    log "growing var filesystem"
    xfs_growfs /var
}

# configure_logrotate clobbers /etc/logrotate.conf
configure_logrotate() {
    local -n log_dir="$1"
    log "starting"

    local -r logrotate_conf_filename='/etc/logrotate.conf'
    local -r logrotate_conf_file="# see 'man logrotate' for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we will rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}

# Maximum log directory size is 100G with this configuration
# Setting limit to 100G to allow space for other logging services
# copytruncate is a critical option used to prevent logs from being shipped twice
${log_dir} {
    size 20G
    rotate 5
    create 0600 root root
    copytruncate
    noolddir
    compress
}"

    write_file logrotate_conf_filename logrotate_conf_file true
}

# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file
create_azure_rpm_repos() {
    log "starting"

    local -r azure_repo_filename='/etc/yum.repos.d/azure.repo'
    local -r azure_repo_file='[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no'

    write_file azure_repo_filename azure_repo_file true
}

# configure_selinux
configure_selinux() {
    log "starting"

    local -r relabel="${1:-false}"

    already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined"
    semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error"
    chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent

    if "$relabel"; then
        restorecon -RF /var/log/* || log "$already_defined_ignore_error"
    fi
}

# configure_firewalld_rules
configure_firewalld_rules() {
    log "starting"

    # https://access.redhat.com/security/cve/cve-2020-13401
    local -r prefix="/etc/sysctl.d"
    local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf"
    local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0"

    write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true

    local -r disable_core_filename="$prefix/01-disable-core.conf"
    local -r disable_core_file="kernel.core_pattern = |/bin/true
    "
    write_file disable_core_filename disable_core_file true

    sysctl --system

    local -ra enable_ports=(
        "80/tcp"
        "8081/tcp"
        "443/tcp"
    )

    log "Enabling ports ${enable_ports[*]} on default firewalld zone"
    # shellcheck disable=SC2068
    for port in ${enable_ports[@]}; do
        log "Enabling port $port now"
        firewall-cmd "--add-port=$port"
    done

    firewall-cmd --runtime-to-permanent
}

# pull_container_images
pull_container_images() {
    log "starting"

    # The managed identity that the VM runs as only has a single roleassignment.
    # This role assignment is ACRPull which is not necessarily present in the
    # subscription we're deploying into.  If the identity does not have any
    # role assignments scoped on the subscription we're deploying into, it will
    # not show on az login -i, which is why the below line is commented.
    # az account set -s "$SUBSCRIPTIONID"
    az login -i --allow-no-subscriptions

    # Suppress emulation output for podman instead of docker for az acr compatability
    mkdir -p /etc/containers/
    mkdir -p /root/.docker
    touch /etc/containers/nodocker

	# This name is used in the case that az acr login searches for this in it's environment
    local -r REGISTRY_AUTH_FILE="/root/.docker/config.json"
    
    log "logging into prod acr"
    az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

    MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
    docker pull "$MDMIMAGE"
    docker pull "$RPIMAGE"
    docker pull "$FLUENTBITIMAGE"

    az logout
}

# configure_system_services creates, configures, and enables the following systemd services and timers
# services
#   fluentbit
#   mdm
#   mdsd
#   arp-rp
#   aro-dbtoken
#   aro-monitor
#   aro-portal
configure_system_services() {
    configure_service_fluentbit
    configure_service_mdm
    configure_timers_mdm_mdsd
    configure_service_aro_gateway "$1"
    configure_service_mdsd
}

# enable_aro_services enables all services required for aro rp
enable_aro_services() {
    log "starting"

    local -ra aro_services=(
      aro-gateway
      auoms
      azsecd
      azsecmond
      mdsd
      mdm
      chronyd
      fluentbit
    )
    log "enabling gateway services ${aro_services[*]}"
    # shellcheck disable=SC2068
    for service in ${aro_services[@]}; do
        log "Enabling $service now"
        systemctl enable "$service.service"
    done
}

# configure_service_fluentbit
configure_service_fluentbit() {
    log "starting"
    log "configuring fluentbit service"

    mkdir -p /etc/fluentbit/
    mkdir -p /var/lib/fluent

    local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf'
    local -r fluentbit_conf_file="[INPUT]
Name systemd
Tag journald
Systemd_Filter _COMM=aro
DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[OUTPUT]
	Name forward
	Match *
	Port 29230"

    write_file fluentbit_conf_filename fluentbit_conf_file true

    local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit'
    local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE"

    write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true

    local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service'

    local -r fluentbit_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file fluentbit_conf_filename fluentbit_conf_file true
}

# configure_certs
configure_certs() {
    log "starting"

    mkdir /etc/aro-rp
    base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem
    if [[ -n "$ARMAPICABUNDLE" ]]; then
    base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem
    fi
    chown -R 1000:1000 /etc/aro-rp

    # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
    # to honour SSL_CERT_FILE any more, heaven only knows why.
    mkdir -p /usr/lib/ssl/certs
    csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null
    c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
    local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config"
    local -r nodescan_agent_file="{
    \"Nice\": 19,
    \"Timeout\": 10800,
    \"ClientId\": \"\",
    \"TenantId\": $AZURESECPACKVSATENANTID,
    \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL,
    \"ProcessTimeout\": 300,
    \"CommandDelay\": 0
  }"

    write_file nodescan_agent_filename nodescan_agent_file true
}

# configure_service_mdm
configure_service_mdm() {
    log "starting"
    log "configuring mdm service"

    local -r sysconfig_mdm_filename="/etc/sysconfig/mdm"
    local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=gateway
MDMSOURCEROLEINSTANCE=\"$(hostname)\""

    write_file sysconfig_mdm_filename sysconfig_mdm_file true

    mkdir -p /var/etw
    local -r mdm_service_filename="/etc/systemd/system/mdm.service"
    local -r mdm_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file mdm_service_filename mdm_service_file true
}

# configure_timers_mdm_mdsd
configure_timers_mdm_mdsd() {
    log "starting"

    for var in "mdsd" "mdm"; do
        local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service"
        local download_creds_service_file="[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var"

        write_file download_creds_service_filename download_creds_service_file true

        local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer"
        local download_creds_timer_file="[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target"

        write_file download_creds_timer_filename download_creds_timer_file true
    done

    local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh"
    local -r download_creds_script_file="#!/bin/bash
set -eu

COMPONENT=\$1
echo \"Download \$COMPONENT credentials\"

TEMP_DIR=\"\$(mktemp -d)\"
export AZURE_CONFIG_DIR=\"\$(mktemp -d)\"

echo \"Logging into Azure...\"
RETRIES=3
while [[ \$RETRIES -gt 0 ]]; do
    if az login -i --allow-no-subscriptions
    then
        echo \"az login successful\"
        break
    else
        echo \"az login failed. Retrying...\"
        let RETRIES-=1
        sleep 5
    fi
done

trap \"cleanup\" EXIT

cleanup() {
  az logout
  [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [[ \$COMPONENT = \"mdm\" ]]; then
  CURRENT_CERT_FILE=\"/etc/mdm.pem\"
elif [[ \$COMPONENT\ = \"mdsd\" ]]; then
  CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME=\"gwy-\${COMPONENT}\"
NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\"
for attempt in {1..5}; do
  az keyvault \
    secret \
    download \
    --file \"\$NEW_CERT_FILE\" \
    --id \"https://$KEYVAULTPREFIX-gwy.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \
    && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [[ \$COMPONENT = \"mdsd\" ]]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi"

    write_file download_creds_script_filename download_creds_script_file true

    chmod u+x /usr/local/bin/download-credentials.sh

    systemctl enable download-mdsd-credentials.timer
    systemctl enable download-mdm-credentials.timer

    /usr/local/bin/download-credentials.sh mdsd
    /usr/local/bin/download-credentials.sh mdm

    local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')"
    local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service"
    local -r watch_mdm_creds_service_file="[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target"

    write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file true

    local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path'
    local -r watch_mdm_creds_path_file='[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target'

    write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file true

    local -r watch_mdm_creds='watch-mdm-credentials.path'
    systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds"
    systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds"
}

# configure_service_aro_rp
configure_service_aro_gateway() {
    local -n log_dir="$1"
    log "starting"

    local -r aro_gateway_conf_filename='/etc/sysconfig/aro-gateway'
    local -r aro_gateway_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID'
ADMIN_API_CLIENT_CERT_COMMON_NAME='$ADMINAPICLIENTCERTCOMMONNAME'
ARM_API_CLIENT_CERT_COMMON_NAME='$ARMAPICLIENTCERTCOMMONNAME'
AZURE_ARM_CLIENT_ID='$ARMCLIENTID'
AZURE_FP_CLIENT_ID='$FPCLIENTID'
AZURE_FP_SERVICE_PRINCIPAL_ID='$FPSERVICEPRINCIPALID'
BILLING_E2E_STORAGE_ACCOUNT_ID='$BILLINGE2ESTORAGEACCOUNTID'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=RP
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
DBTOKEN_URL='$DBTOKENURL'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Gateway
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_FEATURES='$GATEWAYFEATURES'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=RP
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
RP_FEATURES='$RPFEATURES'
RPIMAGE='$RPIMAGE'
ARO_INSTALL_VIA_HIVE='$CLUSTERSINSTALLVIAHIVE'
ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC='$CLUSTERDEFAULTINSTALLERPULLSPEC'
ARO_ADOPT_BY_HIVE='$CLUSTERSADOPTBYHIVE'
USE_CHECKACCESS='$USECHECKACCESS'"

    write_file aro_gateway_conf_filename aro_gateway_conf_file true

    local -r aro_gateway_service_filename='/etc/systemd/system/aro-gateway.service'

    local -r aro_gateway_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-gateway
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStartPre=/usr/bin/mkdir -p ${log_dir}
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e DBTOKEN_URL \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_FEATURES \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 80:8080 \
  -p 8081:8081 \
  -p 443:8443 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  -v ${log_dir}:/ctr.log:z \
  \$RPIMAGE \
  gateway
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
    "

    write_file aro_gateway_service_filename aro_gateway_service_file true
}

# configure_service_aro_dbtoken
configure_service_aro_dbtoken() {
    log "starting"

    local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken'
    local -r aro_dbtoken_service_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
DBTOKEN_URL='$DBTOKENURL'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Gateway
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_FEATURES='$GATEWAYFEATURES'
RPIMAGE='$RPIMAGE'"

    write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file true

    local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service'
    local -r aro_dbtoken_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-gateway
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStartPre=/usr/bin/mkdir -p ${gateway_logdir}
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e DBTOKEN_URL \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_FEATURES \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 80:8080 \
  -p 8081:8081 \
  -p 443:8443 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  -v ${gateway_logdir}:/ctr.log:z \
  \$RPIMAGE \
  gateway
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_dbtoken_service_filename aro_dbtoken_service_file true
}

# configure_service_mdsd
configure_service_mdsd() {
    log "starting"

    local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d"
    mkdir "$mdsd_service_dir"

    local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf"
    local -r mdsd_override_conf_file="[Unit]
After=network-online.target"

    write_file mdsd_override_conf_filename mdsd_override_conf_file true

    local -r default_mdsd_filename="/etc/default/mdsd"
    local -r default_mdsd_file="MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS=\"-A -d -r \$MDSD_ROLE_PREFIX\"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$GATEWAYMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=gateway
export MONITORING_ROLE_INSTANCE=\"$(hostname)\"

export MDSD_MSGPACK_SORT_COLUMNS=1\""

    write_file default_mdsd_filename default_mdsd_file true

}

# run_azsecd_config_scan
run_azsecd_config_scan() {
    log "starting"

    local -ar configs=(
        "baseline"
        "clamav"
        "software"
    )

    log "Scanning configuration files ${configs[*]}"
    # shellcheck disable=SC2068
    for scan in ${configs[@]}; do
        log "Scanning config file $scan now"
        /usr/local/bin/azsecd config -s "$scan" -d P1D
    done
}

# write_file
# Args
# 1) filename - string
# 2) file_contents - string
# 3) clobber - boolean; optional - defaults to false
write_file() {
    local -n filename="$1"
    local -n file_contents="$2"
    local -r clobber="${3:-false}"

    if $clobber; then
        log "Overwriting file $filename"
        echo "$file_contents" > "$filename"
    else
        log "Appending to $filename"
        echo "$file_contents" >> "$filename"
    fi
}

# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots
reboot_vm() {
    log "starting"

    configure_selinux "true"
    (sleep 30 && log "rebooting vm now"; reboot) &
}

# log is a wrapper for echo that includes the function name
log() {
    local -r msg="${1:-"log message is empty"}"
    local -r stack_level="${2:-1}"
    echo "${FUNCNAME[${stack_level}]}: ${msg}"
}

# abort is a wrapper for log that exits with an error code
abort() {
    local -ri origin_stacklevel=2
    log "${1}" "$origin_stacklevel"
    log "Exiting"
    exit 1
}

export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}"

main "$@"
')))]" } } } diff --git a/pkg/deploy/assets/rp-production.json b/pkg/deploy/assets/rp-production.json index eec290c2170..99f72f4d6ff 100644 --- a/pkg/deploy/assets/rp-production.json +++ b/pkg/deploy/assets/rp-production.json @@ -516,7 +516,7 @@ "autoUpgradeMinorVersion": true, "settings": {}, "protectedSettings": { - "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','ADMINAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('adminApiClientCertCommonName')),''')\n','ARMAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armApiClientCertCommonName')),''')\n','ARMCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armClientId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','BILLINGE2ESTORAGEACCOUNTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('billingE2EStorageAccountId')),''')\n','CLUSTERMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdmAccount')),''')\n','CLUSTERMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdAccount')),''')\n','CLUSTERMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdConfigVersion')),''')\n','CLUSTERMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdNamespace')),''')\n','CLUSTERPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterParentDomainName')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','FPCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpClientId')),''')\n','FPSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpServicePrincipalId')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYRESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayResourceGroupName')),''')\n','GATEWAYSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayServicePrincipalId')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','PORTALACCESSGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalAccessGroupIds')),''')\n','PORTALCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalClientId')),''')\n','PORTALELEVATEDGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalElevatedGroupIds')),''')\n','RPFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpFeatures')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdConfigVersion')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','RPPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpParentDomainName')),''')\n','CLUSTERSINSTALLVIAHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersInstallViaHive')),''')\n','CLUSTERSADOPTBYHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersAdoptByHive')),''')\n','CLUSTERDEFAULTINSTALLERPULLSPEC=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterDefaultInstallerPullspec')),''')\n','USECHECKACCESS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('useCheckAccess')),''')\n','ADMINAPICABUNDLE=''',parameters('adminApiCaBundle'),'''\n','ARMAPICABUNDLE=''',parameters('armApiCaBundle'),'''\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

set -o errexit \
    -o nounset

trap 'catch' ERR

main() {
    configure_sshd
    configure_and_install_dnf_pkgs_repos
    configure_disk_partitions
    configure_logrotate
    configure_selinux

    mkdir -p /var/log/journal
    mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

    configure_firewalld_rules
    pull_container_images
    configure_system_services
    reboot_vm
}

# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work
configure_sshd() {
    log "setting ssh password authentication"
    sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config

    systemctl reload sshd.service
    systemctl is-active --quiet sshd || abort "sshd failed to reload"
}

# configure_and_install_dnf_pkgs_repos
configure_and_install_dnf_pkgs_repos() {
    configure_rhui_repo
    create_azure_rpm_repos
    dnf_update_pkgs
    dnf_install_pkgs
}

# configure_rhui_repo
configure_rhui_repo() {
    log "running RHUI package updates"
    #Adding retry logic to yum commands in order to avoid stalling out on resource locks
    for attempt in {1..5}; do
        dnf update \
            -y \
            --disablerepo='*' \
            --enablerepo='rhui-microsoft-azure*' \
            && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep 10
        else
            abort "failed to run dnf update"
        fi
    done
}

# dnf_update_pkgs
dnf_update_pkgs() {
    log "running dnf update"
    for attempt in {1..5}; do
        dnf -y \
            -x WALinuxAgent \
            -x WALinuxAgent-udev \
            update --allowerasing \
            && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep 10
        else
            return 1
        fi
    done
}

# dnf_install_pkgs
dnf_install_pkgs() {
    log "importing rpm repositories"
    rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
    rpm --import https://packages.microsoft.com/keys/microsoft.asc

    for attempt in {1..5}; do
        dnf -y \
            install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm \
            && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep 10
        else
            return 1
        fi
    done

    for attempt in {1..5}; do
        dnf -y \
            install \
            clamav \
            azsec-clamav \
            azsec-monitor \
            azure-cli \
            azure-mdsd \
            azure-security \
            podman \
            podman-docker \
            openssl-perl \
            python3 \
            && break
        # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
        if [[ ${attempt} -lt 5 ]]; then
            sleep 10
        else
            abort "failed to install required packages"
        fi
    done
}

# configure_disk_partitions
configure_disk_partitions() {
    log "extending partition table"
    # Linux block devices are inconsistently named
    # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
    physicalDisk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
    growpart "$physicalDisk" 2

    log "extending filesystems"
    log "extending root lvm"
    lvextend -l +20%FREE /dev/rootvg/rootlv
    log "growing root filesystem"
    xfs_growfs /

    log "extending var lvm"
    lvextend -l +100%FREE /dev/rootvg/varlv
    log "growing var filesystem"
    xfs_growfs /var
}

# configure_logrotate clobbers /etc/logrotate.conf
configure_logrotate() {
    local -r logrotate_conf_filename='/etc/logrotate.conf'
    local -r logrotate_conf_file='# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we will rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}'

    write_file logrotate_conf_filename logrotate_conf_file true
}

# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file
create_azure_rpm_repos() {
    local -r azure_repo_filename='/etc/yum.repos.d/azure.repo'
    local -r azure_repo_file='[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no'

    write_file azure_repo_filename azure_repo_file
}

# configure_selinux
configure_selinux() {
    local -r relabel="${1:-false}"

    already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined"
    semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error"
    chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent

    if "$relabel"; then
        restorecon -RF /var/log/* || log "$already_defined_ignore_error"
    fi
}

# configure_firewalld_rules
configure_firewalld_rules() {
    # https://access.redhat.com/security/cve/cve-2020-13401
    local -r prefix="/etc/sysctl.d"
    local -r diable_accept_ra_conf="$prefix/02-disable-accept-ra.conf"
    log "Writing $diable_accept_ra_conf"
cat >"$diable_accept_ra_conf" <<'EOF'
net.ipv6.conf.all.accept_ra=0
EOF

    local -r disable_core_filename="$prefix/01-disable-core.conf"
    local -r disable_core_file="kernel.core_pattern = |/bin/true
    "
    write_file disable_core_filename disable_core_file

    sysctl --system

    enable_ports=(
        "443/tcp"
        "444/tcp"
        "445/tcp"
        "2222/tcp"
    )
    log "Enabling ports ${enable_ports[*]} on default firewalld zone"
    # shellcheck disable=SC2068
    for port in ${enable_ports[@]}; do
        log "Enabling port $port now"
        firewall-cmd "--add-port=$port"
    done

    firewall-cmd --runtime-to-permanent
}

# pull_container_images
pull_container_images() {
    echo "logging into prod acr"
    az login -i --allow-no-subscriptions

    # Suppress emulation output for podman instead of docker for az acr compatability
    mkdir -p /etc/containers/
    touch /etc/containers/nodocker

    mkdir -p /root/.docker
    local -r REGISTRY_AUTH_FILE="/root/.docker/config.json"
    
    az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

    MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
    docker pull "$MDMIMAGE"
    docker pull "$RPIMAGE"
    docker pull "$FLUENTBITIMAGE"

    az logout
}

# configure_system_services creates, configures, and enables the following systemd services and timers
# services
#   fluentbit
#   mdm
#   mdsd
#   arp-rp
#   aro-dbtoken
#   aro-monitor
#   aro-portal
configure_system_services() {
    configure_service_fluentbit
    configure_service_mdm
    configure_timers_mdm_mdsd
    configure_service_aro_rp
    configure_service_aro_dbtoken
    configure_service_aro_monitor
    configure_service_aro_portal
    configure_service_mdsd
}

# enable_aro_services enables all services required for aro rp
enable_aro_services() {
    local -ra aro_services=(
        "aro-dbtoken"
        "aro-monitor"
        "aro-portal"
        "aro-rp"
        "auoms"
        "azsecd"
        "azsecmond"
        "mdsd"
        "mdm"
        "chronyd"
        "fluentbit"
    )
    log "enabling aro services ${aro_services[*]}"
    # shellcheck disable=SC2068
    for service in ${aro_services[@]}; do
        log "Enabling $service now"
        systemctl enable "$service.service"
    done
}

# configure_service_fluentbit
configure_service_fluentbit() {
    log "configuring fluentbit service"
    mkdir -p /etc/fluentbit/
    mkdir -p /var/lib/fluent

    local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf'
    local -r fluentbit_conf_file="[INPUT]
Name systemd
Tag journald
Systemd_Filter _COMM=aro
DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND asyncqos asyncqos true

[FILTER]
	Name modify
	Match asyncqos
	Remove CLIENT_PRINCIPAL_NAME
	Remove FILE
	Remove COMPONENT

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND ifxaudit ifxaudit false

[OUTPUT]
	Name forward
	Match *
	Port 29230"

    write_file fluentbit_conf_filename fluentbit_conf_file

    local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit'
    local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE"

    write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file

    local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service'

    local -r fluentbit_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file fluentbit_conf_filename fluentbit_conf_file
}

# configure_certs
configure_certs() {
    mkdir /etc/aro-rp
    base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem
    if [[ -n "$ARMAPICABUNDLE" ]]; then
    base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem
    fi
    chown -R 1000:1000 /etc/aro-rp

    # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
    # to honour SSL_CERT_FILE any more, heaven only knows why.
    mkdir -p /usr/lib/ssl/certs
    csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null
    c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
    local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config"
    local -r nodescan_agent_file="{
    \"Nice\": 19,
    \"Timeout\": 10800,
    \"ClientId\": \"\",
    \"TenantId\": $AZURESECPACKVSATENANTID,
    \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL,
    \"ProcessTimeout\": 300,
    \"CommandDelay\": 0
  }"

    write_file nodescan_agent_filename nodescan_agent_file
}

# configure_service_mdm
configure_service_mdm() {
    log "configuring mdm service"

    local -r sysconfig_mdm_filename="/etc/sysconfig/mdm"
    local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=rp
MDMSOURCEROLEINSTANCE=\"$(hostname)\""

    write_file sysconfig_mdm_filename sysconfig_mdm_file

    mkdir -p /var/etw
    local -r mdm_service_filename="/etc/systemd/system/mdm.service"
    local -r mdm_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file mdm_service_filename mdm_service_file
}

# configure_timers_mdm_mdsd
configure_timers_mdm_mdsd() {
    for var in "mdsd" "mdm"; do
        local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service"
        local download_creds_service_file="[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var"

        write_file download_creds_service_filename download_creds_service_file

        local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer"
        local download_creds_timer_file="[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target"

        write_file download_creds_timer_filename download_creds_timer_file
    done

    local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh"
    local -r download_creds_script_file="#!/bin/bash
set -eu

COMPONENT=\$1
echo \"Download \$COMPONENT credentials\"

TEMP_DIR=\"\$(mktemp -d)\"
export AZURE_CONFIG_DIR=\"\$(mktemp -d)\"

echo \"Logging into Azure...\"
RETRIES=3
while [[ \$RETRIES -gt 0 ]]; do
    if az login -i --allow-no-subscriptions
    then
        echo \"az login successful\"
        break
    else
        echo \"az login failed. Retrying...\"
        let RETRIES-=1
        sleep 5
    fi
done

trap \"cleanup\" EXIT

cleanup() {
  az logout
  [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [[ \$COMPONENT = \"mdm\" ]]; then
  CURRENT_CERT_FILE=\"/etc/mdm.pem\"
elif [[ \$COMPONENT\ = \"mdsd\" ]]; then
  CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME=\"rp-\${COMPONENT}\"
NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\"
for attempt in {1..5}; do
  az keyvault \
    secret \
    download \
    --file \"\$NEW_CERT_FILE\" \
    --id \"https://$KEYVAULTPREFIX-svc.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \
    && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [[ \$COMPONENT = \"mdsd\" ]]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi"

    write_file download_creds_script_filename download_creds_script_file

    chmod u+x /usr/local/bin/download-credentials.sh

    systemctl enable download-mdsd-credentials.timer
    systemctl enable download-mdm-credentials.timer

    /usr/local/bin/download-credentials.sh mdsd
    /usr/local/bin/download-credentials.sh mdm

    local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')"
    local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service"
    local -r watch_mdm_creds_service_file="[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target"

    write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file

    local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path'
    local -r watch_mdm_creds_path_file='[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target'

    write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file

    local -r watch_mdm_creds='watch-mdm-credentials.path'
    systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds"
    systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds"
}

# configure_service_aro_rp
configure_service_aro_rp() {
    local -r aro_rp_conf_filename='/etc/sysconfig/aro-rp'
    local -r aro_rp_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID'
ADMIN_API_CLIENT_CERT_COMMON_NAME='$ADMINAPICLIENTCERTCOMMONNAME'
ARM_API_CLIENT_CERT_COMMON_NAME='$ARMAPICLIENTCERTCOMMONNAME'
AZURE_ARM_CLIENT_ID='$ARMCLIENTID'
AZURE_FP_CLIENT_ID='$FPCLIENTID'
AZURE_FP_SERVICE_PRINCIPAL_ID='$FPSERVICEPRINCIPALID'
BILLING_E2E_STORAGE_ACCOUNT_ID='$BILLINGE2ESTORAGEACCOUNTID'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=RP
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=RP
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
RP_FEATURES='$RPFEATURES'
RPIMAGE='$RPIMAGE'
ARO_INSTALL_VIA_HIVE='$CLUSTERSINSTALLVIAHIVE'
ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC='$CLUSTERDEFAULTINSTALLERPULLSPEC'
ARO_ADOPT_BY_HIVE='$CLUSTERSADOPTBYHIVE'
USE_CHECKACCESS='$USECHECKACCESS'"

    write_file aro_rp_conf_filename aro_rp_conf_file

    local -r aro_rp_service_filename='/etc/systemd/system/aro-rp.service'
    local -r aro_rp_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-rp
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e ADMIN_API_CLIENT_CERT_COMMON_NAME \
  -e ARM_API_CLIENT_CERT_COMMON_NAME \
  -e AZURE_ARM_CLIENT_ID \
  -e AZURE_FP_CLIENT_ID \
  -e BILLING_E2E_STORAGE_ACCOUNT_ID \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e CLUSTER_MDSD_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e DOMAIN_NAME \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e MDSD_ENVIRONMENT \
  -e RP_FEATURES \
  -e ARO_INSTALL_VIA_HIVE \
  -e ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC \
  -e ARO_ADOPT_BY_HIVE \
  -e USE_CHECKACCESS \
  -m 2g \
  -p 443:8443 \
  -v /etc/aro-rp:/etc/aro-rp \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  rp
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_rp_service_filename aro_rp_conf_file
}

# configure_service_aro_dbtoken
configure_service_aro_dbtoken() {
    local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken'
    local -r aro_dbtoken_service_conf_file="DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=DBToken
RPIMAGE='$RPIMAGE'"

    write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file

    local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service'
    local -r aro_dbtoken_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-dbtoken
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 445:8445 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  dbtoken
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_dbtoken_service_filename aro_dbtoken_service_file
}

# configure_service_aro_monitor
configure_service_aro_monitor() {
    log "configuring aro-monitor service"
    # DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE
    # are not used, but can't easily be refactored out. Should be revisited in the future.
    local -r aro_monitor_service_conf_filename='/etc/sysconfig/aro-monitor'
    local -r aro_monitor_service_conf_file="AZURE_FP_CLIENT_ID='$FPCLIENTID'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=BBM
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=BBM
RPIMAGE='$RPIMAGE'"

    write_file aro_monitor_service_conf_filename aro_monitor_service_conf_file

    local -r aro_monitor_service_filename='/etc/systemd/system/aro-monitor.service'
    local -r aro_monitor_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-monitor
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_FP_CLIENT_ID \
  -e DOMAIN_NAME \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e MDSD_ENVIRONMENT \
  -e CLUSTER_MDSD_NAMESPACE \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2.5g \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  monitor
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_monitor_service_filename aro_monitor_service_file
}

# configure_service_aro_portal
configure_service_aro_portal() {
    local -r aro_portal_service_conf_filename='/etc/sysconfig/aro-portal'
    local -r aro_portal_service_conf_file="AZURE_PORTAL_ACCESS_GROUP_IDS='$PORTALACCESSGROUPIDS'
AZURE_PORTAL_CLIENT_ID='$PORTALCLIENTID'
AZURE_PORTAL_ELEVATED_GROUP_IDS='$PORTALELEVATEDGROUPIDS'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Portal
PORTAL_HOSTNAME='$LOCATION.admin.$RPPARENTDOMAINNAME'
RPIMAGE='$RPIMAGE'"

    write_file aro_portal_service_conf_filename aro_portal_service_conf_file

    local -r aro_portal_service_filename='/etc/systemd/system/aro-portal.service'
    local -r aro_portal_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitInterval=0

[Service]
EnvironmentFile=/etc/sysconfig/aro-portal
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_PORTAL_ACCESS_GROUP_IDS \
  -e AZURE_PORTAL_CLIENT_ID \
  -e AZURE_PORTAL_ELEVATED_GROUP_IDS \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e PORTAL_HOSTNAME \
  -m 2g \
  -p 444:8444 \
  -p 2222:2222 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  portal
Restart=always
RestartSec=1

[Install]
WantedBy=multi-user.target"

    write_file aro_portal_service_conf_filename aro_portal_service_conf_file
}

# configure_service_mdsd
configure_service_mdsd() {
    local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d"
    mkdir "$mdsd_service_dir"

    local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf"
    local -r mdsd_override_conf_file="[Unit]
After=network-online.target"

    write_file mdsd_override_conf_filename mdsd_override_conf_file

    local -r default_mdsd_filename="/etc/default/mdsd"
    local -r default_mdsd_file="MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS=\"-A -d -r \$MDSD_ROLE_PREFIX\"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$RPMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=rp
export MONITORING_ROLE_INSTANCE=\"$(hostname)\"

export MDSD_MSGPACK_SORT_COLUMNS=1\""

    write_file default_mdsd_filename default_mdsd_file

}

# run_azsecd_config_scan
run_azsecd_config_scan() {
    local -ar configs=(
        "baseline"
        "clamav"
        "software"
    )

    log "Scanning configuration files ${configs[*]}"
    # shellcheck disable=SC2068
    for scan in ${configs[@]}; do
        log "Scanning config file $scan now"
        /usr/local/bin/azsecd config -s "$scan" -d P1D
    done
}

# write_file
# Args
# 1) filename - string
# 2) file_contents - string
# 3) clobber - boolean; optional - defaults to false
write_file() {
    local -n filename="$1"
    local -n file_contents="$2"
    local -r clobber="${3:-false}"

    if $clobber; then
        log "Overwriting file $filename"
        echo "$file_contents" > "$filename"
    else
        log "Appending to $filename"
        echo "$file_contents" >> "$filename"
    fi
}

# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots
reboot_vm() {
    configure_selinux "true"
    (sleep 30 && log "rebooting vm now"; reboot) &
}

# log is a wrapper for echo that includes the function name
log() {
    local -r msg="${1:-"log message is empty"}"
    local -r stack_level="${2:-1}"
    echo "${FUNCNAME[${stack_level}]}: ${msg}"
}

# abort is a wrapper for log that exits with an error code
abort() {
    local -ri origin_stacklevel=2
    log "${1}" "$origin_stacklevel"
    exit 1
}

export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}"

main
')))]" + "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','ADMINAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('adminApiClientCertCommonName')),''')\n','ARMAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armApiClientCertCommonName')),''')\n','ARMCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armClientId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','BILLINGE2ESTORAGEACCOUNTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('billingE2EStorageAccountId')),''')\n','CLUSTERMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdmAccount')),''')\n','CLUSTERMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdAccount')),''')\n','CLUSTERMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdConfigVersion')),''')\n','CLUSTERMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdNamespace')),''')\n','CLUSTERPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterParentDomainName')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','FPCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpClientId')),''')\n','FPSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpServicePrincipalId')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYRESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayResourceGroupName')),''')\n','GATEWAYSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayServicePrincipalId')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','PORTALACCESSGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalAccessGroupIds')),''')\n','PORTALCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalClientId')),''')\n','PORTALELEVATEDGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalElevatedGroupIds')),''')\n','RPFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpFeatures')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdConfigVersion')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','RPPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpParentDomainName')),''')\n','CLUSTERSINSTALLVIAHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersInstallViaHive')),''')\n','CLUSTERSADOPTBYHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersAdoptByHive')),''')\n','CLUSTERDEFAULTINSTALLERPULLSPEC=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterDefaultInstallerPullspec')),''')\n','USECHECKACCESS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('useCheckAccess')),''')\n','ADMINAPICABUNDLE=''',parameters('adminApiCaBundle'),'''\n','ARMAPICABUNDLE=''',parameters('armApiCaBundle'),'''\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

set -o errexit \
    -o nounset

if [ "${DEBUG:-false}" == true ]; then
    set -x
fi

main() {
    parse_run_options "$@"


    configure_sshd
    configure_and_install_dnf_pkgs_repos
    configure_disk_partitions
    configure_logrotate
    configure_selinux

    mkdir -p /var/log/journal
    mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

    configure_firewalld_rules
    pull_container_images
    configure_system_services
    reboot_vm
}

usage() {
    local -n options="$1"
    log "$(basename "$0") [$options]
        -d Configure Disk Partitions
        -p Configure rpm repositories, import required rpm keys, update & install packages with dnf
        -l Configure logrotate.conf
        -s Make selinux modifications required for ARO RP
        -r Configure sshd - Allow password authenticaiton
        -f Configure firewalld default zone rules
        -u Configure systemd unit files for ARO RP
        -i Pull container images

        Note: steps will be executed in the order that flags are provided
    "
}

# parse_run_options takes all arguements passed to main and parses them
# allowing individual step(s) to be ran, rather than all steps
#
# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline
parse_run_options() {
    # shellcheck disable=SC2206
    local -a options=(${1:-})
    if [ "${#options[@]}" -eq 0 ]; then
        log "Running all steps"
        return 0
    fi

    local OPTIND
    local -r allowed_options="dplsrfui"
    while getopts ${allowed_options} options; do
        case "${options}" in
            d)
                log "Running step configure_disk_partitions"
                configure_disk_partitions
                ;;
            p)
                log "Running step configure_and_install_dnf_pkgs_repos"
                configure_and_install_dnf_pkgs_repos
                ;;
            l)
                log "Running configure_logrotate"
                configure_logrotate
                ;;
            s)
                log "Running configure_selinux"
                configure_selinux
                ;;
            r)
                log "Running configure_sshd"
                configure_sshd
                ;;
            f)
                log "Running configure_firewalld_rules"
                configure_firewalld_rules
                ;;
            u)
                log "Running pull_container_images & configure_system_services"
                configure_system_services
                ;;
            i)
                log "Running pull_container_images"
                pull_container_images 
                ;;
            *)
                usage allowed_options
                abort "Unkown option provided"
                ;;
        esac
    done
    
    exit 0
}

# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work
configure_sshd() {
    log "starting"
    log "setting ssh password authentication"
    sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config

    systemctl reload sshd.service
    systemctl is-active --quiet sshd || abort "sshd failed to reload"
}

# configure_and_install_dnf_pkgs_repos
configure_and_install_dnf_pkgs_repos() {
    log "starting"

    # transaction attempt retry time in seconds
    local -ri retry_wait_time=60
    configure_rhui_repo retry_wait_time
    create_azure_rpm_repos retry_wait_time

    local -ar exclude_pkgs=(
        "-x WALinuxAgent"
        "-x WALinuxAgent-udev"
    )

    dnf_update_pkgs exclude_pkgs retry_wait_time

    local -ra rpm_keys=(
        https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
        https://packages.microsoft.com/keys/microsoft.asc
    )

    rpm_import_keys rpm_keys retry_wait_time

    local -ra repo_rpm_pkgs=(
        https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm
    )

    local -ra install_pkgs=(
        clamav
        azsec-clamav
        azsec-monitor
        azure-cli
        azure-mdsd
        azure-security
        podman
        podman-docker
        openssl-perl
        # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
        python3
    )

    dnf_install_pkgs repo_rpm_pkgs retry_wait_time
    dnf_install_pkgs install_pkgs retry_wait_time
}

# configure_rhui_repo
configure_rhui_repo() {
    log "starting"

    local -ra cmd=(
        dnf
        update
        -y
        --disablerepo='*'
        --enablerepo='rhui-microsoft-azure*'
    )

    log "running RHUI package updates"
    retry cmd "$1"
}

# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks
retry() {
    local -n cmd_retry="$1"
    local -n wait_time="$2"

    for attempt in {1..5}; do
        log "attempt #${attempt} - ${FUNCNAME[2]}"
        ${cmd_retry[@]} &

        wait $! && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep "$wait_time"
        else
            abort "attempt #${attempt} - Failed to update packages"
        fi
    done
}

# dnf_update_pkgs
dnf_update_pkgs() {
    local -n excludes="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        ${excludes[@]}
        update
        --allowerasing
    )

    log "Updating all packages"
    retry cmd "$2"
}

# dnf_install_pkgs
dnf_install_pkgs() {
    local -n pkgs="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        install
        ${pkgs[@]}
    )

    log "Attempting to install packages: ${pkgs[*]}"
    retry cmd "$2"
}

# rpm_import_keys
rpm_import_keys() {
    local -n keys="$1"
    log "starting"


    # shellcheck disable=SC2068
    for key in ${keys[@]}; do
        if [ ${#keys[@]} -eq 0 ]; then
            break
        fi
            local -a cmd=(
                rpm
                --import
                -v
                "$key"
            )

            log "attempt #$attempt - importing rpm repository key $key"
            retry cmd "$2" && unset key
    done
}

# configure_disk_partitions
configure_disk_partitions() {
    log "starting"
    log "extending partition table"

    # Linux block devices are inconsistently named
    # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
    physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
    growpart "$physical_disk" 2

    log "extending filesystems"
    log "extending root lvm"
    lvextend -l +20%FREE /dev/rootvg/rootlv
    log "growing root filesystem"
    xfs_growfs /

    log "extending var lvm"
    lvextend -l +100%FREE /dev/rootvg/varlv
    log "growing var filesystem"
    xfs_growfs /var
}

# configure_logrotate clobbers /etc/logrotate.conf
configure_logrotate() {
    log "starting"

    local -r logrotate_conf_filename='/etc/logrotate.conf'
    local -r logrotate_conf_file='# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we will rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}'

    write_file logrotate_conf_filename logrotate_conf_file true
}

# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file
create_azure_rpm_repos() {
    log "starting"

    local -r azure_repo_filename='/etc/yum.repos.d/azure.repo'
    local -r azure_repo_file='[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no'

    write_file azure_repo_filename azure_repo_file true
}

# configure_selinux
configure_selinux() {
    log "starting"

    local -r relabel="${1:-false}"

    already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined"
    semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error"
    chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent

    if "$relabel"; then
        restorecon -RF /var/log/* || log "$already_defined_ignore_error"
    fi
}

# configure_firewalld_rules
configure_firewalld_rules() {
    log "starting"

    # https://access.redhat.com/security/cve/cve-2020-13401
    local -r prefix="/etc/sysctl.d"
    local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf"
    local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0"

    write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true

    local -r disable_core_filename="$prefix/01-disable-core.conf"
    local -r disable_core_file="kernel.core_pattern = |/bin/true
    "
    write_file disable_core_filename disable_core_file true

    sysctl --system

    local -ra enable_ports=(
        "443/tcp"
        "444/tcp"
        "445/tcp"
        "2222/tcp"
    )

    log "Enabling ports ${enable_ports[*]} on default firewalld zone"
    # shellcheck disable=SC2068
    for port in ${enable_ports[@]}; do
        log "Enabling port $port now"
        firewall-cmd "--add-port=$port"
    done

    firewall-cmd --runtime-to-permanent
}

# pull_container_images
pull_container_images() {
    log "starting"

    # The managed identity that the VM runs as only has a single roleassignment.
    # This role assignment is ACRPull which is not necessarily present in the
    # subscription we're deploying into.  If the identity does not have any
    # role assignments scoped on the subscription we're deploying into, it will
    # not show on az login -i, which is why the below line is commented.
    # az account set -s "$SUBSCRIPTIONID"
    az login -i --allow-no-subscriptions

    # Suppress emulation output for podman instead of docker for az acr compatability
    mkdir -p /etc/containers/
    mkdir -p /root/.docker
    touch /etc/containers/nodocker

	# This name is used in the case that az acr login searches for this in it's environment
    local -r REGISTRY_AUTH_FILE="/root/.docker/config.json"
    
    log "logging into prod acr"
    az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

    MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
    docker pull "$MDMIMAGE"
    docker pull "$RPIMAGE"
    docker pull "$FLUENTBITIMAGE"

    az logout
}

# configure_system_services creates, configures, and enables the following systemd services and timers
# services
#   fluentbit
#   mdm
#   mdsd
#   arp-rp
#   aro-dbtoken
#   aro-monitor
#   aro-portal
configure_system_services() {
    configure_service_fluentbit
    configure_service_mdm
    configure_timers_mdm_mdsd
    configure_service_aro_rp
    configure_service_aro_dbtoken
    configure_service_aro_monitor
    configure_service_aro_portal
    configure_service_mdsd
}

# enable_aro_services enables all services required for aro rp
enable_aro_services() {
    log "starting"

    local -ra aro_services=(
        "aro-dbtoken"
        "aro-monitor"
        "aro-portal"
        "aro-rp"
        "auoms"
        "azsecd"
        "azsecmond"
        "mdsd"
        "mdm"
        "chronyd"
        "fluentbit"
    )
    log "enabling aro services ${aro_services[*]}"
    # shellcheck disable=SC2068
    for service in ${aro_services[@]}; do
        log "Enabling $service now"
        systemctl enable "$service.service"
    done
}

# configure_service_fluentbit
configure_service_fluentbit() {
    log "starting"
    log "configuring fluentbit service"

    mkdir -p /etc/fluentbit/
    mkdir -p /var/lib/fluent

    local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf'
    local -r fluentbit_conf_file="[INPUT]
Name systemd
Tag journald
Systemd_Filter _COMM=aro
DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND asyncqos asyncqos true

[FILTER]
	Name modify
	Match asyncqos
	Remove CLIENT_PRINCIPAL_NAME
	Remove FILE
	Remove COMPONENT

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND ifxaudit ifxaudit false

[OUTPUT]
	Name forward
	Match *
	Port 29230"

    write_file fluentbit_conf_filename fluentbit_conf_file true

    local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit'
    local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE"

    write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true

    local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service'

    local -r fluentbit_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file fluentbit_conf_filename fluentbit_conf_file true
}

# configure_certs
configure_certs() {
    log "starting"

    mkdir /etc/aro-rp
    base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem
    if [[ -n "$ARMAPICABUNDLE" ]]; then
    base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem
    fi
    chown -R 1000:1000 /etc/aro-rp

    # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
    # to honour SSL_CERT_FILE any more, heaven only knows why.
    mkdir -p /usr/lib/ssl/certs
    csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null
    c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
    local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config"
    local -r nodescan_agent_file="{
    \"Nice\": 19,
    \"Timeout\": 10800,
    \"ClientId\": \"\",
    \"TenantId\": $AZURESECPACKVSATENANTID,
    \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL,
    \"ProcessTimeout\": 300,
    \"CommandDelay\": 0
  }"

    write_file nodescan_agent_filename nodescan_agent_file true
}

# configure_service_mdm
configure_service_mdm() {
    log "starting"
    log "configuring mdm service"

    local -r sysconfig_mdm_filename="/etc/sysconfig/mdm"
    local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=rp
MDMSOURCEROLEINSTANCE=\"$(hostname)\""

    write_file sysconfig_mdm_filename sysconfig_mdm_file true

    mkdir -p /var/etw
    local -r mdm_service_filename="/etc/systemd/system/mdm.service"
    local -r mdm_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file mdm_service_filename mdm_service_file true
}

# configure_timers_mdm_mdsd
configure_timers_mdm_mdsd() {
    log "starting"

    for var in "mdsd" "mdm"; do
        local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service"
        local download_creds_service_file="[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var"

        write_file download_creds_service_filename download_creds_service_file true

        local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer"
        local download_creds_timer_file="[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target"

        write_file download_creds_timer_filename download_creds_timer_file true
    done

    local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh"
    local -r download_creds_script_file="#!/bin/bash
set -eu

COMPONENT=\$1
echo \"Download \$COMPONENT credentials\"

TEMP_DIR=\"\$(mktemp -d)\"
export AZURE_CONFIG_DIR=\"\$(mktemp -d)\"

echo \"Logging into Azure...\"
RETRIES=3
while [[ \$RETRIES -gt 0 ]]; do
    if az login -i --allow-no-subscriptions
    then
        echo \"az login successful\"
        break
    else
        echo \"az login failed. Retrying...\"
        let RETRIES-=1
        sleep 5
    fi
done

trap \"cleanup\" EXIT

cleanup() {
  az logout
  [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [[ \$COMPONENT = \"mdm\" ]]; then
  CURRENT_CERT_FILE=\"/etc/mdm.pem\"
elif [[ \$COMPONENT\ = \"mdsd\" ]]; then
  CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME=\"rp-\${COMPONENT}\"
NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\"
for attempt in {1..5}; do
  az keyvault \
    secret \
    download \
    --file \"\$NEW_CERT_FILE\" \
    --id \"https://$KEYVAULTPREFIX-svc.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \
    && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [[ \$COMPONENT = \"mdsd\" ]]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi"

    write_file download_creds_script_filename download_creds_script_file true

    chmod u+x /usr/local/bin/download-credentials.sh

    systemctl enable download-mdsd-credentials.timer
    systemctl enable download-mdm-credentials.timer

    /usr/local/bin/download-credentials.sh mdsd
    /usr/local/bin/download-credentials.sh mdm

    local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')"
    local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service"
    local -r watch_mdm_creds_service_file="[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target"

    write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file true

    local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path'
    local -r watch_mdm_creds_path_file='[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target'

    write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file true

    local -r watch_mdm_creds='watch-mdm-credentials.path'
    systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds"
    systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds"
}

# configure_service_aro_rp
configure_service_aro_rp() {
    log "starting"

    local -r aro_rp_conf_filename='/etc/sysconfig/aro-rp'
    local -r aro_rp_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID'
ADMIN_API_CLIENT_CERT_COMMON_NAME='$ADMINAPICLIENTCERTCOMMONNAME'
ARM_API_CLIENT_CERT_COMMON_NAME='$ARMAPICLIENTCERTCOMMONNAME'
AZURE_ARM_CLIENT_ID='$ARMCLIENTID'
AZURE_FP_CLIENT_ID='$FPCLIENTID'
AZURE_FP_SERVICE_PRINCIPAL_ID='$FPSERVICEPRINCIPALID'
BILLING_E2E_STORAGE_ACCOUNT_ID='$BILLINGE2ESTORAGEACCOUNTID'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=RP
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=RP
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
RP_FEATURES='$RPFEATURES'
RPIMAGE='$RPIMAGE'
ARO_INSTALL_VIA_HIVE='$CLUSTERSINSTALLVIAHIVE'
ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC='$CLUSTERDEFAULTINSTALLERPULLSPEC'
ARO_ADOPT_BY_HIVE='$CLUSTERSADOPTBYHIVE'
USE_CHECKACCESS='$USECHECKACCESS'"

    write_file aro_rp_conf_filename aro_rp_conf_file true

    local -r aro_rp_service_filename='/etc/systemd/system/aro-rp.service'
    local -r aro_rp_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-rp
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e ADMIN_API_CLIENT_CERT_COMMON_NAME \
  -e ARM_API_CLIENT_CERT_COMMON_NAME \
  -e AZURE_ARM_CLIENT_ID \
  -e AZURE_FP_CLIENT_ID \
  -e BILLING_E2E_STORAGE_ACCOUNT_ID \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e CLUSTER_MDSD_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e DOMAIN_NAME \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e MDSD_ENVIRONMENT \
  -e RP_FEATURES \
  -e ARO_INSTALL_VIA_HIVE \
  -e ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC \
  -e ARO_ADOPT_BY_HIVE \
  -e USE_CHECKACCESS \
  -m 2g \
  -p 443:8443 \
  -v /etc/aro-rp:/etc/aro-rp \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  rp
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_rp_service_filename aro_rp_conf_file true
}

# configure_service_aro_dbtoken
configure_service_aro_dbtoken() {
    log "starting"

    local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken'
    local -r aro_dbtoken_service_conf_file="DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=DBToken
RPIMAGE='$RPIMAGE'"

    write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file true

    local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service'
    local -r aro_dbtoken_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-dbtoken
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 445:8445 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  dbtoken
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_dbtoken_service_filename aro_dbtoken_service_file true
}

# configure_service_aro_monitor
configure_service_aro_monitor() {
    log "starting"
    log "configuring aro-monitor service"

    # DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE
    # are not used, but can't easily be refactored out. Should be revisited in the future.
    local -r aro_monitor_service_conf_filename='/etc/sysconfig/aro-monitor'
    local -r aro_monitor_service_conf_file="AZURE_FP_CLIENT_ID='$FPCLIENTID'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=BBM
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=BBM
RPIMAGE='$RPIMAGE'"

    write_file aro_monitor_service_conf_filename aro_monitor_service_conf_file true

    local -r aro_monitor_service_filename='/etc/systemd/system/aro-monitor.service'
    local -r aro_monitor_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-monitor
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_FP_CLIENT_ID \
  -e DOMAIN_NAME \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e MDSD_ENVIRONMENT \
  -e CLUSTER_MDSD_NAMESPACE \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2.5g \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  monitor
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_monitor_service_filename aro_monitor_service_file true
}

# configure_service_aro_portal
configure_service_aro_portal() {
    log "starting"

    local -r aro_portal_service_conf_filename='/etc/sysconfig/aro-portal'
    local -r aro_portal_service_conf_file="AZURE_PORTAL_ACCESS_GROUP_IDS='$PORTALACCESSGROUPIDS'
AZURE_PORTAL_CLIENT_ID='$PORTALCLIENTID'
AZURE_PORTAL_ELEVATED_GROUP_IDS='$PORTALELEVATEDGROUPIDS'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Portal
PORTAL_HOSTNAME='$LOCATION.admin.$RPPARENTDOMAINNAME'
RPIMAGE='$RPIMAGE'"

    write_file aro_portal_service_conf_filename aro_portal_service_conf_file true

    local -r aro_portal_service_filename='/etc/systemd/system/aro-portal.service'
    local -r aro_portal_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitInterval=0

[Service]
EnvironmentFile=/etc/sysconfig/aro-portal
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_PORTAL_ACCESS_GROUP_IDS \
  -e AZURE_PORTAL_CLIENT_ID \
  -e AZURE_PORTAL_ELEVATED_GROUP_IDS \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e PORTAL_HOSTNAME \
  -m 2g \
  -p 444:8444 \
  -p 2222:2222 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  portal
Restart=always
RestartSec=1

[Install]
WantedBy=multi-user.target"

    write_file aro_portal_service_conf_filename aro_portal_service_conf_file true
}

# configure_service_mdsd
configure_service_mdsd() {
    log "starting"

    local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d"
    mkdir "$mdsd_service_dir"

    local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf"
    local -r mdsd_override_conf_file="[Unit]
After=network-online.target"

    write_file mdsd_override_conf_filename mdsd_override_conf_file true

    local -r default_mdsd_filename="/etc/default/mdsd"
    local -r default_mdsd_file="MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS=\"-A -d -r \$MDSD_ROLE_PREFIX\"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$RPMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=rp
export MONITORING_ROLE_INSTANCE=\"$(hostname)\"

export MDSD_MSGPACK_SORT_COLUMNS=1\""

    write_file default_mdsd_filename default_mdsd_file true

}

# run_azsecd_config_scan
run_azsecd_config_scan() {
    log "starting"

    local -ar configs=(
        "baseline"
        "clamav"
        "software"
    )

    log "Scanning configuration files ${configs[*]}"
    # shellcheck disable=SC2068
    for scan in ${configs[@]}; do
        log "Scanning config file $scan now"
        /usr/local/bin/azsecd config -s "$scan" -d P1D
    done
}

# write_file
# Args
# 1) filename - string
# 2) file_contents - string
# 3) clobber - boolean; optional - defaults to false
write_file() {
    local -n filename="$1"
    local -n file_contents="$2"
    local -r clobber="${3:-false}"

    if $clobber; then
        log "Overwriting file $filename"
        echo "$file_contents" > "$filename"
    else
        log "Appending to $filename"
        echo "$file_contents" >> "$filename"
    fi
}

# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots
reboot_vm() {
    log "starting"

    configure_selinux "true"
    (sleep 30 && log "rebooting vm now"; reboot) &
}

# log is a wrapper for echo that includes the function name
log() {
    local -r msg="${1:-"log message is empty"}"
    local -r stack_level="${2:-1}"
    echo "${FUNCNAME[${stack_level}]}: ${msg}"
}

# abort is a wrapper for log that exits with an error code
abort() {
    local -ri origin_stacklevel=2
    log "${1}" "$origin_stacklevel"
    log "Exiting"
    exit 1
}

export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}"

main "$@"
')))]" } } } diff --git a/pkg/deploy/generator/scripts/devProxyVMSS.sh b/pkg/deploy/generator/scripts/devProxyVMSS.sh index bdbb8fe35b3..2b405881bce 100644 --- a/pkg/deploy/generator/scripts/devProxyVMSS.sh +++ b/pkg/deploy/generator/scripts/devProxyVMSS.sh @@ -1,53 +1,331 @@ -#Adding retry logic to yum commands in order to avoid stalling out on resource locks -echo "running RHUI fix" -for attempt in {1..5}; do - yum update -y --disablerepo='*' --enablerepo='rhui-microsoft-azure*' && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done - -echo "running yum update" -for attempt in {1..5}; do - yum -y -x WALinuxAgent -x WALinuxAgent-udev update --allowerasing && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done - -echo "installing podman-docker" -for attempt in {1..5}; do - yum -y install podman-docker && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done - -firewall-cmd --add-port=443/tcp --permanent - -mkdir /root/.docker -cat >/root/.docker/config.json </etc/proxy/proxy.crt -base64 -d <<<"$PROXYKEY" >/etc/proxy/proxy.key -base64 -d <<<"$PROXYCLIENTCERT" >/etc/proxy/proxy-client.crt -chown -R 1000:1000 /etc/proxy -chmod 0600 /etc/proxy/proxy.key + local -ra aro_services=( + proxy + ) + log "enabling aro services ${aro_services[*]}" + # shellcheck disable=SC2068 + for service in ${aro_services[@]}; do + log "Enabling $service now" + systemctl enable "$service.service" + done +} -cat >/etc/sysconfig/proxy </etc/systemd/system/proxy.service <<'EOF' -[Unit] + base64 -d <<<"$PROXYCERT" >/etc/proxy/proxy.crt + base64 -d <<<"$PROXYKEY" >/etc/proxy/proxy.key + base64 -d <<<"$PROXYCLIENTCERT" >/etc/proxy/proxy-client.crt + chown -R 1000:1000 /etc/proxy + chmod 0600 /etc/proxy/proxy.key +} + +configure_service_proxy() { + local -r sysconfig_proxy_filename='/etc/sysconfig/proxy' + local -r sysconfig_proxy_file="PROXY_IMAGE='$PROXYIMAGE'" + + write_file sysconfig_proxy_filename sysconfig_proxy_file true + + local -r proxy_service_filename='/etc/systemd/system/proxy.service' + local -r proxy_service_file="[Unit] After=network-online.target Wants=network-online.target @@ -61,34 +339,66 @@ RestartSec=1 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" -systemctl enable proxy.service + local -r cron_weekly_pull_image_filename='/etc/cron.weekly/pull-image' + local -r cron_weekly_pull_image_file="#!/bin/bash +docker pull $PROXYIMAGE +systemctl restart proxy.service" + + write_file cron_weekly_pull_image_filename cron_weekly_pull_image_file true + chmod +x "$cron_weekly_pull_image_filename" -cat >/etc/cron.weekly/pull-image <<'EOF' -#!/bin/bash + local -r cron_daily_restart_proxy_filename='/etc/cron.daily/restart-proxy' + local -r cron_daily_restart_proxy_file="#!/bin/bash +systemctl restart proxy.service" + + write_file cron_daily_restart_proxy_filename cron_daily_restart_proxy_file + chmod +x "$cron_daily_restart_proxy_filename" +} -docker pull $PROXYIMAGE -systemctl restart proxy.service -EOF -chmod +x /etc/cron.weekly/pull-image +# write_file +# Args +# 1) filename - string +# 2) file_contents - string +# 3) clobber - boolean; optional - defaults to false +write_file() { + local -n filename="$1" + local -n file_contents="$2" + local -r clobber="${3:-false}" -cat >/etc/cron.weekly/yumupdate <<'EOF' -#!/bin/bash + if $clobber; then + log "Overwriting file $filename" + echo "$file_contents" > "$filename" + else + log "Appending to $filename" + echo "$file_contents" >> "$filename" + fi +} -yum update -y -EOF -chmod +x /etc/cron.weekly/yumupdate +# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots +reboot_vm() { + log "starting" -cat >/etc/cron.daily/restart-proxy <<'EOF' -#!/bin/bash + configure_selinux "true" + (sleep 30 && log "rebooting vm now"; reboot) & +} + +# log is a wrapper for echo that includes the function name +log() { + local -r msg="${1:-"log message is empty"}" + local -r stack_level="${2:-1}" + echo "${FUNCNAME[${stack_level}]}: ${msg}" +} + +# abort is a wrapper for log that exits with an error code +abort() { + local -ri origin_stacklevel=2 + log "${1}" "$origin_stacklevel" + log "Exiting" + exit 1 +} -systemctl restart proxy.service -EOF -chmod +x /etc/cron.daily/restart-proxy +export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}" -( - sleep 30 - reboot -) & +main "$@" From ff7c3721e2ce402cbc70b03eb839f3c0156213b9 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Wed, 17 Apr 2024 15:19:10 -0400 Subject: [PATCH 16/38] WIP start moving common functions into common.sh for reuse --- pkg/deploy/generator/scripts/common.sh | 116 ++++++++++++ pkg/deploy/generator/scripts/rpVMSS.sh | 234 +++++++------------------ 2 files changed, 184 insertions(+), 166 deletions(-) create mode 100644 pkg/deploy/generator/scripts/common.sh diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/common.sh new file mode 100644 index 00000000000..9064da4782a --- /dev/null +++ b/pkg/deploy/generator/scripts/common.sh @@ -0,0 +1,116 @@ +#!/bin/bash +# This file is intended to be sourced by bootstrapping scripts for commonly used functions + +# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks +retry() { + local -n cmd_retry="$1" + local -n wait_time="$2" + + for attempt in {1..5}; do + log "attempt #${attempt} - ${FUNCNAME[2]}" + ${cmd_retry[@]} & + + wait $! && break + if [[ ${attempt} -lt 5 ]]; then + sleep "$wait_time" + else + abort "attempt #${attempt} - Failed to update packages" + fi + done +} + + +# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work +configure_sshd() { + log "starting" + local sshd_config="/etc/ssh/sshd_config" + + log "Editing $sshd_config to allow password authentication" + sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' "$sshd_config" + + systemctl reload sshd.service || abort "sshd failed to reload" +} + +# dnf_update_pkgs +dnf_update_pkgs() { + local -n excludes="$1" + log "starting" + + local -ra cmd=( + dnf + -y + ${excludes[@]} + update + --allowerasing + ) + + log "Updating all packages excluding ${excludes[*]}" + retry cmd "$2" +} + +# rpm_import_keys +rpm_import_keys() { + local -n keys="$1" + log "starting" + + + # shellcheck disable=SC2068 + for key in ${keys[@]}; do + if [ ${#keys[@]} -eq 0 ]; then + break + fi + local -a cmd=( + rpm + --import + -v + "$key" + ) + + log "attempt #$attempt - importing rpm repository key $key" + retry cmd "$2" && unset key + done +} + +# configure_selinux +configure_selinux() { + log "starting" + + local -r relabel="${1:-false}" + + already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined" + semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error" + chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent + + if "$relabel"; then + restorecon -RF /var/log/* || log "$already_defined_ignore_error" + fi +} + +# configure_firewalld_rules +configure_firewalld_rules() { + local -n ports="$1" + log "starting" + + # https://access.redhat.com/security/cve/cve-2020-13401 + local -r prefix="/etc/sysctl.d" + local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf" + local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0" + + write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true + + local -r disable_core_filename="$prefix/01-disable-core.conf" + local -r disable_core_file="kernel.core_pattern = |/bin/true + " + write_file disable_core_filename disable_core_file true + + sysctl --system + + log "Enabling ports ${enable_ports[*]} on default firewalld zone" + # shellcheck disable=SC2068 + for port in ${ports[@]}; do + log "Enabling port $port now" + firewall-cmd "--add-port=$port" + done + + firewall-cmd --runtime-to-permanent +} \ No newline at end of file diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 3c00da1185c..26c0055b35c 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -8,11 +8,53 @@ if [ "${DEBUG:-false}" == true ]; then fi main() { + # transaction attempt retry time in seconds + local -ri retry_wait_time=60 + + # shellcheck source=common.sh + source common.sh + parse_run_options "$@" configure_sshd - configure_and_install_dnf_pkgs_repos + configure_rpm_repos retry_wait_time + + local -ar exclude_pkgs=( + "-x WALinuxAgent" + "-x WALinuxAgent-udev" + ) + + dnf_update_pkgs exclude_pkgs retry_wait_time + + local -ra rpm_keys=( + https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 + https://packages.microsoft.com/keys/microsoft.asc + ) + + rpm_import_keys rpm_keys retry_wait_time + + local -ra repo_rpm_pkgs=( + https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm + ) + + local -ra install_pkgs=( + clamav + azsec-clamav + azsec-monitor + azure-cli + azure-mdsd + azure-security + podman + podman-docker + openssl-perl + # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 + python3 + ) + + dnf_install_pkgs repo_rpm_pkgs retry_wait_time + dnf_install_pkgs install_pkgs retry_wait_time + configure_disk_partitions configure_logrotate configure_selinux @@ -20,8 +62,22 @@ main() { mkdir -p /var/log/journal mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store - configure_firewalld_rules - pull_container_images + local -ra enable_ports=( + "443/tcp" + "444/tcp" + "445/tcp" + "2222/tcp" + ) + configure_firewalld_rules enable_ports + + MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" + local -ra images=( + "$MDMIMAGE" + "$RPIMAGE" + "$FLUENTBITIMAGE" + ) + + pull_container_images images configure_system_services reboot_vm } @@ -100,59 +156,11 @@ parse_run_options() { exit 0 } -# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work -configure_sshd() { +configure_rpm_repos() { log "starting" - log "setting ssh password authentication" - sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config - systemctl reload sshd.service - systemctl is-active --quiet sshd || abort "sshd failed to reload" -} - -# configure_and_install_dnf_pkgs_repos -configure_and_install_dnf_pkgs_repos() { - log "starting" - - # transaction attempt retry time in seconds - local -ri retry_wait_time=60 - configure_rhui_repo retry_wait_time - create_azure_rpm_repos retry_wait_time - - local -ar exclude_pkgs=( - "-x WALinuxAgent" - "-x WALinuxAgent-udev" - ) - - dnf_update_pkgs exclude_pkgs retry_wait_time - - local -ra rpm_keys=( - https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 - https://packages.microsoft.com/keys/microsoft.asc - ) - - rpm_import_keys rpm_keys retry_wait_time - - local -ra repo_rpm_pkgs=( - https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm - ) - - local -ra install_pkgs=( - clamav - azsec-clamav - azsec-monitor - azure-cli - azure-mdsd - azure-security - podman - podman-docker - openssl-perl - # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 - python3 - ) - - dnf_install_pkgs repo_rpm_pkgs retry_wait_time - dnf_install_pkgs install_pkgs retry_wait_time + configure_rhui_repo "$1" + create_azure_rpm_repos "$1" } # configure_rhui_repo @@ -171,41 +179,6 @@ configure_rhui_repo() { retry cmd "$1" } -# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks -retry() { - local -n cmd_retry="$1" - local -n wait_time="$2" - - for attempt in {1..5}; do - log "attempt #${attempt} - ${FUNCNAME[2]}" - ${cmd_retry[@]} & - - wait $! && break - if [[ ${attempt} -lt 5 ]]; then - sleep "$wait_time" - else - abort "attempt #${attempt} - Failed to update packages" - fi - done -} - -# dnf_update_pkgs -dnf_update_pkgs() { - local -n excludes="$1" - log "starting" - - local -ra cmd=( - dnf - -y - ${excludes[@]} - update - --allowerasing - ) - - log "Updating all packages" - retry cmd "$2" -} - # dnf_install_pkgs dnf_install_pkgs() { local -n pkgs="$1" @@ -222,29 +195,6 @@ dnf_install_pkgs() { retry cmd "$2" } -# rpm_import_keys -rpm_import_keys() { - local -n keys="$1" - log "starting" - - - # shellcheck disable=SC2068 - for key in ${keys[@]}; do - if [ ${#keys[@]} -eq 0 ]; then - break - fi - local -a cmd=( - rpm - --import - -v - "$key" - ) - - log "attempt #$attempt - importing rpm repository key $key" - retry cmd "$2" && unset key - done -} - # configure_disk_partitions configure_disk_partitions() { log "starting" @@ -329,58 +279,9 @@ gpgcheck=no' write_file azure_repo_filename azure_repo_file true } -# configure_selinux -configure_selinux() { - log "starting" - - local -r relabel="${1:-false}" - - already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined" - semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error" - chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent - - if "$relabel"; then - restorecon -RF /var/log/* || log "$already_defined_ignore_error" - fi -} - -# configure_firewalld_rules -configure_firewalld_rules() { - log "starting" - - # https://access.redhat.com/security/cve/cve-2020-13401 - local -r prefix="/etc/sysctl.d" - local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf" - local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0" - - write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true - - local -r disable_core_filename="$prefix/01-disable-core.conf" - local -r disable_core_file="kernel.core_pattern = |/bin/true - " - write_file disable_core_filename disable_core_file true - - sysctl --system - - local -ra enable_ports=( - "443/tcp" - "444/tcp" - "445/tcp" - "2222/tcp" - ) - - log "Enabling ports ${enable_ports[*]} on default firewalld zone" - # shellcheck disable=SC2068 - for port in ${enable_ports[@]}; do - log "Enabling port $port now" - firewall-cmd "--add-port=$port" - done - - firewall-cmd --runtime-to-permanent -} - # pull_container_images pull_container_images() { + local -n pull_images="$1" log "starting" # The managed identity that the VM runs as only has a single roleassignment. @@ -402,10 +303,11 @@ pull_container_images() { log "logging into prod acr" az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" - MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" - docker pull "$MDMIMAGE" - docker pull "$RPIMAGE" - docker pull "$FLUENTBITIMAGE" + # shellcheck disable=SC2068 + for i in ${pull_images[@]}; do + log "Pulling image $i now" + podman pull "$i" + done az logout } From 9dd98cb3a1419b7d2855c2a70924aa03392773f7 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Wed, 17 Apr 2024 15:21:41 -0400 Subject: [PATCH 17/38] WIP Move log rotate configuration to common.sh Need to allow addition of drop in files as well for gatewayVMSS.sh --- pkg/deploy/generator/scripts/common.sh | 44 +++++++++++++++++++++++++- pkg/deploy/generator/scripts/rpVMSS.sh | 42 ------------------------ 2 files changed, 43 insertions(+), 43 deletions(-) diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/common.sh index 9064da4782a..25b249fee42 100644 --- a/pkg/deploy/generator/scripts/common.sh +++ b/pkg/deploy/generator/scripts/common.sh @@ -113,4 +113,46 @@ configure_firewalld_rules() { done firewall-cmd --runtime-to-permanent -} \ No newline at end of file +} + +# configure_logrotate clobbers /etc/logrotate.conf +configure_logrotate() { + log "starting" + + local -r logrotate_conf_filename='/etc/logrotate.conf' + local -r logrotate_conf_file='# see "man logrotate" for details +# rotate log files weekly +weekly + +# keep 2 weeks worth of backlogs +rotate 2 + +# create new (empty) log files after rotating old ones +create + +# use date as a suffix of the rotated file +dateext + +# uncomment this if you want your log files compressed +compress + +# RPM packages drop log rotation information into this directory +include /etc/logrotate.d + +# no packages own wtmp and btmp -- we will rotate them here +/var/log/wtmp { + monthly + create 0664 root utmp + minsize 1M + rotate 1 +} + +/var/log/btmp { + missingok + monthly + create 0600 root utmp + rotate 1 +}' + + write_file logrotate_conf_filename logrotate_conf_file true +} diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 26c0055b35c..e74da4d3fc9 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -217,48 +217,6 @@ configure_disk_partitions() { xfs_growfs /var } -# configure_logrotate clobbers /etc/logrotate.conf -configure_logrotate() { - log "starting" - - local -r logrotate_conf_filename='/etc/logrotate.conf' - local -r logrotate_conf_file='# see "man logrotate" for details -# rotate log files weekly -weekly - -# keep 2 weeks worth of backlogs -rotate 2 - -# create new (empty) log files after rotating old ones -create - -# use date as a suffix of the rotated file -dateext - -# uncomment this if you want your log files compressed -compress - -# RPM packages drop log rotation information into this directory -include /etc/logrotate.d - -# no packages own wtmp and btmp -- we will rotate them here -/var/log/wtmp { - monthly - create 0664 root utmp - minsize 1M - rotate 1 -} - -/var/log/btmp { - missingok - monthly - create 0600 root utmp - rotate 1 -}' - - write_file logrotate_conf_filename logrotate_conf_file true -} - # create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file create_azure_rpm_repos() { log "starting" From 2f1d24b5a520a29cf16d193a8707cd92ddc42ac2 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Wed, 17 Apr 2024 15:22:10 -0400 Subject: [PATCH 18/38] WIP Move image pull function to common.sh --- pkg/deploy/generator/scripts/common.sh | 33 ++++++++++++++++++++++++++ pkg/deploy/generator/scripts/rpVMSS.sh | 33 -------------------------- 2 files changed, 33 insertions(+), 33 deletions(-) diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/common.sh index 25b249fee42..f7b95116aa8 100644 --- a/pkg/deploy/generator/scripts/common.sh +++ b/pkg/deploy/generator/scripts/common.sh @@ -156,3 +156,36 @@ include /etc/logrotate.d write_file logrotate_conf_filename logrotate_conf_file true } + +# pull_container_images +pull_container_images() { + local -n pull_images="$1" + log "starting" + + # The managed identity that the VM runs as only has a single roleassignment. + # This role assignment is ACRPull which is not necessarily present in the + # subscription we're deploying into. If the identity does not have any + # role assignments scoped on the subscription we're deploying into, it will + # not show on az login -i, which is why the below line is commented. + # az account set -s "$SUBSCRIPTIONID" + az login -i --allow-no-subscriptions + + # Suppress emulation output for podman instead of docker for az acr compatability + mkdir -p /etc/containers/ + mkdir -p /root/.docker + touch /etc/containers/nodocker + + # This name is used in the case that az acr login searches for this in it's environment + local -r REGISTRY_AUTH_FILE="/root/.docker/config.json" + + log "logging into prod acr" + az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" + + # shellcheck disable=SC2068 + for i in ${pull_images[@]}; do + log "Pulling image $i now" + podman pull "$i" + done + + az logout +} diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index e74da4d3fc9..eb45315853c 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -237,39 +237,6 @@ gpgcheck=no' write_file azure_repo_filename azure_repo_file true } -# pull_container_images -pull_container_images() { - local -n pull_images="$1" - log "starting" - - # The managed identity that the VM runs as only has a single roleassignment. - # This role assignment is ACRPull which is not necessarily present in the - # subscription we're deploying into. If the identity does not have any - # role assignments scoped on the subscription we're deploying into, it will - # not show on az login -i, which is why the below line is commented. - # az account set -s "$SUBSCRIPTIONID" - az login -i --allow-no-subscriptions - - # Suppress emulation output for podman instead of docker for az acr compatability - mkdir -p /etc/containers/ - mkdir -p /root/.docker - touch /etc/containers/nodocker - - # This name is used in the case that az acr login searches for this in it's environment - local -r REGISTRY_AUTH_FILE="/root/.docker/config.json" - - log "logging into prod acr" - az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" - - # shellcheck disable=SC2068 - for i in ${pull_images[@]}; do - log "Pulling image $i now" - podman pull "$i" - done - - az logout -} - # configure_system_services creates, configures, and enables the following systemd services and timers # services # fluentbit From 7aeda490a9ddfbdfd5efee2719c3bcf911b99461 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Wed, 17 Apr 2024 15:27:03 -0400 Subject: [PATCH 19/38] WIP move enable services to common.sh --- pkg/deploy/generator/scripts/common.sh | 13 +++++++ pkg/deploy/generator/scripts/rpVMSS.sh | 48 +++++++++++--------------- 2 files changed, 33 insertions(+), 28 deletions(-) diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/common.sh index f7b95116aa8..e7985a93017 100644 --- a/pkg/deploy/generator/scripts/common.sh +++ b/pkg/deploy/generator/scripts/common.sh @@ -189,3 +189,16 @@ pull_container_images() { az logout } + +# enable_services enables all services required for aro rp +enable_services() { + local -n services="$1" + log "starting" + + log "enabling aro services ${aro_services[*]}" + # shellcheck disable=SC2068 + for service in ${aro_services[@]}; do + log "Enabling $service now" + systemctl enable "$service.service" + done +} diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index eb45315853c..fcdbcafc921 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -78,7 +78,24 @@ main() { ) pull_container_images images - configure_system_services + configure_aro_services + + local -ra aro_services=( + "aro-dbtoken" + "aro-monitor" + "aro-portal" + "aro-rp" + "auoms" + "azsecd" + "azsecmond" + "mdsd" + "mdm" + "chronyd" + "fluentbit" + ) + + enable_services aro_services + reboot_vm } @@ -237,7 +254,7 @@ gpgcheck=no' write_file azure_repo_filename azure_repo_file true } -# configure_system_services creates, configures, and enables the following systemd services and timers +# configure_aro_services creates, configures, and enables the following systemd services and timers # services # fluentbit # mdm @@ -246,7 +263,7 @@ gpgcheck=no' # aro-dbtoken # aro-monitor # aro-portal -configure_system_services() { +configure_aro_services() { configure_service_fluentbit configure_service_mdm configure_timers_mdm_mdsd @@ -257,31 +274,6 @@ configure_system_services() { configure_service_mdsd } -# enable_aro_services enables all services required for aro rp -enable_aro_services() { - log "starting" - - local -ra aro_services=( - "aro-dbtoken" - "aro-monitor" - "aro-portal" - "aro-rp" - "auoms" - "azsecd" - "azsecmond" - "mdsd" - "mdm" - "chronyd" - "fluentbit" - ) - log "enabling aro services ${aro_services[*]}" - # shellcheck disable=SC2068 - for service in ${aro_services[@]}; do - log "Enabling $service now" - systemctl enable "$service.service" - done -} - # configure_service_fluentbit configure_service_fluentbit() { log "starting" From 6354b8e30217878834ef601f5c3f950fc35a4829 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Wed, 17 Apr 2024 15:27:50 -0400 Subject: [PATCH 20/38] WIP add write_file, reboot_vm, log, and abort to common.sh --- pkg/deploy/generator/scripts/common.sh | 42 ++++++++++++++++++++++++++ pkg/deploy/generator/scripts/rpVMSS.sh | 42 -------------------------- 2 files changed, 42 insertions(+), 42 deletions(-) diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/common.sh index e7985a93017..69ee2e6de02 100644 --- a/pkg/deploy/generator/scripts/common.sh +++ b/pkg/deploy/generator/scripts/common.sh @@ -202,3 +202,45 @@ enable_services() { systemctl enable "$service.service" done } + +# write_file +# Args +# 1) filename - string +# 2) file_contents - string +# 3) clobber - boolean; optional - defaults to false +write_file() { + local -n filename="$1" + local -n file_contents="$2" + local -r clobber="${3:-false}" + + if $clobber; then + log "Overwriting file $filename" + echo "$file_contents" > "$filename" + else + log "Appending to $filename" + echo "$file_contents" >> "$filename" + fi +} + +# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots +reboot_vm() { + log "starting" + + configure_selinux "true" + (sleep 30 && log "rebooting vm now"; reboot) & +} + +# log is a wrapper for echo that includes the function name +log() { + local -r msg="${1:-"log message is empty"}" + local -r stack_level="${2:-1}" + echo "${FUNCNAME[${stack_level}]}: ${msg}" +} + +# abort is a wrapper for log that exits with an error code +abort() { + local -ri origin_stacklevel=2 + log "${1}" "$origin_stacklevel" + log "Exiting" + exit 1 +} diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index fcdbcafc921..3d14e9173b6 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -905,48 +905,6 @@ run_azsecd_config_scan() { done } -# write_file -# Args -# 1) filename - string -# 2) file_contents - string -# 3) clobber - boolean; optional - defaults to false -write_file() { - local -n filename="$1" - local -n file_contents="$2" - local -r clobber="${3:-false}" - - if $clobber; then - log "Overwriting file $filename" - echo "$file_contents" > "$filename" - else - log "Appending to $filename" - echo "$file_contents" >> "$filename" - fi -} - -# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots -reboot_vm() { - log "starting" - - configure_selinux "true" - (sleep 30 && log "rebooting vm now"; reboot) & -} - -# log is a wrapper for echo that includes the function name -log() { - local -r msg="${1:-"log message is empty"}" - local -r stack_level="${2:-1}" - echo "${FUNCNAME[${stack_level}]}: ${msg}" -} - -# abort is a wrapper for log that exits with an error code -abort() { - local -ri origin_stacklevel=2 - log "${1}" "$origin_stacklevel" - log "Exiting" - exit 1 -} - export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}" main "$@" From d55340cca565d06cfe32dd4badbc19ee50692656 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Wed, 17 Apr 2024 15:29:26 -0400 Subject: [PATCH 21/38] WIP move dnf_install_pkgs to common.sh --- pkg/deploy/generator/scripts/common.sh | 15 +++++++++++++++ pkg/deploy/generator/scripts/rpVMSS.sh | 17 +---------------- 2 files changed, 16 insertions(+), 16 deletions(-) diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/common.sh index 69ee2e6de02..4d39f1dd291 100644 --- a/pkg/deploy/generator/scripts/common.sh +++ b/pkg/deploy/generator/scripts/common.sh @@ -19,6 +19,21 @@ retry() { done } +# dnf_install_pkgs +dnf_install_pkgs() { + local -n pkgs="$1" + log "starting" + + local -ra cmd=( + dnf + -y + install + ${pkgs[@]} + ) + + log "Attempting to install packages: ${pkgs[*]}" + retry cmd "$2" +} # We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work configure_sshd() { diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 3d14e9173b6..7696fc41900 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -173,6 +173,7 @@ parse_run_options() { exit 0 } +# configure_rpm_repos configure_rpm_repos() { log "starting" @@ -196,22 +197,6 @@ configure_rhui_repo() { retry cmd "$1" } -# dnf_install_pkgs -dnf_install_pkgs() { - local -n pkgs="$1" - log "starting" - - local -ra cmd=( - dnf - -y - install - ${pkgs[@]} - ) - - log "Attempting to install packages: ${pkgs[*]}" - retry cmd "$2" -} - # configure_disk_partitions configure_disk_partitions() { log "starting" From d4eac32c7ed64c0d6ec79959e1fca115c21a67d5 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Wed, 17 Apr 2024 16:39:04 -0400 Subject: [PATCH 22/38] WIP Fix parse_run_options to allow local testing --- pkg/deploy/generator/scripts/rpVMSS.sh | 98 +++++++++++++++++--------- 1 file changed, 63 insertions(+), 35 deletions(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 7696fc41900..1188757ed88 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -14,26 +14,16 @@ main() { # shellcheck source=common.sh source common.sh - parse_run_options "$@" - - - configure_sshd - configure_rpm_repos retry_wait_time - local -ar exclude_pkgs=( "-x WALinuxAgent" "-x WALinuxAgent-udev" ) - dnf_update_pkgs exclude_pkgs retry_wait_time - local -ra rpm_keys=( https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 https://packages.microsoft.com/keys/microsoft.asc ) - rpm_import_keys rpm_keys retry_wait_time - local -ra repo_rpm_pkgs=( https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm ) @@ -52,24 +42,6 @@ main() { python3 ) - dnf_install_pkgs repo_rpm_pkgs retry_wait_time - dnf_install_pkgs install_pkgs retry_wait_time - - configure_disk_partitions - configure_logrotate - configure_selinux - - mkdir -p /var/log/journal - mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store - - local -ra enable_ports=( - "443/tcp" - "444/tcp" - "445/tcp" - "2222/tcp" - ) - configure_firewalld_rules enable_ports - MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" local -ra images=( "$MDMIMAGE" @@ -77,8 +49,12 @@ main() { "$FLUENTBITIMAGE" ) - pull_container_images images - configure_aro_services + local -ra enable_ports=( + "443/tcp" + "444/tcp" + "445/tcp" + "2222/tcp" + ) local -ra aro_services=( "aro-dbtoken" @@ -94,6 +70,39 @@ main() { "fluentbit" ) + parse_run_options "$@" \ + retry_wait_time \ + exclude_pkgs \ + rpm_keys \ + repo_rpm_pkgs \ + install_pkgs \ + images \ + enable_ports \ + aro_services + + configure_sshd + configure_rpm_repos retry_wait_time + + dnf_update_pkgs exclude_pkgs retry_wait_time + + rpm_import_keys rpm_keys retry_wait_time + + dnf_install_pkgs repo_rpm_pkgs retry_wait_time + dnf_install_pkgs install_pkgs retry_wait_time + + configure_disk_partitions + configure_logrotate + configure_selinux + + mkdir -p /var/log/journal + mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store + + configure_firewalld_rules enable_ports + + pull_container_images images + configure_aro_services + enable_services + enable_services aro_services reboot_vm @@ -122,6 +131,15 @@ usage() { parse_run_options() { # shellcheck disable=SC2206 local -a options=(${1:-}) + local -n retry_time="$2" + local -n pkgs_to_exclude="$3" + local -n keys_to_import="$4" + local -n rpm_pkgs="$5" + local -n pkgs_to_install="$6" + local -n images_to_pull="$7" + local -n ports_to_enable="$8" + local -n services_to_enable="$9" + if [ "${#options[@]}" -eq 0 ]; then log "Running all steps" return 0 @@ -136,8 +154,17 @@ parse_run_options() { configure_disk_partitions ;; p) - log "Running step configure_and_install_dnf_pkgs_repos" - configure_and_install_dnf_pkgs_repos + log "Running step configure_rpm_repos" + configure_rpm_repos keys_to_import + + log "Running step dnf_update_pkgs" + dnf_update_pkgs pkgs_to_exclude retry_time + + log "Running step dnf_install_pkgs rpm_pkgs" + dnf_install_pkgs rpm_pkgs retry_time + + log "Running step dnf_install_pkgs pkgs" + dnf_install_pkgs pkgs_to_install retry_time ;; l) log "Running configure_logrotate" @@ -153,15 +180,16 @@ parse_run_options() { ;; f) log "Running configure_firewalld_rules" - configure_firewalld_rules + configure_firewalld_rules ports_to_enable ;; u) log "Running pull_container_images & configure_system_services" - configure_system_services + configure_aro_services + enable_services services_to_enable ;; i) log "Running pull_container_images" - pull_container_images + pull_container_images images_to_pull ;; *) usage allowed_options From c8639d31be7ded54af5c202ab395b5d2ae92940d Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Wed, 17 Apr 2024 16:40:52 -0400 Subject: [PATCH 23/38] WIP add -p to mkdir for mdsd.service.d to allow for existing directory --- pkg/deploy/generator/scripts/rpVMSS.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 1188757ed88..5012c8a9652 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -869,7 +869,7 @@ configure_service_mdsd() { log "starting" local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d" - mkdir "$mdsd_service_dir" + mkdir -p "$mdsd_service_dir" local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf" local -r mdsd_override_conf_file="[Unit] From e91476ad4e60d4a2984ea785838fd7d574be8f91 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Wed, 17 Apr 2024 16:43:54 -0400 Subject: [PATCH 24/38] WIP correct aro-portal.service, aro-rp.service and fluentbit.service file writing The config file was being written twice --- pkg/deploy/generator/scripts/rpVMSS.sh | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 5012c8a9652..e8cedfd1e25 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -371,7 +371,7 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target" - write_file fluentbit_conf_filename fluentbit_conf_file true + write_file fluentbit_service_filename fluentbit_service_file true } # configure_certs @@ -686,7 +686,7 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target" - write_file aro_rp_service_filename aro_rp_conf_file true + write_file aro_rp_service_filename aro_rp_service_file true } # configure_service_aro_dbtoken @@ -861,7 +861,7 @@ RestartSec=1 [Install] WantedBy=multi-user.target" - write_file aro_portal_service_conf_filename aro_portal_service_conf_file true + write_file aro_portal_service_filename aro_portal_service_file true } # configure_service_mdsd From 84cfcefa6ac3bc196902e50275216b21efffb955 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Wed, 17 Apr 2024 17:30:25 -0400 Subject: [PATCH 25/38] Rewrite devProxyVMSS.sh to reuse functions in common.sh --- pkg/deploy/assets/env-development.json | 2 +- pkg/deploy/assets/rp-production.json | 2 +- pkg/deploy/generator/scripts/common.sh | 38 ++- pkg/deploy/generator/scripts/devProxyVMSS.sh | 330 ++++--------------- pkg/deploy/generator/scripts/rpVMSS.sh | 24 +- 5 files changed, 103 insertions(+), 293 deletions(-) diff --git a/pkg/deploy/assets/env-development.json b/pkg/deploy/assets/env-development.json index 1da1cb9fb5b..af038e859b5 100644 --- a/pkg/deploy/assets/env-development.json +++ b/pkg/deploy/assets/env-development.json @@ -296,7 +296,7 @@ "autoUpgradeMinorVersion": true, "settings": {}, "protectedSettings": { - "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'PROXYIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImage')),''')\n','PROXYIMAGEAUTH=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImageAuth')),''')\n','PROXYCERT=''',parameters('proxyCert'),'''\n','PROXYCLIENTCERT=''',parameters('proxyClientCert'),'''\n','PROXYKEY=''',parameters('proxyKey'),'''\n','\n',base64ToString('#!/bin/bash

set -o errexit \
    -o nounset

if [ "${DEBUG:-false}" == true ]; then
    set -x
fi

main() {
    parse_run_options "$@"

    configure_and_install_dnf_pkgs_repos

    configure_firewalld_rules
    pull_container_images
    configure_system_services
    reboot_vm
}

usage() {
    local -n options="$1"
    log "$(basename "$0") [$options]
        -p Configure rpm repositories, import required rpm keys, update & install packages with dnf
        -f Configure firewalld default zone rules
        -u Configure systemd unit files for ARO RP
        -i Pull container images

        Note: steps will be executed in the order that flags are provided
    "
}

# parse_run_options takes all arguements passed to main and parses them
# allowing individual step(s) to be ran, rather than all steps
#
# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline
parse_run_options() {
    # shellcheck disable=SC2206
    local -a options=(${1:-})
    if [ "${#options[@]}" -eq 0 ]; then
        log "Running all steps"
        return 0
    fi

    local OPTIND
	local -r allowed_options="pfui"
    while getopts ${allowed_options} options; do
        case "${options}" in
            p)
                log "Running step configure_and_install_dnf_pkgs_repos"
                configure_and_install_dnf_pkgs_repos
                ;;
            f)
                log "Running configure_firewalld_rules"
                configure_firewalld_rules
                ;;
            u)
                log "Running pull_container_images & configure_system_services"
                configure_system_services
                ;;
            i)
                log "Running pull_container_images"
                pull_container_images 
                ;;
            *)
                usage allowed_options
                abort "Unkown option provided"
                ;;
        esac
    done
    
    exit 0
}

# configure_and_install_dnf_pkgs_repos
configure_and_install_dnf_pkgs_repos() {
    log "starting"

    # transaction attempt retry time in seconds
    local -ri retry_wait_time=60
    configure_rhui_repo retry_wait_time

    local -ar exclude_pkgs=(
        "-x WALinuxAgent"
        "-x WALinuxAgent-udev"
    )

    dnf_update_pkgs exclude_pkgs retry_wait_time

    local -ra repo_rpm_pkgs=(
        https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm
    )

    local -ra install_pkgs=(
        podman
        podman-docker
    )

    dnf_install_pkgs repo_rpm_pkgs retry_wait_time
    dnf_install_pkgs install_pkgs retry_wait_time

	local -r cron_weekly_dnf_update_filename='/etc/cron.weekly/dnfupdate'
	local -r cron_weekly_dnf_update_file="#!/bin/bash
dnf update -y"

	write_file cron_weekly_dnf_update_filename cron_weekly_dnf_update_file true
	chmod +x "$cron_weekly_dnf_update_filename"
}

# configure_rhui_repo
configure_rhui_repo() {
    log "starting"

    local -ra cmd=(
        dnf
        update
        -y
        --disablerepo='*'
        --enablerepo='rhui-microsoft-azure*'
    )

    log "running RHUI package updates"
    retry cmd "$1"
}

# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks
retry() {
    local -n cmd_retry="$1"
    local -n wait_time="$2"

    for attempt in {1..5}; do
        log "attempt #${attempt} - ${FUNCNAME[2]}"
        ${cmd_retry[@]} &

        wait $! && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep "$wait_time"
        else
            abort "attempt #${attempt} - Failed to update packages"
        fi
    done
}

# dnf_update_pkgs
dnf_update_pkgs() {
    local -n excludes="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        ${excludes[@]}
        update
        --allowerasing
    )

    log "Updating all packages"
    retry cmd "$2"
}

# dnf_install_pkgs
dnf_install_pkgs() {
    local -n pkgs="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        install
        ${pkgs[@]}
    )

    log "Attempting to install packages: ${pkgs[*]}"
    retry cmd "$2"
}

# configure_logrotate clobbers /etc/logrotate.conf
configure_logrotate() {
    log "starting"

    local -r logrotate_conf_filename='/etc/logrotate.conf'
    local -r logrotate_conf_file='# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we will rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}'

    write_file logrotate_conf_filename logrotate_conf_file true
}

# configure_firewalld_rules
configure_firewalld_rules() {
    log "starting"

    # https://access.redhat.com/security/cve/cve-2020-13401
    local -r prefix="/etc/sysctl.d"
    local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf"
    local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0"

    write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true

    local -r disable_core_filename="$prefix/01-disable-core.conf"
    local -r disable_core_file="kernel.core_pattern = |/bin/true
    "
    write_file disable_core_filename disable_core_file true

    sysctl --system

    local -ra enable_ports=(
        "443/tcp"
    )

    log "Enabling ports ${enable_ports[*]} on default firewalld zone"
    # shellcheck disable=SC2068
    for port in ${enable_ports[@]}; do
        log "Enabling port $port now"
        firewall-cmd "--add-port=$port"
    done

    firewall-cmd --runtime-to-permanent
}

# pull_container_images
pull_container_images() {
    log "starting"

    # The managed identity that the VM runs as only has a single roleassignment.
    # This role assignment is ACRPull which is not necessarily present in the
    # subscription we're deploying into.  If the identity does not have any
    # role assignments scoped on the subscription we're deploying into, it will
    # not show on az login -i, which is why the below line is commented.
    # az account set -s "$SUBSCRIPTIONID"
    az login -i --allow-no-subscriptions

    # Suppress emulation output for podman instead of docker for az acr compatability
    mkdir -p /etc/containers/
    mkdir -p /root/.docker
    touch /etc/containers/nodocker

	# This name is used in the case that az acr login searches for this in it's environment
    local -r REGISTRY_AUTH_FILE="/root/.docker/config.json"
	local -r registry_config_file="{
	"auths": {
		\"${PROXYIMAGE%%/*}\": {
			\"auth\": \"$PROXYIMAGEAUTH\"
		}
	}"

	write_file REGISTRY_AUTH_FILE registry_config_file true

    log "logging into prod acr"

    az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

    docker pull "$PROXYIMAGE"

    az logout
}

# configure_system_services creates, configures, and enables the following systemd services and timers
# services
#	proxy
configure_system_services() {
	configure_service_proxy
}

# enable_aro_services enables all services required for aro rp
enable_aro_services() {
    log "starting"

    local -ra aro_services=(
		proxy
    )
    log "enabling aro services ${aro_services[*]}"
    # shellcheck disable=SC2068
    for service in ${aro_services[@]}; do
        log "Enabling $service now"
        systemctl enable "$service.service"
    done
}

# configure_certs
configure_certs() {
    log "starting"

	base64 -d <<<"$PROXYCERT" >/etc/proxy/proxy.crt
	base64 -d <<<"$PROXYKEY" >/etc/proxy/proxy.key
	base64 -d <<<"$PROXYCLIENTCERT" >/etc/proxy/proxy-client.crt
	chown -R 1000:1000 /etc/proxy
	chmod 0600 /etc/proxy/proxy.key
}

configure_service_proxy() {
	local -r sysconfig_proxy_filename='/etc/sysconfig/proxy'
	local -r sysconfig_proxy_file="PROXY_IMAGE='$PROXYIMAGE'"

	write_file sysconfig_proxy_filename sysconfig_proxy_file true

	local -r proxy_service_filename='/etc/systemd/system/proxy.service'
	local -r proxy_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/proxy
ExecStartPre=-/usr/bin/docker rm -f %n
ExecStart=/usr/bin/docker run --rm --name %n -p 443:8443 -v /etc/proxy:/secrets $PROXY_IMAGE
ExecStop=/usr/bin/docker stop %n
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

	local -r cron_weekly_pull_image_filename='/etc/cron.weekly/pull-image'
	local -r cron_weekly_pull_image_file="#!/bin/bash
docker pull $PROXYIMAGE
systemctl restart proxy.service"
	
	write_file cron_weekly_pull_image_filename cron_weekly_pull_image_file true
	chmod +x "$cron_weekly_pull_image_filename"

	local -r cron_daily_restart_proxy_filename='/etc/cron.daily/restart-proxy'
	local -r cron_daily_restart_proxy_file="#!/bin/bash
systemctl restart proxy.service"
	
	write_file cron_daily_restart_proxy_filename cron_daily_restart_proxy_file
	chmod +x "$cron_daily_restart_proxy_filename"
}

# write_file
# Args
# 1) filename - string
# 2) file_contents - string
# 3) clobber - boolean; optional - defaults to false
write_file() {
    local -n filename="$1"
    local -n file_contents="$2"
    local -r clobber="${3:-false}"

    if $clobber; then
        log "Overwriting file $filename"
        echo "$file_contents" > "$filename"
    else
        log "Appending to $filename"
        echo "$file_contents" >> "$filename"
    fi
}

# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots
reboot_vm() {
    log "starting"

    configure_selinux "true"
    (sleep 30 && log "rebooting vm now"; reboot) &
}

# log is a wrapper for echo that includes the function name
log() {
    local -r msg="${1:-"log message is empty"}"
    local -r stack_level="${2:-1}"
    echo "${FUNCNAME[${stack_level}]}: ${msg}"
}

# abort is a wrapper for log that exits with an error code
abort() {
    local -ri origin_stacklevel=2
    log "${1}" "$origin_stacklevel"
    log "Exiting"
    exit 1
}

export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}"

main "$@"
')))]" + "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'PROXYIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImage')),''')\n','PROXYIMAGEAUTH=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImageAuth')),''')\n','PROXYCERT=''',parameters('proxyCert'),'''\n','PROXYCLIENTCERT=''',parameters('proxyClientCert'),'''\n','PROXYKEY=''',parameters('proxyKey'),'''\n','\n',base64ToString('IyEvYmluL2Jhc2gKCnNldCAtbyBlcnJleGl0IFwKICAgIC1vIG5vdW5zZXQKCmlmIFsgIiR7REVCVUc6LWZhbHNlfSIgPT0gdHJ1ZSBdOyB0aGVuCiAgICBzZXQgLXgKZmkKCm1haW4oKSB7CiAgICAjIHRyYW5zYWN0aW9uIGF0dGVtcHQgcmV0cnkgdGltZSBpbiBzZWNvbmRzCiAgICBsb2NhbCAtcmkgcmV0cnlfd2FpdF90aW1lPTYwCgogICAgIyBzaGVsbGNoZWNrIHNvdXJjZT1jb21tb24uc2gKICAgIHNvdXJjZSBjb21tb24uc2gKCiAgICBsb2NhbCAtcmEgZW5hYmxlX3BvcnRzPSgKICAgICAgICAiNDQzL3RjcCIKICAgICkKCiAgICBsb2NhbCBwcm94eV9pbWFnZT0iJFBST1hZSU1BR0UiCglsb2NhbCAtciByZWdpc3RyeV9jb25maWdfZmlsZT0iewogICAgXCJhdXRoc1wiOiB7CiAgICAgICAgXCIke1BST1hZSU1BR0UlJS8qfVwiOiB7CiAgICAgICAgICAgIFwiYXV0aFwiOiBcIiRQUk9YWUlNQUdFQVVUSFwiCiAgICAgICAgfQogICAgfSIKCiAgICBsb2NhbCAtYXIgZXhjbHVkZV9wa2dzPSgKICAgICAgICAiLXggV0FMaW51eEFnZW50IgogICAgICAgICIteCBXQUxpbnV4QWdlbnQtdWRldiIKICAgICkKCiAgICBsb2NhbCAtcmEgaW5zdGFsbF9wa2dzPSgKICAgICAgICBwb2RtYW4KICAgICAgICBwb2RtYW4tZG9ja2VyCiAgICApCgogICAgbG9jYWwgLXJhIHByb3h5X3NlcnZpY2VzPSgKCQlwcm94eQogICAgKQoKICAgIHBhcnNlX3J1bl9vcHRpb25zICIkQCIKCiAgICBkbmZfdXBkYXRlX3BrZ3MgcGtnc190b19leGNsdWRlIHJldHJ5X3dhaXRfdGltZQogICAgZG5mX2luc3RhbGxfcGtncyBpbnN0YWxsX3BrZ3MgcmV0cnlfd2FpdF90aW1lCiAgICBjb25maWd1cmVfZG5mX2Nyb25fam9iCgogICAgY29uZmlndXJlX2ZpcmV3YWxsZF9ydWxlcyBlbmFibGVfcG9ydHMKICAgIHB1bGxfY29udGFpbmVyX2ltYWdlcyBwcm94eV9pbWFnZSByZWdpc3RyeV9jb25maWdfZmlsZQogICAgY29uZmlndXJlX2RldnByb3h5X3NlcnZpY2VzCiAgICBlbmFibGVfc2VydmljZXMgcHJveHlfc2VydmljZXMKICAgIHJlYm9vdF92bQp9Cgp1c2FnZSgpIHsKICAgIGxvY2FsIC1uIG9wdGlvbnM9IiQxIgogICAgbG9nICIkKGJhc2VuYW1lICIkMCIpIFskb3B0aW9uc10KICAgICAgICAtcCBDb25maWd1cmUgcnBtIHJlcG9zaXRvcmllcywgaW1wb3J0IHJlcXVpcmVkIHJwbSBrZXlzLCB1cGRhdGUgJiBpbnN0YWxsIHBhY2thZ2VzIHdpdGggZG5mCiAgICAgICAgLWYgQ29uZmlndXJlIGZpcmV3YWxsZCBkZWZhdWx0IHpvbmUgcnVsZXMKICAgICAgICAtdSBDb25maWd1cmUgc3lzdGVtZCB1bml0IGZpbGVzCiAgICAgICAgLWkgUHVsbCBjb250YWluZXIgaW1hZ2VzCgogICAgICAgIE5vdGU6IHN0ZXBzIHdpbGwgYmUgZXhlY3V0ZWQgaW4gdGhlIG9yZGVyIHRoYXQgZmxhZ3MgYXJlIHByb3ZpZGVkCiAgICAiCn0KCiMgcGFyc2VfcnVuX29wdGlvbnMgdGFrZXMgYWxsIGFyZ3VlbWVudHMgcGFzc2VkIHRvIG1haW4gYW5kIHBhcnNlcyB0aGVtCiMgYWxsb3dpbmcgaW5kaXZpZHVhbCBzdGVwKHMpIHRvIGJlIHJhbiwgcmF0aGVyIHRoYW4gYWxsIHN0ZXBzCiMKIyBUaGlzIGlzIHVzZWZ1bCBmb3IgbG9jYWwgdGVzdGluZywgb3IgcG9zc2libHkgbW9kaWZ5aW5nIHRoZSBib290c3RyYXAgZXhlY3V0aW9uIHZpYSBlbnZpcm9ubWVudCB2YXJpYWJsZXMgaW4gdGhlIGRlcGxveW1lbnQgcGlwZWxpbmUKcGFyc2VfcnVuX29wdGlvbnMoKSB7CiAgICAjIHNoZWxsY2hlY2sgZGlzYWJsZT1TQzIyMDYKICAgIGxvY2FsIC1hIG9wdGlvbnM9KCR7MTotfSkKICAgIGxvY2FsIC1uIHBrZ3NfdG9fZXhjbHVkZT0iJDIiCiAgICBsb2NhbCAtbiBwa2dzX3RvX2luc3RhbGw9IiQzIgogICAgbG9jYWwgLW4gcG9ydHNfdG9fZW5hYmxlPSIkNCIKICAgIGxvY2FsIC1uIHNlcnZpY2VzX3RvX2VuYWJsZT0iJDUiCiAgICBsb2NhbCAtbiBpbWFnZXNfdG9fcHVsbD0iJDYiCgogICAgaWYgWyAiJHsjb3B0aW9uc1tAXX0iIC1lcSAwIF07IHRoZW4KICAgICAgICBsb2cgIlJ1bm5pbmcgYWxsIHN0ZXBzIgogICAgICAgIHJldHVybiAwCiAgICBmaQoKICAgIGxvY2FsIE9QVElORAoJbG9jYWwgLXIgYWxsb3dlZF9vcHRpb25zPSJwZnVpIgogICAgd2hpbGUgZ2V0b3B0cyAke2FsbG93ZWRfb3B0aW9uc30gb3B0aW9uczsgZG8KICAgICAgICBjYXNlICIke29wdGlvbnN9IiBpbgogICAgICAgICAgICBwKQogICAgICAgICAgICAgICAgbG9nICJSdW5uaW5nIHN0ZXAgZG5mX3VwZGF0ZV9wa2dzIgogICAgICAgICAgICAgICAgZG5mX3VwZGF0ZV9wa2dzIHBrZ3NfdG9fZXhjbHVkZSByZXRyeV93YWl0X3RpbWUKCiAgICAgICAgICAgICAgICBsb2cgIlJ1bm5pbmcgc3RlcCBkbmZfaW5zdGFsbF9wa2dzIgogICAgICAgICAgICAgICAgZG5mX2luc3RhbGxfcGtncyBwa2dzX3RvX2luc3RhbGwgcmV0cnlfd2FpdF90aW1lCgogICAgICAgICAgICAgICAgbG9nICJSdW5uaW5nIHN0ZXAgY29uZmlndXJlX2RuZl9jcm9uX2pvYiIKICAgICAgICAgICAgICAgIGNvbmZpZ3VyZV9kbmZfY3Jvbl9qb2IKICAgICAgICAgICAgICAgIDs7CiAgICAgICAgICAgIGYpCiAgICAgICAgICAgICAgICBsb2cgIlJ1bm5pbmcgY29uZmlndXJlX2ZpcmV3YWxsZF9ydWxlcyIKICAgICAgICAgICAgICAgIGNvbmZpZ3VyZV9maXJld2FsbGRfcnVsZXMgcG9ydHNfdG9fZW5hYmxlCiAgICAgICAgICAgICAgICA7OwogICAgICAgICAgICB1KQogICAgICAgICAgICAgICAgbG9nICJSdW5uaW5nIHN0ZXAgY29uZmlndXJlX2RldnByb3h5X3NlcnZpY2VzIgogICAgICAgICAgICAgICAgY29uZmlndXJlX2RldnByb3h5X3NlcnZpY2VzCiAgICAgICAgICAgICAgICBlbmFibGVfc2VydmljZXMgc2VydmljZXNfdG9fZW5hYmxlCiAgICAgICAgICAgICAgICA7OwogICAgICAgICAgICBpKQogICAgICAgICAgICAgICAgbG9nICJSdW5uaW5nIHB1bGxfY29udGFpbmVyX2ltYWdlcyIKICAgICAgICAgICAgICAgIHB1bGxfY29udGFpbmVyX2ltYWdlcyBpbWFnZXNfdG9fcHVsbAogICAgICAgICAgICAgICAgOzsKICAgICAgICAgICAgKikKICAgICAgICAgICAgICAgIHVzYWdlIGFsbG93ZWRfb3B0aW9ucwogICAgICAgICAgICAgICAgYWJvcnQgIlVua293biBvcHRpb24gcHJvdmlkZWQiCiAgICAgICAgICAgICAgICA7OwogICAgICAgIGVzYWMKICAgIGRvbmUKICAgIAogICAgZXhpdCAwCn0KCiMgY29uZmlndXJlX3N5c3RlbV9zZXJ2aWNlcyBjcmVhdGVzLCBjb25maWd1cmVzLCBhbmQgZW5hYmxlcyB0aGUgZm9sbG93aW5nIHN5c3RlbWQgc2VydmljZXMgYW5kIHRpbWVycwojIHNlcnZpY2VzCiMJcHJveHkKY29uZmlndXJlX2RldnByb3h5X3NlcnZpY2VzKCkgewoJY29uZmlndXJlX3NlcnZpY2VfcHJveHkKfQoKIyBlbmFibGVfYXJvX3NlcnZpY2VzIGVuYWJsZXMgYWxsIHNlcnZpY2VzIHJlcXVpcmVkIGZvciBhcm8gcnAKZW5hYmxlX2Fyb19zZXJ2aWNlcygpIHsKICAgIGxvZyAic3RhcnRpbmciCgogICAgbG9nICJlbmFibGluZyBhcm8gc2VydmljZXMgJHthcm9fc2VydmljZXNbKl19IgogICAgIyBzaGVsbGNoZWNrIGRpc2FibGU9U0MyMDY4CiAgICBmb3Igc2VydmljZSBpbiAke2Fyb19zZXJ2aWNlc1tAXX07IGRvCiAgICAgICAgbG9nICJFbmFibGluZyAkc2VydmljZSBub3ciCiAgICAgICAgc3lzdGVtY3RsIGVuYWJsZSAiJHNlcnZpY2Uuc2VydmljZSIKICAgIGRvbmUKfQoKIyBjb25maWd1cmVfY2VydHMKY29uZmlndXJlX2NlcnRzKCkgewogICAgbG9nICJzdGFydGluZyIKCgliYXNlNjQgLWQgPDw8IiRQUk9YWUNFUlQiID4vZXRjL3Byb3h5L3Byb3h5LmNydAoJYmFzZTY0IC1kIDw8PCIkUFJPWFlLRVkiID4vZXRjL3Byb3h5L3Byb3h5LmtleQoJYmFzZTY0IC1kIDw8PCIkUFJPWFlDTElFTlRDRVJUIiA+L2V0Yy9wcm94eS9wcm94eS1jbGllbnQuY3J0CgljaG93biAtUiAxMDAwOjEwMDAgL2V0Yy9wcm94eQoJY2htb2QgMDYwMCAvZXRjL3Byb3h5L3Byb3h5LmtleQp9Cgpjb25maWd1cmVfc2VydmljZV9wcm94eSgpIHsKCWxvY2FsIC1yIHN5c2NvbmZpZ19wcm94eV9maWxlbmFtZT0nL2V0Yy9zeXNjb25maWcvcHJveHknCglsb2NhbCAtciBzeXNjb25maWdfcHJveHlfZmlsZT0iUFJPWFlfSU1BR0U9JyRQUk9YWUlNQUdFJyIKCgl3cml0ZV9maWxlIHN5c2NvbmZpZ19wcm94eV9maWxlbmFtZSBzeXNjb25maWdfcHJveHlfZmlsZSB0cnVlCgoJbG9jYWwgLXIgcHJveHlfc2VydmljZV9maWxlbmFtZT0nL2V0Yy9zeXN0ZW1kL3N5c3RlbS9wcm94eS5zZXJ2aWNlJwoJbG9jYWwgLXIgcHJveHlfc2VydmljZV9maWxlPSJbVW5pdF0KQWZ0ZXI9bmV0d29yay1vbmxpbmUudGFyZ2V0CldhbnRzPW5ldHdvcmstb25saW5lLnRhcmdldAoKW1NlcnZpY2VdCkVudmlyb25tZW50RmlsZT0vZXRjL3N5c2NvbmZpZy9wcm94eQpFeGVjU3RhcnRQcmU9LS91c3IvYmluL2RvY2tlciBybSAtZiAlbgpFeGVjU3RhcnQ9L3Vzci9iaW4vZG9ja2VyIHJ1biAtLXJtIC0tbmFtZSAlbiAtcCA0NDM6ODQ0MyAtdiAvZXRjL3Byb3h5Oi9zZWNyZXRzICRQUk9YWV9JTUFHRQpFeGVjU3RvcD0vdXNyL2Jpbi9kb2NrZXIgc3RvcCAlbgpSZXN0YXJ0PWFsd2F5cwpSZXN0YXJ0U2VjPTEKU3RhcnRMaW1pdEludGVydmFsPTAKCltJbnN0YWxsXQpXYW50ZWRCeT1tdWx0aS11c2VyLnRhcmdldCIKCglsb2NhbCAtciBjcm9uX3dlZWtseV9wdWxsX2ltYWdlX2ZpbGVuYW1lPScvZXRjL2Nyb24ud2Vla2x5L3B1bGwtaW1hZ2UnCglsb2NhbCAtciBjcm9uX3dlZWtseV9wdWxsX2ltYWdlX2ZpbGU9IiMhL2Jpbi9iYXNoCmRvY2tlciBwdWxsICRQUk9YWUlNQUdFCnN5c3RlbWN0bCByZXN0YXJ0IHByb3h5LnNlcnZpY2UiCgkKCXdyaXRlX2ZpbGUgY3Jvbl93ZWVrbHlfcHVsbF9pbWFnZV9maWxlbmFtZSBjcm9uX3dlZWtseV9wdWxsX2ltYWdlX2ZpbGUgdHJ1ZQoJY2htb2QgK3ggIiRjcm9uX3dlZWtseV9wdWxsX2ltYWdlX2ZpbGVuYW1lIgoKCWxvY2FsIC1yIGNyb25fZGFpbHlfcmVzdGFydF9wcm94eV9maWxlbmFtZT0nL2V0Yy9jcm9uLmRhaWx5L3Jlc3RhcnQtcHJveHknCglsb2NhbCAtciBjcm9uX2RhaWx5X3Jlc3RhcnRfcHJveHlfZmlsZT0iIyEvYmluL2Jhc2gKc3lzdGVtY3RsIHJlc3RhcnQgcHJveHkuc2VydmljZSIKCQoJd3JpdGVfZmlsZSBjcm9uX2RhaWx5X3Jlc3RhcnRfcHJveHlfZmlsZW5hbWUgY3Jvbl9kYWlseV9yZXN0YXJ0X3Byb3h5X2ZpbGUKCWNobW9kICt4ICIkY3Jvbl9kYWlseV9yZXN0YXJ0X3Byb3h5X2ZpbGVuYW1lIgp9CgpleHBvcnQgQVpVUkVfQ0xPVURfTkFNRT0iJHtBWlVSRUNMT1VETkFNRTo/IkZhaWxlZCB0byBjYXJyeSBvdmVyIHZhcmlhYmxlcyJ9IgoKbWFpbiAiJEAiCg==')))]" }, "provisionAfterExtensions": [ "Microsoft.Azure.Monitor.AzureMonitorLinuxAgent", diff --git a/pkg/deploy/assets/rp-production.json b/pkg/deploy/assets/rp-production.json index 99f72f4d6ff..19c4eed5edc 100644 --- a/pkg/deploy/assets/rp-production.json +++ b/pkg/deploy/assets/rp-production.json @@ -516,7 +516,7 @@ "autoUpgradeMinorVersion": true, "settings": {}, "protectedSettings": { - "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','ADMINAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('adminApiClientCertCommonName')),''')\n','ARMAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armApiClientCertCommonName')),''')\n','ARMCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armClientId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','BILLINGE2ESTORAGEACCOUNTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('billingE2EStorageAccountId')),''')\n','CLUSTERMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdmAccount')),''')\n','CLUSTERMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdAccount')),''')\n','CLUSTERMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdConfigVersion')),''')\n','CLUSTERMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdNamespace')),''')\n','CLUSTERPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterParentDomainName')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','FPCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpClientId')),''')\n','FPSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpServicePrincipalId')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYRESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayResourceGroupName')),''')\n','GATEWAYSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayServicePrincipalId')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','PORTALACCESSGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalAccessGroupIds')),''')\n','PORTALCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalClientId')),''')\n','PORTALELEVATEDGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalElevatedGroupIds')),''')\n','RPFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpFeatures')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdConfigVersion')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','RPPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpParentDomainName')),''')\n','CLUSTERSINSTALLVIAHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersInstallViaHive')),''')\n','CLUSTERSADOPTBYHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersAdoptByHive')),''')\n','CLUSTERDEFAULTINSTALLERPULLSPEC=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterDefaultInstallerPullspec')),''')\n','USECHECKACCESS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('useCheckAccess')),''')\n','ADMINAPICABUNDLE=''',parameters('adminApiCaBundle'),'''\n','ARMAPICABUNDLE=''',parameters('armApiCaBundle'),'''\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

set -o errexit \
    -o nounset

if [ "${DEBUG:-false}" == true ]; then
    set -x
fi

main() {
    parse_run_options "$@"


    configure_sshd
    configure_and_install_dnf_pkgs_repos
    configure_disk_partitions
    configure_logrotate
    configure_selinux

    mkdir -p /var/log/journal
    mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

    configure_firewalld_rules
    pull_container_images
    configure_system_services
    reboot_vm
}

usage() {
    local -n options="$1"
    log "$(basename "$0") [$options]
        -d Configure Disk Partitions
        -p Configure rpm repositories, import required rpm keys, update & install packages with dnf
        -l Configure logrotate.conf
        -s Make selinux modifications required for ARO RP
        -r Configure sshd - Allow password authenticaiton
        -f Configure firewalld default zone rules
        -u Configure systemd unit files for ARO RP
        -i Pull container images

        Note: steps will be executed in the order that flags are provided
    "
}

# parse_run_options takes all arguements passed to main and parses them
# allowing individual step(s) to be ran, rather than all steps
#
# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline
parse_run_options() {
    # shellcheck disable=SC2206
    local -a options=(${1:-})
    if [ "${#options[@]}" -eq 0 ]; then
        log "Running all steps"
        return 0
    fi

    local OPTIND
    local -r allowed_options="dplsrfui"
    while getopts ${allowed_options} options; do
        case "${options}" in
            d)
                log "Running step configure_disk_partitions"
                configure_disk_partitions
                ;;
            p)
                log "Running step configure_and_install_dnf_pkgs_repos"
                configure_and_install_dnf_pkgs_repos
                ;;
            l)
                log "Running configure_logrotate"
                configure_logrotate
                ;;
            s)
                log "Running configure_selinux"
                configure_selinux
                ;;
            r)
                log "Running configure_sshd"
                configure_sshd
                ;;
            f)
                log "Running configure_firewalld_rules"
                configure_firewalld_rules
                ;;
            u)
                log "Running pull_container_images & configure_system_services"
                configure_system_services
                ;;
            i)
                log "Running pull_container_images"
                pull_container_images 
                ;;
            *)
                usage allowed_options
                abort "Unkown option provided"
                ;;
        esac
    done
    
    exit 0
}

# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work
configure_sshd() {
    log "starting"
    log "setting ssh password authentication"
    sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config

    systemctl reload sshd.service
    systemctl is-active --quiet sshd || abort "sshd failed to reload"
}

# configure_and_install_dnf_pkgs_repos
configure_and_install_dnf_pkgs_repos() {
    log "starting"

    # transaction attempt retry time in seconds
    local -ri retry_wait_time=60
    configure_rhui_repo retry_wait_time
    create_azure_rpm_repos retry_wait_time

    local -ar exclude_pkgs=(
        "-x WALinuxAgent"
        "-x WALinuxAgent-udev"
    )

    dnf_update_pkgs exclude_pkgs retry_wait_time

    local -ra rpm_keys=(
        https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
        https://packages.microsoft.com/keys/microsoft.asc
    )

    rpm_import_keys rpm_keys retry_wait_time

    local -ra repo_rpm_pkgs=(
        https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm
    )

    local -ra install_pkgs=(
        clamav
        azsec-clamav
        azsec-monitor
        azure-cli
        azure-mdsd
        azure-security
        podman
        podman-docker
        openssl-perl
        # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
        python3
    )

    dnf_install_pkgs repo_rpm_pkgs retry_wait_time
    dnf_install_pkgs install_pkgs retry_wait_time
}

# configure_rhui_repo
configure_rhui_repo() {
    log "starting"

    local -ra cmd=(
        dnf
        update
        -y
        --disablerepo='*'
        --enablerepo='rhui-microsoft-azure*'
    )

    log "running RHUI package updates"
    retry cmd "$1"
}

# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks
retry() {
    local -n cmd_retry="$1"
    local -n wait_time="$2"

    for attempt in {1..5}; do
        log "attempt #${attempt} - ${FUNCNAME[2]}"
        ${cmd_retry[@]} &

        wait $! && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep "$wait_time"
        else
            abort "attempt #${attempt} - Failed to update packages"
        fi
    done
}

# dnf_update_pkgs
dnf_update_pkgs() {
    local -n excludes="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        ${excludes[@]}
        update
        --allowerasing
    )

    log "Updating all packages"
    retry cmd "$2"
}

# dnf_install_pkgs
dnf_install_pkgs() {
    local -n pkgs="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        install
        ${pkgs[@]}
    )

    log "Attempting to install packages: ${pkgs[*]}"
    retry cmd "$2"
}

# rpm_import_keys
rpm_import_keys() {
    local -n keys="$1"
    log "starting"


    # shellcheck disable=SC2068
    for key in ${keys[@]}; do
        if [ ${#keys[@]} -eq 0 ]; then
            break
        fi
            local -a cmd=(
                rpm
                --import
                -v
                "$key"
            )

            log "attempt #$attempt - importing rpm repository key $key"
            retry cmd "$2" && unset key
    done
}

# configure_disk_partitions
configure_disk_partitions() {
    log "starting"
    log "extending partition table"

    # Linux block devices are inconsistently named
    # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
    physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
    growpart "$physical_disk" 2

    log "extending filesystems"
    log "extending root lvm"
    lvextend -l +20%FREE /dev/rootvg/rootlv
    log "growing root filesystem"
    xfs_growfs /

    log "extending var lvm"
    lvextend -l +100%FREE /dev/rootvg/varlv
    log "growing var filesystem"
    xfs_growfs /var
}

# configure_logrotate clobbers /etc/logrotate.conf
configure_logrotate() {
    log "starting"

    local -r logrotate_conf_filename='/etc/logrotate.conf'
    local -r logrotate_conf_file='# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we will rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}'

    write_file logrotate_conf_filename logrotate_conf_file true
}

# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file
create_azure_rpm_repos() {
    log "starting"

    local -r azure_repo_filename='/etc/yum.repos.d/azure.repo'
    local -r azure_repo_file='[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no'

    write_file azure_repo_filename azure_repo_file true
}

# configure_selinux
configure_selinux() {
    log "starting"

    local -r relabel="${1:-false}"

    already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined"
    semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error"
    chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent

    if "$relabel"; then
        restorecon -RF /var/log/* || log "$already_defined_ignore_error"
    fi
}

# configure_firewalld_rules
configure_firewalld_rules() {
    log "starting"

    # https://access.redhat.com/security/cve/cve-2020-13401
    local -r prefix="/etc/sysctl.d"
    local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf"
    local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0"

    write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true

    local -r disable_core_filename="$prefix/01-disable-core.conf"
    local -r disable_core_file="kernel.core_pattern = |/bin/true
    "
    write_file disable_core_filename disable_core_file true

    sysctl --system

    local -ra enable_ports=(
        "443/tcp"
        "444/tcp"
        "445/tcp"
        "2222/tcp"
    )

    log "Enabling ports ${enable_ports[*]} on default firewalld zone"
    # shellcheck disable=SC2068
    for port in ${enable_ports[@]}; do
        log "Enabling port $port now"
        firewall-cmd "--add-port=$port"
    done

    firewall-cmd --runtime-to-permanent
}

# pull_container_images
pull_container_images() {
    log "starting"

    # The managed identity that the VM runs as only has a single roleassignment.
    # This role assignment is ACRPull which is not necessarily present in the
    # subscription we're deploying into.  If the identity does not have any
    # role assignments scoped on the subscription we're deploying into, it will
    # not show on az login -i, which is why the below line is commented.
    # az account set -s "$SUBSCRIPTIONID"
    az login -i --allow-no-subscriptions

    # Suppress emulation output for podman instead of docker for az acr compatability
    mkdir -p /etc/containers/
    mkdir -p /root/.docker
    touch /etc/containers/nodocker

	# This name is used in the case that az acr login searches for this in it's environment
    local -r REGISTRY_AUTH_FILE="/root/.docker/config.json"
    
    log "logging into prod acr"
    az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

    MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
    docker pull "$MDMIMAGE"
    docker pull "$RPIMAGE"
    docker pull "$FLUENTBITIMAGE"

    az logout
}

# configure_system_services creates, configures, and enables the following systemd services and timers
# services
#   fluentbit
#   mdm
#   mdsd
#   arp-rp
#   aro-dbtoken
#   aro-monitor
#   aro-portal
configure_system_services() {
    configure_service_fluentbit
    configure_service_mdm
    configure_timers_mdm_mdsd
    configure_service_aro_rp
    configure_service_aro_dbtoken
    configure_service_aro_monitor
    configure_service_aro_portal
    configure_service_mdsd
}

# enable_aro_services enables all services required for aro rp
enable_aro_services() {
    log "starting"

    local -ra aro_services=(
        "aro-dbtoken"
        "aro-monitor"
        "aro-portal"
        "aro-rp"
        "auoms"
        "azsecd"
        "azsecmond"
        "mdsd"
        "mdm"
        "chronyd"
        "fluentbit"
    )
    log "enabling aro services ${aro_services[*]}"
    # shellcheck disable=SC2068
    for service in ${aro_services[@]}; do
        log "Enabling $service now"
        systemctl enable "$service.service"
    done
}

# configure_service_fluentbit
configure_service_fluentbit() {
    log "starting"
    log "configuring fluentbit service"

    mkdir -p /etc/fluentbit/
    mkdir -p /var/lib/fluent

    local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf'
    local -r fluentbit_conf_file="[INPUT]
Name systemd
Tag journald
Systemd_Filter _COMM=aro
DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND asyncqos asyncqos true

[FILTER]
	Name modify
	Match asyncqos
	Remove CLIENT_PRINCIPAL_NAME
	Remove FILE
	Remove COMPONENT

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND ifxaudit ifxaudit false

[OUTPUT]
	Name forward
	Match *
	Port 29230"

    write_file fluentbit_conf_filename fluentbit_conf_file true

    local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit'
    local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE"

    write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true

    local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service'

    local -r fluentbit_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file fluentbit_conf_filename fluentbit_conf_file true
}

# configure_certs
configure_certs() {
    log "starting"

    mkdir /etc/aro-rp
    base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem
    if [[ -n "$ARMAPICABUNDLE" ]]; then
    base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem
    fi
    chown -R 1000:1000 /etc/aro-rp

    # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
    # to honour SSL_CERT_FILE any more, heaven only knows why.
    mkdir -p /usr/lib/ssl/certs
    csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null
    c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
    local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config"
    local -r nodescan_agent_file="{
    \"Nice\": 19,
    \"Timeout\": 10800,
    \"ClientId\": \"\",
    \"TenantId\": $AZURESECPACKVSATENANTID,
    \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL,
    \"ProcessTimeout\": 300,
    \"CommandDelay\": 0
  }"

    write_file nodescan_agent_filename nodescan_agent_file true
}

# configure_service_mdm
configure_service_mdm() {
    log "starting"
    log "configuring mdm service"

    local -r sysconfig_mdm_filename="/etc/sysconfig/mdm"
    local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=rp
MDMSOURCEROLEINSTANCE=\"$(hostname)\""

    write_file sysconfig_mdm_filename sysconfig_mdm_file true

    mkdir -p /var/etw
    local -r mdm_service_filename="/etc/systemd/system/mdm.service"
    local -r mdm_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file mdm_service_filename mdm_service_file true
}

# configure_timers_mdm_mdsd
configure_timers_mdm_mdsd() {
    log "starting"

    for var in "mdsd" "mdm"; do
        local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service"
        local download_creds_service_file="[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var"

        write_file download_creds_service_filename download_creds_service_file true

        local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer"
        local download_creds_timer_file="[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target"

        write_file download_creds_timer_filename download_creds_timer_file true
    done

    local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh"
    local -r download_creds_script_file="#!/bin/bash
set -eu

COMPONENT=\$1
echo \"Download \$COMPONENT credentials\"

TEMP_DIR=\"\$(mktemp -d)\"
export AZURE_CONFIG_DIR=\"\$(mktemp -d)\"

echo \"Logging into Azure...\"
RETRIES=3
while [[ \$RETRIES -gt 0 ]]; do
    if az login -i --allow-no-subscriptions
    then
        echo \"az login successful\"
        break
    else
        echo \"az login failed. Retrying...\"
        let RETRIES-=1
        sleep 5
    fi
done

trap \"cleanup\" EXIT

cleanup() {
  az logout
  [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [[ \$COMPONENT = \"mdm\" ]]; then
  CURRENT_CERT_FILE=\"/etc/mdm.pem\"
elif [[ \$COMPONENT\ = \"mdsd\" ]]; then
  CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME=\"rp-\${COMPONENT}\"
NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\"
for attempt in {1..5}; do
  az keyvault \
    secret \
    download \
    --file \"\$NEW_CERT_FILE\" \
    --id \"https://$KEYVAULTPREFIX-svc.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \
    && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [[ \$COMPONENT = \"mdsd\" ]]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi"

    write_file download_creds_script_filename download_creds_script_file true

    chmod u+x /usr/local/bin/download-credentials.sh

    systemctl enable download-mdsd-credentials.timer
    systemctl enable download-mdm-credentials.timer

    /usr/local/bin/download-credentials.sh mdsd
    /usr/local/bin/download-credentials.sh mdm

    local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')"
    local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service"
    local -r watch_mdm_creds_service_file="[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target"

    write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file true

    local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path'
    local -r watch_mdm_creds_path_file='[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target'

    write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file true

    local -r watch_mdm_creds='watch-mdm-credentials.path'
    systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds"
    systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds"
}

# configure_service_aro_rp
configure_service_aro_rp() {
    log "starting"

    local -r aro_rp_conf_filename='/etc/sysconfig/aro-rp'
    local -r aro_rp_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID'
ADMIN_API_CLIENT_CERT_COMMON_NAME='$ADMINAPICLIENTCERTCOMMONNAME'
ARM_API_CLIENT_CERT_COMMON_NAME='$ARMAPICLIENTCERTCOMMONNAME'
AZURE_ARM_CLIENT_ID='$ARMCLIENTID'
AZURE_FP_CLIENT_ID='$FPCLIENTID'
AZURE_FP_SERVICE_PRINCIPAL_ID='$FPSERVICEPRINCIPALID'
BILLING_E2E_STORAGE_ACCOUNT_ID='$BILLINGE2ESTORAGEACCOUNTID'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=RP
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=RP
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
RP_FEATURES='$RPFEATURES'
RPIMAGE='$RPIMAGE'
ARO_INSTALL_VIA_HIVE='$CLUSTERSINSTALLVIAHIVE'
ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC='$CLUSTERDEFAULTINSTALLERPULLSPEC'
ARO_ADOPT_BY_HIVE='$CLUSTERSADOPTBYHIVE'
USE_CHECKACCESS='$USECHECKACCESS'"

    write_file aro_rp_conf_filename aro_rp_conf_file true

    local -r aro_rp_service_filename='/etc/systemd/system/aro-rp.service'
    local -r aro_rp_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-rp
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e ADMIN_API_CLIENT_CERT_COMMON_NAME \
  -e ARM_API_CLIENT_CERT_COMMON_NAME \
  -e AZURE_ARM_CLIENT_ID \
  -e AZURE_FP_CLIENT_ID \
  -e BILLING_E2E_STORAGE_ACCOUNT_ID \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e CLUSTER_MDSD_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e DOMAIN_NAME \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e MDSD_ENVIRONMENT \
  -e RP_FEATURES \
  -e ARO_INSTALL_VIA_HIVE \
  -e ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC \
  -e ARO_ADOPT_BY_HIVE \
  -e USE_CHECKACCESS \
  -m 2g \
  -p 443:8443 \
  -v /etc/aro-rp:/etc/aro-rp \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  rp
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_rp_service_filename aro_rp_conf_file true
}

# configure_service_aro_dbtoken
configure_service_aro_dbtoken() {
    log "starting"

    local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken'
    local -r aro_dbtoken_service_conf_file="DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=DBToken
RPIMAGE='$RPIMAGE'"

    write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file true

    local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service'
    local -r aro_dbtoken_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-dbtoken
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 445:8445 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  dbtoken
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_dbtoken_service_filename aro_dbtoken_service_file true
}

# configure_service_aro_monitor
configure_service_aro_monitor() {
    log "starting"
    log "configuring aro-monitor service"

    # DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE
    # are not used, but can't easily be refactored out. Should be revisited in the future.
    local -r aro_monitor_service_conf_filename='/etc/sysconfig/aro-monitor'
    local -r aro_monitor_service_conf_file="AZURE_FP_CLIENT_ID='$FPCLIENTID'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=BBM
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=BBM
RPIMAGE='$RPIMAGE'"

    write_file aro_monitor_service_conf_filename aro_monitor_service_conf_file true

    local -r aro_monitor_service_filename='/etc/systemd/system/aro-monitor.service'
    local -r aro_monitor_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-monitor
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_FP_CLIENT_ID \
  -e DOMAIN_NAME \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e MDSD_ENVIRONMENT \
  -e CLUSTER_MDSD_NAMESPACE \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2.5g \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  monitor
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_monitor_service_filename aro_monitor_service_file true
}

# configure_service_aro_portal
configure_service_aro_portal() {
    log "starting"

    local -r aro_portal_service_conf_filename='/etc/sysconfig/aro-portal'
    local -r aro_portal_service_conf_file="AZURE_PORTAL_ACCESS_GROUP_IDS='$PORTALACCESSGROUPIDS'
AZURE_PORTAL_CLIENT_ID='$PORTALCLIENTID'
AZURE_PORTAL_ELEVATED_GROUP_IDS='$PORTALELEVATEDGROUPIDS'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Portal
PORTAL_HOSTNAME='$LOCATION.admin.$RPPARENTDOMAINNAME'
RPIMAGE='$RPIMAGE'"

    write_file aro_portal_service_conf_filename aro_portal_service_conf_file true

    local -r aro_portal_service_filename='/etc/systemd/system/aro-portal.service'
    local -r aro_portal_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitInterval=0

[Service]
EnvironmentFile=/etc/sysconfig/aro-portal
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_PORTAL_ACCESS_GROUP_IDS \
  -e AZURE_PORTAL_CLIENT_ID \
  -e AZURE_PORTAL_ELEVATED_GROUP_IDS \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e PORTAL_HOSTNAME \
  -m 2g \
  -p 444:8444 \
  -p 2222:2222 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  portal
Restart=always
RestartSec=1

[Install]
WantedBy=multi-user.target"

    write_file aro_portal_service_conf_filename aro_portal_service_conf_file true
}

# configure_service_mdsd
configure_service_mdsd() {
    log "starting"

    local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d"
    mkdir "$mdsd_service_dir"

    local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf"
    local -r mdsd_override_conf_file="[Unit]
After=network-online.target"

    write_file mdsd_override_conf_filename mdsd_override_conf_file true

    local -r default_mdsd_filename="/etc/default/mdsd"
    local -r default_mdsd_file="MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS=\"-A -d -r \$MDSD_ROLE_PREFIX\"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$RPMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=rp
export MONITORING_ROLE_INSTANCE=\"$(hostname)\"

export MDSD_MSGPACK_SORT_COLUMNS=1\""

    write_file default_mdsd_filename default_mdsd_file true

}

# run_azsecd_config_scan
run_azsecd_config_scan() {
    log "starting"

    local -ar configs=(
        "baseline"
        "clamav"
        "software"
    )

    log "Scanning configuration files ${configs[*]}"
    # shellcheck disable=SC2068
    for scan in ${configs[@]}; do
        log "Scanning config file $scan now"
        /usr/local/bin/azsecd config -s "$scan" -d P1D
    done
}

# write_file
# Args
# 1) filename - string
# 2) file_contents - string
# 3) clobber - boolean; optional - defaults to false
write_file() {
    local -n filename="$1"
    local -n file_contents="$2"
    local -r clobber="${3:-false}"

    if $clobber; then
        log "Overwriting file $filename"
        echo "$file_contents" > "$filename"
    else
        log "Appending to $filename"
        echo "$file_contents" >> "$filename"
    fi
}

# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots
reboot_vm() {
    log "starting"

    configure_selinux "true"
    (sleep 30 && log "rebooting vm now"; reboot) &
}

# log is a wrapper for echo that includes the function name
log() {
    local -r msg="${1:-"log message is empty"}"
    local -r stack_level="${2:-1}"
    echo "${FUNCNAME[${stack_level}]}: ${msg}"
}

# abort is a wrapper for log that exits with an error code
abort() {
    local -ri origin_stacklevel=2
    log "${1}" "$origin_stacklevel"
    log "Exiting"
    exit 1
}

export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}"

main "$@"
')))]" + "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','ADMINAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('adminApiClientCertCommonName')),''')\n','ARMAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armApiClientCertCommonName')),''')\n','ARMCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armClientId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','BILLINGE2ESTORAGEACCOUNTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('billingE2EStorageAccountId')),''')\n','CLUSTERMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdmAccount')),''')\n','CLUSTERMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdAccount')),''')\n','CLUSTERMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdConfigVersion')),''')\n','CLUSTERMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdNamespace')),''')\n','CLUSTERPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterParentDomainName')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','FPCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpClientId')),''')\n','FPSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpServicePrincipalId')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYRESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayResourceGroupName')),''')\n','GATEWAYSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayServicePrincipalId')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','PORTALACCESSGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalAccessGroupIds')),''')\n','PORTALCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalClientId')),''')\n','PORTALELEVATEDGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalElevatedGroupIds')),''')\n','RPFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpFeatures')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdConfigVersion')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','RPPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpParentDomainName')),''')\n','CLUSTERSINSTALLVIAHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersInstallViaHive')),''')\n','CLUSTERSADOPTBYHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersAdoptByHive')),''')\n','CLUSTERDEFAULTINSTALLERPULLSPEC=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterDefaultInstallerPullspec')),''')\n','USECHECKACCESS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('useCheckAccess')),''')\n','ADMINAPICABUNDLE=''',parameters('adminApiCaBundle'),'''\n','ARMAPICABUNDLE=''',parameters('armApiCaBundle'),'''\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

set -o errexit \
    -o nounset

if [ "${DEBUG:-false}" == true ]; then
    set -x
fi

main() {
    # transaction attempt retry time in seconds
    local -ri retry_wait_time=60

    # shellcheck source=common.sh
    source common.sh

    local -ar exclude_pkgs=(
        "-x WALinuxAgent"
        "-x WALinuxAgent-udev"
    )

    local -ra rpm_keys=(
        https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
        https://packages.microsoft.com/keys/microsoft.asc
    )

    local -ra repo_rpm_pkgs=(
        https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm
    )

    local -ra install_pkgs=(
        clamav
        azsec-clamav
        azsec-monitor
        azure-cli
        azure-mdsd
        azure-security
        podman
        podman-docker
        openssl-perl
        # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
        python3
    )

    MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
    local -ra images=(
        "$MDMIMAGE"
        "$RPIMAGE"
        "$FLUENTBITIMAGE"
    )

    local -ra enable_ports=(
        "443/tcp"
        "444/tcp"
        "445/tcp"
        "2222/tcp"
    )

    local -ra aro_services=(
        "aro-dbtoken"
        "aro-monitor"
        "aro-portal"
        "aro-rp"
        "auoms"
        "azsecd"
        "azsecmond"
        "mdsd"
        "mdm"
        "chronyd"
        "fluentbit"
    )

    parse_run_options "$@" \
                        retry_wait_time \
                        exclude_pkgs \
                        rpm_keys \
                        repo_rpm_pkgs \
                        install_pkgs \
                        images \
                        enable_ports \
                        aro_services

    configure_sshd
    configure_rpm_repos retry_wait_time

    dnf_update_pkgs exclude_pkgs retry_wait_time

    rpm_import_keys rpm_keys retry_wait_time

    dnf_install_pkgs repo_rpm_pkgs retry_wait_time
    dnf_install_pkgs install_pkgs retry_wait_time
    configure_dnf_cron_job

    configure_disk_partitions
    configure_logrotate
    configure_selinux

    mkdir -p /var/log/journal
    mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

    configure_firewalld_rules enable_ports

    pull_container_images images
    configure_aro_services
    enable_services

    enable_services aro_services

    reboot_vm
}

usage() {
    local -n options="$1"
    log "$(basename "$0") [$options]
        -d Configure Disk Partitions
        -p Configure rpm repositories, import required rpm keys, update & install packages with dnf
        -l Configure logrotate.conf
        -s Configure selinux
        -r Configure sshd - Allow password authenticaiton
        -f Configure firewalld default zone rules
        -u Configure systemd unit files
        -i Pull container images

        Note: steps will be executed in the order that flags are provided
    "
}

# parse_run_options takes all arguements passed to main and parses them
# allowing individual step(s) to be ran, rather than all steps
#
# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline
parse_run_options() {
    # shellcheck disable=SC2206
    local -a options=(${1:-})
    local -n retry_time="$2"
    local -n pkgs_to_exclude="$3"
    local -n keys_to_import="$4"
    local -n rpm_pkgs="$5"
    local -n pkgs_to_install="$6"
    local -n images_to_pull="$7"
    local -n ports_to_enable="$8"
    local -n services_to_enable="$9"

    if [ "${#options[@]}" -eq 0 ]; then
        log "Running all steps"
        return 0
    fi

    local OPTIND
    local -r allowed_options="dplsrfui"
    while getopts ${allowed_options} options; do
        case "${options}" in
            d)
                log "Running step configure_disk_partitions"
                configure_disk_partitions
                ;;
            p)
                log "Running step configure_rpm_repos"
                configure_rpm_repos keys_to_import

                log "Running step dnf_update_pkgs"
                dnf_update_pkgs pkgs_to_exclude retry_time

                log "Running step dnf_install_pkgs rpm_pkgs"
                dnf_install_pkgs rpm_pkgs retry_time

                log "Running step dnf_install_pkgs pkgs"
                dnf_install_pkgs pkgs_to_install retry_time
                
                log "Running step configure_dnf_crond_job"
                configure_dnf_cron_job
                ;;
            l)
                log "Running configure_logrotate"
                configure_logrotate
                ;;
            s)
                log "Running configure_selinux"
                configure_selinux
                ;;
            r)
                log "Running configure_sshd"
                configure_sshd
                ;;
            f)
                log "Running configure_firewalld_rules"
                configure_firewalld_rules ports_to_enable
                ;;
            u)
                log "Running pull_container_images & configure_system_services"
                configure_aro_services
                enable_services services_to_enable
                ;;
            i)
                log "Running pull_container_images"
                pull_container_images images_to_pull
                ;;
            *)
                usage allowed_options
                abort "Unkown option provided"
                ;;
        esac
    done
    
    exit 0
}

# configure_rpm_repos
configure_rpm_repos() {
    log "starting"

    configure_rhui_repo "$1"
    create_azure_rpm_repos "$1"
}

# configure_disk_partitions
configure_disk_partitions() {
    log "starting"
    log "extending partition table"

    # Linux block devices are inconsistently named
    # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
    physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
    growpart "$physical_disk" 2

    log "extending filesystems"
    log "extending root lvm"
    lvextend -l +20%FREE /dev/rootvg/rootlv
    log "growing root filesystem"
    xfs_growfs /

    log "extending var lvm"
    lvextend -l +100%FREE /dev/rootvg/varlv
    log "growing var filesystem"
    xfs_growfs /var
}

# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file
create_azure_rpm_repos() {
    log "starting"

    local -r azure_repo_filename='/etc/yum.repos.d/azure.repo'
    local -r azure_repo_file='[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no'

    write_file azure_repo_filename azure_repo_file true
}

# configure_aro_services creates, configures, and enables the following systemd services and timers
# services
#   fluentbit
#   mdm
#   mdsd
#   arp-rp
#   aro-dbtoken
#   aro-monitor
#   aro-portal
configure_aro_services() {
    configure_service_fluentbit
    configure_service_mdm
    configure_timers_mdm_mdsd
    configure_service_aro_rp
    configure_service_aro_dbtoken
    configure_service_aro_monitor
    configure_service_aro_portal
    configure_service_mdsd
}

# configure_service_fluentbit
configure_service_fluentbit() {
    log "starting"
    log "configuring fluentbit service"

    mkdir -p /etc/fluentbit/
    mkdir -p /var/lib/fluent

    local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf'
    local -r fluentbit_conf_file="[INPUT]
Name systemd
Tag journald
Systemd_Filter _COMM=aro
DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND asyncqos asyncqos true

[FILTER]
	Name modify
	Match asyncqos
	Remove CLIENT_PRINCIPAL_NAME
	Remove FILE
	Remove COMPONENT

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND ifxaudit ifxaudit false

[OUTPUT]
	Name forward
	Match *
	Port 29230"

    write_file fluentbit_conf_filename fluentbit_conf_file true

    local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit'
    local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE"

    write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true

    local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service'

    local -r fluentbit_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file fluentbit_service_filename fluentbit_service_file true
}

# configure_certs
configure_certs() {
    log "starting"

    mkdir /etc/aro-rp
    base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem
    if [[ -n "$ARMAPICABUNDLE" ]]; then
    base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem
    fi
    chown -R 1000:1000 /etc/aro-rp

    # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
    # to honour SSL_CERT_FILE any more, heaven only knows why.
    mkdir -p /usr/lib/ssl/certs
    csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null
    c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
    local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config"
    local -r nodescan_agent_file="{
    \"Nice\": 19,
    \"Timeout\": 10800,
    \"ClientId\": \"\",
    \"TenantId\": $AZURESECPACKVSATENANTID,
    \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL,
    \"ProcessTimeout\": 300,
    \"CommandDelay\": 0
  }"

    write_file nodescan_agent_filename nodescan_agent_file true
}

# configure_service_mdm
configure_service_mdm() {
    log "starting"
    log "configuring mdm service"

    local -r sysconfig_mdm_filename="/etc/sysconfig/mdm"
    local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=rp
MDMSOURCEROLEINSTANCE=\"$(hostname)\""

    write_file sysconfig_mdm_filename sysconfig_mdm_file true

    mkdir -p /var/etw
    local -r mdm_service_filename="/etc/systemd/system/mdm.service"
    local -r mdm_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file mdm_service_filename mdm_service_file true
}

# configure_timers_mdm_mdsd
configure_timers_mdm_mdsd() {
    log "starting"

    for var in "mdsd" "mdm"; do
        local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service"
        local download_creds_service_file="[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var"

        write_file download_creds_service_filename download_creds_service_file true

        local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer"
        local download_creds_timer_file="[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target"

        write_file download_creds_timer_filename download_creds_timer_file true
    done

    local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh"
    local -r download_creds_script_file="#!/bin/bash
set -eu

COMPONENT=\$1
echo \"Download \$COMPONENT credentials\"

TEMP_DIR=\"\$(mktemp -d)\"
export AZURE_CONFIG_DIR=\"\$(mktemp -d)\"

echo \"Logging into Azure...\"
RETRIES=3
while [[ \$RETRIES -gt 0 ]]; do
    if az login -i --allow-no-subscriptions
    then
        echo \"az login successful\"
        break
    else
        echo \"az login failed. Retrying...\"
        let RETRIES-=1
        sleep 5
    fi
done

trap \"cleanup\" EXIT

cleanup() {
  az logout
  [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [[ \$COMPONENT = \"mdm\" ]]; then
  CURRENT_CERT_FILE=\"/etc/mdm.pem\"
elif [[ \$COMPONENT\ = \"mdsd\" ]]; then
  CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME=\"rp-\${COMPONENT}\"
NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\"
for attempt in {1..5}; do
  az keyvault \
    secret \
    download \
    --file \"\$NEW_CERT_FILE\" \
    --id \"https://$KEYVAULTPREFIX-svc.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \
    && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [[ \$COMPONENT = \"mdsd\" ]]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi"

    write_file download_creds_script_filename download_creds_script_file true

    chmod u+x /usr/local/bin/download-credentials.sh

    systemctl enable download-mdsd-credentials.timer
    systemctl enable download-mdm-credentials.timer

    /usr/local/bin/download-credentials.sh mdsd
    /usr/local/bin/download-credentials.sh mdm

    local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')"
    local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service"
    local -r watch_mdm_creds_service_file="[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target"

    write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file true

    local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path'
    local -r watch_mdm_creds_path_file='[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target'

    write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file true

    local -r watch_mdm_creds='watch-mdm-credentials.path'
    systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds"
    systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds"
}

# configure_service_aro_rp
configure_service_aro_rp() {
    log "starting"

    local -r aro_rp_conf_filename='/etc/sysconfig/aro-rp'
    local -r aro_rp_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID'
ADMIN_API_CLIENT_CERT_COMMON_NAME='$ADMINAPICLIENTCERTCOMMONNAME'
ARM_API_CLIENT_CERT_COMMON_NAME='$ARMAPICLIENTCERTCOMMONNAME'
AZURE_ARM_CLIENT_ID='$ARMCLIENTID'
AZURE_FP_CLIENT_ID='$FPCLIENTID'
AZURE_FP_SERVICE_PRINCIPAL_ID='$FPSERVICEPRINCIPALID'
BILLING_E2E_STORAGE_ACCOUNT_ID='$BILLINGE2ESTORAGEACCOUNTID'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=RP
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=RP
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
RP_FEATURES='$RPFEATURES'
RPIMAGE='$RPIMAGE'
ARO_INSTALL_VIA_HIVE='$CLUSTERSINSTALLVIAHIVE'
ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC='$CLUSTERDEFAULTINSTALLERPULLSPEC'
ARO_ADOPT_BY_HIVE='$CLUSTERSADOPTBYHIVE'
USE_CHECKACCESS='$USECHECKACCESS'"

    write_file aro_rp_conf_filename aro_rp_conf_file true

    local -r aro_rp_service_filename='/etc/systemd/system/aro-rp.service'
    local -r aro_rp_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-rp
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e ADMIN_API_CLIENT_CERT_COMMON_NAME \
  -e ARM_API_CLIENT_CERT_COMMON_NAME \
  -e AZURE_ARM_CLIENT_ID \
  -e AZURE_FP_CLIENT_ID \
  -e BILLING_E2E_STORAGE_ACCOUNT_ID \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e CLUSTER_MDSD_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e DOMAIN_NAME \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e MDSD_ENVIRONMENT \
  -e RP_FEATURES \
  -e ARO_INSTALL_VIA_HIVE \
  -e ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC \
  -e ARO_ADOPT_BY_HIVE \
  -e USE_CHECKACCESS \
  -m 2g \
  -p 443:8443 \
  -v /etc/aro-rp:/etc/aro-rp \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  rp
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_rp_service_filename aro_rp_service_file true
}

# configure_service_aro_dbtoken
configure_service_aro_dbtoken() {
    log "starting"

    local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken'
    local -r aro_dbtoken_service_conf_file="DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=DBToken
RPIMAGE='$RPIMAGE'"

    write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file true

    local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service'
    local -r aro_dbtoken_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-dbtoken
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 445:8445 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  dbtoken
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_dbtoken_service_filename aro_dbtoken_service_file true
}

# configure_service_aro_monitor
configure_service_aro_monitor() {
    log "starting"
    log "configuring aro-monitor service"

    # DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE
    # are not used, but can't easily be refactored out. Should be revisited in the future.
    local -r aro_monitor_service_conf_filename='/etc/sysconfig/aro-monitor'
    local -r aro_monitor_service_conf_file="AZURE_FP_CLIENT_ID='$FPCLIENTID'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=BBM
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=BBM
RPIMAGE='$RPIMAGE'"

    write_file aro_monitor_service_conf_filename aro_monitor_service_conf_file true

    local -r aro_monitor_service_filename='/etc/systemd/system/aro-monitor.service'
    local -r aro_monitor_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-monitor
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_FP_CLIENT_ID \
  -e DOMAIN_NAME \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e MDSD_ENVIRONMENT \
  -e CLUSTER_MDSD_NAMESPACE \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2.5g \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  monitor
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_monitor_service_filename aro_monitor_service_file true
}

# configure_service_aro_portal
configure_service_aro_portal() {
    log "starting"

    local -r aro_portal_service_conf_filename='/etc/sysconfig/aro-portal'
    local -r aro_portal_service_conf_file="AZURE_PORTAL_ACCESS_GROUP_IDS='$PORTALACCESSGROUPIDS'
AZURE_PORTAL_CLIENT_ID='$PORTALCLIENTID'
AZURE_PORTAL_ELEVATED_GROUP_IDS='$PORTALELEVATEDGROUPIDS'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Portal
PORTAL_HOSTNAME='$LOCATION.admin.$RPPARENTDOMAINNAME'
RPIMAGE='$RPIMAGE'"

    write_file aro_portal_service_conf_filename aro_portal_service_conf_file true

    local -r aro_portal_service_filename='/etc/systemd/system/aro-portal.service'
    local -r aro_portal_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitInterval=0

[Service]
EnvironmentFile=/etc/sysconfig/aro-portal
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_PORTAL_ACCESS_GROUP_IDS \
  -e AZURE_PORTAL_CLIENT_ID \
  -e AZURE_PORTAL_ELEVATED_GROUP_IDS \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e PORTAL_HOSTNAME \
  -m 2g \
  -p 444:8444 \
  -p 2222:2222 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  portal
Restart=always
RestartSec=1

[Install]
WantedBy=multi-user.target"

    write_file aro_portal_service_filename aro_portal_service_file true
}

# configure_service_mdsd
configure_service_mdsd() {
    log "starting"

    local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d"
    mkdir -p "$mdsd_service_dir"

    local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf"
    local -r mdsd_override_conf_file="[Unit]
After=network-online.target"

    write_file mdsd_override_conf_filename mdsd_override_conf_file true

    local -r default_mdsd_filename="/etc/default/mdsd"
    local -r default_mdsd_file="MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS=\"-A -d -r \$MDSD_ROLE_PREFIX\"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$RPMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=rp
export MONITORING_ROLE_INSTANCE=\"$(hostname)\"

export MDSD_MSGPACK_SORT_COLUMNS=1\""

    write_file default_mdsd_filename default_mdsd_file true

}

# run_azsecd_config_scan
run_azsecd_config_scan() {
    log "starting"

    local -ar configs=(
        "baseline"
        "clamav"
        "software"
    )

    log "Scanning configuration files ${configs[*]}"
    # shellcheck disable=SC2068
    for scan in ${configs[@]}; do
        log "Scanning config file $scan now"
        /usr/local/bin/azsecd config -s "$scan" -d P1D
    done
}

export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}"

main "$@"
')))]" } } } diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/common.sh index 4d39f1dd291..436c89366a4 100644 --- a/pkg/deploy/generator/scripts/common.sh +++ b/pkg/deploy/generator/scripts/common.sh @@ -175,6 +175,7 @@ include /etc/logrotate.d # pull_container_images pull_container_images() { local -n pull_images="$1" + local -n registry_conf="${2:-}" log "starting" # The managed identity that the VM runs as only has a single roleassignment. @@ -190,9 +191,13 @@ pull_container_images() { mkdir -p /root/.docker touch /etc/containers/nodocker - # This name is used in the case that az acr login searches for this in it's environment + # This name is used in the case that az acr login searches for this in it's environment local -r REGISTRY_AUTH_FILE="/root/.docker/config.json" + if [[ -n $registry_conf ]]; then + write_file REGISTRY_AUTH_FILE registry_conf true + fi + log "logging into prod acr" az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" @@ -210,9 +215,9 @@ enable_services() { local -n services="$1" log "starting" - log "enabling aro services ${aro_services[*]}" + log "enabling services ${services[*]}" # shellcheck disable=SC2068 - for service in ${aro_services[@]}; do + for service in ${services[@]}; do log "Enabling $service now" systemctl enable "$service.service" done @@ -259,3 +264,30 @@ abort() { log "Exiting" exit 1 } + +# configure_rhui_repo +configure_rhui_repo() { + log "starting" + + local -ra cmd=( + dnf + update + -y + --disablerepo='*' + --enablerepo='rhui-microsoft-azure*' + ) + + log "running RHUI package updates" + retry cmd "$1" +} + +configure_dnf_cron_job() { + log "Starting" + local -r cron_weekly_dnf_update_filename='/etc/cron.weekly/dnfupdate' + local -r cron_weekly_dnf_update_file="#!/bin/bash +dnf update -y" + + write_file cron_weekly_dnf_update_filename cron_weekly_dnf_update_file true + chmod +x "$cron_weekly_dnf_update_filename" +} + diff --git a/pkg/deploy/generator/scripts/devProxyVMSS.sh b/pkg/deploy/generator/scripts/devProxyVMSS.sh index 2b405881bce..19289b8ee1a 100644 --- a/pkg/deploy/generator/scripts/devProxyVMSS.sh +++ b/pkg/deploy/generator/scripts/devProxyVMSS.sh @@ -8,13 +8,48 @@ if [ "${DEBUG:-false}" == true ]; then fi main() { + # transaction attempt retry time in seconds + local -ri retry_wait_time=60 + + # shellcheck source=common.sh + source common.sh + + local -ra enable_ports=( + "443/tcp" + ) + + local proxy_image="$PROXYIMAGE" + local -r registry_config_file="{ + \"auths\": { + \"${PROXYIMAGE%%/*}\": { + \"auth\": \"$PROXYIMAGEAUTH\" + } + }" + + local -ar exclude_pkgs=( + "-x WALinuxAgent" + "-x WALinuxAgent-udev" + ) + + local -ra install_pkgs=( + podman + podman-docker + ) + + local -ra proxy_services=( + proxy + ) + parse_run_options "$@" - configure_and_install_dnf_pkgs_repos + dnf_update_pkgs pkgs_to_exclude retry_wait_time + dnf_install_pkgs install_pkgs retry_wait_time + configure_dnf_cron_job - configure_firewalld_rules - pull_container_images - configure_system_services + configure_firewalld_rules enable_ports + pull_container_images proxy_image registry_config_file + configure_devproxy_services + enable_services proxy_services reboot_vm } @@ -23,7 +58,7 @@ usage() { log "$(basename "$0") [$options] -p Configure rpm repositories, import required rpm keys, update & install packages with dnf -f Configure firewalld default zone rules - -u Configure systemd unit files for ARO RP + -u Configure systemd unit files -i Pull container images Note: steps will be executed in the order that flags are provided @@ -37,6 +72,12 @@ usage() { parse_run_options() { # shellcheck disable=SC2206 local -a options=(${1:-}) + local -n pkgs_to_exclude="$2" + local -n pkgs_to_install="$3" + local -n ports_to_enable="$4" + local -n services_to_enable="$5" + local -n images_to_pull="$6" + if [ "${#options[@]}" -eq 0 ]; then log "Running all steps" return 0 @@ -47,20 +88,27 @@ parse_run_options() { while getopts ${allowed_options} options; do case "${options}" in p) - log "Running step configure_and_install_dnf_pkgs_repos" - configure_and_install_dnf_pkgs_repos + log "Running step dnf_update_pkgs" + dnf_update_pkgs pkgs_to_exclude retry_wait_time + + log "Running step dnf_install_pkgs" + dnf_install_pkgs pkgs_to_install retry_wait_time + + log "Running step configure_dnf_cron_job" + configure_dnf_cron_job ;; f) log "Running configure_firewalld_rules" - configure_firewalld_rules + configure_firewalld_rules ports_to_enable ;; u) - log "Running pull_container_images & configure_system_services" - configure_system_services + log "Running step configure_devproxy_services" + configure_devproxy_services + enable_services services_to_enable ;; i) log "Running pull_container_images" - pull_container_images + pull_container_images images_to_pull ;; *) usage allowed_options @@ -72,223 +120,10 @@ parse_run_options() { exit 0 } -# configure_and_install_dnf_pkgs_repos -configure_and_install_dnf_pkgs_repos() { - log "starting" - - # transaction attempt retry time in seconds - local -ri retry_wait_time=60 - configure_rhui_repo retry_wait_time - - local -ar exclude_pkgs=( - "-x WALinuxAgent" - "-x WALinuxAgent-udev" - ) - - dnf_update_pkgs exclude_pkgs retry_wait_time - - local -ra repo_rpm_pkgs=( - https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm - ) - - local -ra install_pkgs=( - podman - podman-docker - ) - - dnf_install_pkgs repo_rpm_pkgs retry_wait_time - dnf_install_pkgs install_pkgs retry_wait_time - - local -r cron_weekly_dnf_update_filename='/etc/cron.weekly/dnfupdate' - local -r cron_weekly_dnf_update_file="#!/bin/bash -dnf update -y" - - write_file cron_weekly_dnf_update_filename cron_weekly_dnf_update_file true - chmod +x "$cron_weekly_dnf_update_filename" -} - -# configure_rhui_repo -configure_rhui_repo() { - log "starting" - - local -ra cmd=( - dnf - update - -y - --disablerepo='*' - --enablerepo='rhui-microsoft-azure*' - ) - - log "running RHUI package updates" - retry cmd "$1" -} - -# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks -retry() { - local -n cmd_retry="$1" - local -n wait_time="$2" - - for attempt in {1..5}; do - log "attempt #${attempt} - ${FUNCNAME[2]}" - ${cmd_retry[@]} & - - wait $! && break - if [[ ${attempt} -lt 5 ]]; then - sleep "$wait_time" - else - abort "attempt #${attempt} - Failed to update packages" - fi - done -} - -# dnf_update_pkgs -dnf_update_pkgs() { - local -n excludes="$1" - log "starting" - - local -ra cmd=( - dnf - -y - ${excludes[@]} - update - --allowerasing - ) - - log "Updating all packages" - retry cmd "$2" -} - -# dnf_install_pkgs -dnf_install_pkgs() { - local -n pkgs="$1" - log "starting" - - local -ra cmd=( - dnf - -y - install - ${pkgs[@]} - ) - - log "Attempting to install packages: ${pkgs[*]}" - retry cmd "$2" -} - -# configure_logrotate clobbers /etc/logrotate.conf -configure_logrotate() { - log "starting" - - local -r logrotate_conf_filename='/etc/logrotate.conf' - local -r logrotate_conf_file='# see "man logrotate" for details -# rotate log files weekly -weekly - -# keep 2 weeks worth of backlogs -rotate 2 - -# create new (empty) log files after rotating old ones -create - -# use date as a suffix of the rotated file -dateext - -# uncomment this if you want your log files compressed -compress - -# RPM packages drop log rotation information into this directory -include /etc/logrotate.d - -# no packages own wtmp and btmp -- we will rotate them here -/var/log/wtmp { - monthly - create 0664 root utmp - minsize 1M - rotate 1 -} - -/var/log/btmp { - missingok - monthly - create 0600 root utmp - rotate 1 -}' - - write_file logrotate_conf_filename logrotate_conf_file true -} - -# configure_firewalld_rules -configure_firewalld_rules() { - log "starting" - - # https://access.redhat.com/security/cve/cve-2020-13401 - local -r prefix="/etc/sysctl.d" - local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf" - local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0" - - write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true - - local -r disable_core_filename="$prefix/01-disable-core.conf" - local -r disable_core_file="kernel.core_pattern = |/bin/true - " - write_file disable_core_filename disable_core_file true - - sysctl --system - - local -ra enable_ports=( - "443/tcp" - ) - - log "Enabling ports ${enable_ports[*]} on default firewalld zone" - # shellcheck disable=SC2068 - for port in ${enable_ports[@]}; do - log "Enabling port $port now" - firewall-cmd "--add-port=$port" - done - - firewall-cmd --runtime-to-permanent -} - -# pull_container_images -pull_container_images() { - log "starting" - - # The managed identity that the VM runs as only has a single roleassignment. - # This role assignment is ACRPull which is not necessarily present in the - # subscription we're deploying into. If the identity does not have any - # role assignments scoped on the subscription we're deploying into, it will - # not show on az login -i, which is why the below line is commented. - # az account set -s "$SUBSCRIPTIONID" - az login -i --allow-no-subscriptions - - # Suppress emulation output for podman instead of docker for az acr compatability - mkdir -p /etc/containers/ - mkdir -p /root/.docker - touch /etc/containers/nodocker - - # This name is used in the case that az acr login searches for this in it's environment - local -r REGISTRY_AUTH_FILE="/root/.docker/config.json" - local -r registry_config_file="{ - "auths": { - \"${PROXYIMAGE%%/*}\": { - \"auth\": \"$PROXYIMAGEAUTH\" - } - }" - - write_file REGISTRY_AUTH_FILE registry_config_file true - - log "logging into prod acr" - - az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" - - docker pull "$PROXYIMAGE" - - az logout -} - # configure_system_services creates, configures, and enables the following systemd services and timers # services # proxy -configure_system_services() { +configure_devproxy_services() { configure_service_proxy } @@ -296,9 +131,6 @@ configure_system_services() { enable_aro_services() { log "starting" - local -ra aro_services=( - proxy - ) log "enabling aro services ${aro_services[*]}" # shellcheck disable=SC2068 for service in ${aro_services[@]}; do @@ -357,48 +189,6 @@ systemctl restart proxy.service" chmod +x "$cron_daily_restart_proxy_filename" } -# write_file -# Args -# 1) filename - string -# 2) file_contents - string -# 3) clobber - boolean; optional - defaults to false -write_file() { - local -n filename="$1" - local -n file_contents="$2" - local -r clobber="${3:-false}" - - if $clobber; then - log "Overwriting file $filename" - echo "$file_contents" > "$filename" - else - log "Appending to $filename" - echo "$file_contents" >> "$filename" - fi -} - -# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots -reboot_vm() { - log "starting" - - configure_selinux "true" - (sleep 30 && log "rebooting vm now"; reboot) & -} - -# log is a wrapper for echo that includes the function name -log() { - local -r msg="${1:-"log message is empty"}" - local -r stack_level="${2:-1}" - echo "${FUNCNAME[${stack_level}]}: ${msg}" -} - -# abort is a wrapper for log that exits with an error code -abort() { - local -ri origin_stacklevel=2 - log "${1}" "$origin_stacklevel" - log "Exiting" - exit 1 -} - export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}" main "$@" diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index e8cedfd1e25..decdfba6986 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -89,6 +89,7 @@ main() { dnf_install_pkgs repo_rpm_pkgs retry_wait_time dnf_install_pkgs install_pkgs retry_wait_time + configure_dnf_cron_job configure_disk_partitions configure_logrotate @@ -114,10 +115,10 @@ usage() { -d Configure Disk Partitions -p Configure rpm repositories, import required rpm keys, update & install packages with dnf -l Configure logrotate.conf - -s Make selinux modifications required for ARO RP + -s Configure selinux -r Configure sshd - Allow password authenticaiton -f Configure firewalld default zone rules - -u Configure systemd unit files for ARO RP + -u Configure systemd unit files -i Pull container images Note: steps will be executed in the order that flags are provided @@ -165,6 +166,9 @@ parse_run_options() { log "Running step dnf_install_pkgs pkgs" dnf_install_pkgs pkgs_to_install retry_time + + log "Running step configure_dnf_crond_job" + configure_dnf_cron_job ;; l) log "Running configure_logrotate" @@ -209,22 +213,6 @@ configure_rpm_repos() { create_azure_rpm_repos "$1" } -# configure_rhui_repo -configure_rhui_repo() { - log "starting" - - local -ra cmd=( - dnf - update - -y - --disablerepo='*' - --enablerepo='rhui-microsoft-azure*' - ) - - log "running RHUI package updates" - retry cmd "$1" -} - # configure_disk_partitions configure_disk_partitions() { log "starting" From 28b42a0848679165f547f73afa2bb457ce969192 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Thu, 18 Apr 2024 09:42:54 -0400 Subject: [PATCH 26/38] Correct parse_run_options by passing in user options as a nameref var --- pkg/deploy/generator/scripts/devProxyVMSS.sh | 14 ++++++++++---- pkg/deploy/generator/scripts/rpVMSS.sh | 5 +++-- 2 files changed, 13 insertions(+), 6 deletions(-) diff --git a/pkg/deploy/generator/scripts/devProxyVMSS.sh b/pkg/deploy/generator/scripts/devProxyVMSS.sh index 19289b8ee1a..2c35fa6ee88 100644 --- a/pkg/deploy/generator/scripts/devProxyVMSS.sh +++ b/pkg/deploy/generator/scripts/devProxyVMSS.sh @@ -18,10 +18,10 @@ main() { "443/tcp" ) - local proxy_image="$PROXYIMAGE" + local -ra proxy_images=("$PROXYIMAGE") local -r registry_config_file="{ \"auths\": { - \"${PROXYIMAGE%%/*}\": { + \"${proxy_images[0]%%/*}\": { \"auth\": \"$PROXYIMAGEAUTH\" } }" @@ -40,7 +40,13 @@ main() { proxy ) - parse_run_options "$@" + local -ra user_options=("$@") + parse_run_options user_options \ + exclude_pkgs \ + install_pkgs \ + enable_ports \ + proxy_services \ + proxy_images dnf_update_pkgs pkgs_to_exclude retry_wait_time dnf_install_pkgs install_pkgs retry_wait_time @@ -71,7 +77,7 @@ usage() { # This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline parse_run_options() { # shellcheck disable=SC2206 - local -a options=(${1:-}) + local -n run_options="$1" local -n pkgs_to_exclude="$2" local -n pkgs_to_install="$3" local -n ports_to_enable="$4" diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index decdfba6986..b954a29fd19 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -70,7 +70,8 @@ main() { "fluentbit" ) - parse_run_options "$@" \ + local -ra user_options=("$@") + parse_run_options user_options \ retry_wait_time \ exclude_pkgs \ rpm_keys \ @@ -131,7 +132,7 @@ usage() { # This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline parse_run_options() { # shellcheck disable=SC2206 - local -a options=(${1:-}) + local -n run_options="$1" local -n retry_time="$2" local -n pkgs_to_exclude="$3" local -n keys_to_import="$4" From 9160d504d8b620f3de54fcbaae41403e088d45b2 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Thu, 18 Apr 2024 09:57:58 -0400 Subject: [PATCH 27/38] Correct options in parse_run_options to avoid curcuilar nameref, pass PROXY_IMAGE to configure_service_proxy function --- pkg/deploy/generator/scripts/devProxyVMSS.sh | 18 ++++++++++-------- pkg/deploy/generator/scripts/rpVMSS.sh | 4 ++-- 2 files changed, 12 insertions(+), 10 deletions(-) diff --git a/pkg/deploy/generator/scripts/devProxyVMSS.sh b/pkg/deploy/generator/scripts/devProxyVMSS.sh index 2c35fa6ee88..f7816f47294 100644 --- a/pkg/deploy/generator/scripts/devProxyVMSS.sh +++ b/pkg/deploy/generator/scripts/devProxyVMSS.sh @@ -54,7 +54,7 @@ main() { configure_firewalld_rules enable_ports pull_container_images proxy_image registry_config_file - configure_devproxy_services + configure_devproxy_services proxy_images enable_services proxy_services reboot_vm } @@ -84,7 +84,7 @@ parse_run_options() { local -n services_to_enable="$5" local -n images_to_pull="$6" - if [ "${#options[@]}" -eq 0 ]; then + if [ "${#run_options[@]}" -eq 0 ]; then log "Running all steps" return 0 fi @@ -92,7 +92,7 @@ parse_run_options() { local OPTIND local -r allowed_options="pfui" while getopts ${allowed_options} options; do - case "${options}" in + case "${run_options}" in p) log "Running step dnf_update_pkgs" dnf_update_pkgs pkgs_to_exclude retry_wait_time @@ -109,7 +109,7 @@ parse_run_options() { ;; u) log "Running step configure_devproxy_services" - configure_devproxy_services + configure_devproxy_services proxy_images enable_services services_to_enable ;; i) @@ -130,7 +130,7 @@ parse_run_options() { # services # proxy configure_devproxy_services() { - configure_service_proxy + configure_service_proxy "$1" } # enable_aro_services enables all services required for aro rp @@ -158,7 +158,7 @@ configure_certs() { configure_service_proxy() { local -r sysconfig_proxy_filename='/etc/sysconfig/proxy' - local -r sysconfig_proxy_file="PROXY_IMAGE='$PROXYIMAGE'" + local -r sysconfig_proxy_file="PROXY_IMAGE='$1'" write_file sysconfig_proxy_filename sysconfig_proxy_file true @@ -170,7 +170,7 @@ Wants=network-online.target [Service] EnvironmentFile=/etc/sysconfig/proxy ExecStartPre=-/usr/bin/docker rm -f %n -ExecStart=/usr/bin/docker run --rm --name %n -p 443:8443 -v /etc/proxy:/secrets $PROXY_IMAGE +ExecStart=/usr/bin/docker run --rm --name %n -p 443:8443 -v /etc/proxy:/secrets $1 ExecStop=/usr/bin/docker stop %n Restart=always RestartSec=1 @@ -179,9 +179,11 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target" + write_file proxy_service_filename proxy_service_file true + local -r cron_weekly_pull_image_filename='/etc/cron.weekly/pull-image' local -r cron_weekly_pull_image_file="#!/bin/bash -docker pull $PROXYIMAGE +docker pull $1 systemctl restart proxy.service" write_file cron_weekly_pull_image_filename cron_weekly_pull_image_file true diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index b954a29fd19..906bdfd1cde 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -142,7 +142,7 @@ parse_run_options() { local -n ports_to_enable="$8" local -n services_to_enable="$9" - if [ "${#options[@]}" -eq 0 ]; then + if [ "${#run_options[@]}" -eq 0 ]; then log "Running all steps" return 0 fi @@ -150,7 +150,7 @@ parse_run_options() { local OPTIND local -r allowed_options="dplsrfui" while getopts ${allowed_options} options; do - case "${options}" in + case "${run_options}" in d) log "Running step configure_disk_partitions" configure_disk_partitions From 347450e009386ff9a7d00a54b0f6df37b9171e16 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Thu, 18 Apr 2024 11:52:39 -0400 Subject: [PATCH 28/38] Remove unused function, correct nameref usage in configure_service_proxy --- pkg/deploy/assets/env-development.json | 2 +- pkg/deploy/assets/rp-production.json | 2 +- pkg/deploy/generator/scripts/devProxyVMSS.sh | 19 ++++--------------- 3 files changed, 6 insertions(+), 17 deletions(-) diff --git a/pkg/deploy/assets/env-development.json b/pkg/deploy/assets/env-development.json index af038e859b5..dc0106ae8b3 100644 --- a/pkg/deploy/assets/env-development.json +++ b/pkg/deploy/assets/env-development.json @@ -296,7 +296,7 @@ "autoUpgradeMinorVersion": true, "settings": {}, "protectedSettings": { - "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'PROXYIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImage')),''')\n','PROXYIMAGEAUTH=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImageAuth')),''')\n','PROXYCERT=''',parameters('proxyCert'),'''\n','PROXYCLIENTCERT=''',parameters('proxyClientCert'),'''\n','PROXYKEY=''',parameters('proxyKey'),'''\n','\n',base64ToString('IyEvYmluL2Jhc2gKCnNldCAtbyBlcnJleGl0IFwKICAgIC1vIG5vdW5zZXQKCmlmIFsgIiR7REVCVUc6LWZhbHNlfSIgPT0gdHJ1ZSBdOyB0aGVuCiAgICBzZXQgLXgKZmkKCm1haW4oKSB7CiAgICAjIHRyYW5zYWN0aW9uIGF0dGVtcHQgcmV0cnkgdGltZSBpbiBzZWNvbmRzCiAgICBsb2NhbCAtcmkgcmV0cnlfd2FpdF90aW1lPTYwCgogICAgIyBzaGVsbGNoZWNrIHNvdXJjZT1jb21tb24uc2gKICAgIHNvdXJjZSBjb21tb24uc2gKCiAgICBsb2NhbCAtcmEgZW5hYmxlX3BvcnRzPSgKICAgICAgICAiNDQzL3RjcCIKICAgICkKCiAgICBsb2NhbCBwcm94eV9pbWFnZT0iJFBST1hZSU1BR0UiCglsb2NhbCAtciByZWdpc3RyeV9jb25maWdfZmlsZT0iewogICAgXCJhdXRoc1wiOiB7CiAgICAgICAgXCIke1BST1hZSU1BR0UlJS8qfVwiOiB7CiAgICAgICAgICAgIFwiYXV0aFwiOiBcIiRQUk9YWUlNQUdFQVVUSFwiCiAgICAgICAgfQogICAgfSIKCiAgICBsb2NhbCAtYXIgZXhjbHVkZV9wa2dzPSgKICAgICAgICAiLXggV0FMaW51eEFnZW50IgogICAgICAgICIteCBXQUxpbnV4QWdlbnQtdWRldiIKICAgICkKCiAgICBsb2NhbCAtcmEgaW5zdGFsbF9wa2dzPSgKICAgICAgICBwb2RtYW4KICAgICAgICBwb2RtYW4tZG9ja2VyCiAgICApCgogICAgbG9jYWwgLXJhIHByb3h5X3NlcnZpY2VzPSgKCQlwcm94eQogICAgKQoKICAgIHBhcnNlX3J1bl9vcHRpb25zICIkQCIKCiAgICBkbmZfdXBkYXRlX3BrZ3MgcGtnc190b19leGNsdWRlIHJldHJ5X3dhaXRfdGltZQogICAgZG5mX2luc3RhbGxfcGtncyBpbnN0YWxsX3BrZ3MgcmV0cnlfd2FpdF90aW1lCiAgICBjb25maWd1cmVfZG5mX2Nyb25fam9iCgogICAgY29uZmlndXJlX2ZpcmV3YWxsZF9ydWxlcyBlbmFibGVfcG9ydHMKICAgIHB1bGxfY29udGFpbmVyX2ltYWdlcyBwcm94eV9pbWFnZSByZWdpc3RyeV9jb25maWdfZmlsZQogICAgY29uZmlndXJlX2RldnByb3h5X3NlcnZpY2VzCiAgICBlbmFibGVfc2VydmljZXMgcHJveHlfc2VydmljZXMKICAgIHJlYm9vdF92bQp9Cgp1c2FnZSgpIHsKICAgIGxvY2FsIC1uIG9wdGlvbnM9IiQxIgogICAgbG9nICIkKGJhc2VuYW1lICIkMCIpIFskb3B0aW9uc10KICAgICAgICAtcCBDb25maWd1cmUgcnBtIHJlcG9zaXRvcmllcywgaW1wb3J0IHJlcXVpcmVkIHJwbSBrZXlzLCB1cGRhdGUgJiBpbnN0YWxsIHBhY2thZ2VzIHdpdGggZG5mCiAgICAgICAgLWYgQ29uZmlndXJlIGZpcmV3YWxsZCBkZWZhdWx0IHpvbmUgcnVsZXMKICAgICAgICAtdSBDb25maWd1cmUgc3lzdGVtZCB1bml0IGZpbGVzCiAgICAgICAgLWkgUHVsbCBjb250YWluZXIgaW1hZ2VzCgogICAgICAgIE5vdGU6IHN0ZXBzIHdpbGwgYmUgZXhlY3V0ZWQgaW4gdGhlIG9yZGVyIHRoYXQgZmxhZ3MgYXJlIHByb3ZpZGVkCiAgICAiCn0KCiMgcGFyc2VfcnVuX29wdGlvbnMgdGFrZXMgYWxsIGFyZ3VlbWVudHMgcGFzc2VkIHRvIG1haW4gYW5kIHBhcnNlcyB0aGVtCiMgYWxsb3dpbmcgaW5kaXZpZHVhbCBzdGVwKHMpIHRvIGJlIHJhbiwgcmF0aGVyIHRoYW4gYWxsIHN0ZXBzCiMKIyBUaGlzIGlzIHVzZWZ1bCBmb3IgbG9jYWwgdGVzdGluZywgb3IgcG9zc2libHkgbW9kaWZ5aW5nIHRoZSBib290c3RyYXAgZXhlY3V0aW9uIHZpYSBlbnZpcm9ubWVudCB2YXJpYWJsZXMgaW4gdGhlIGRlcGxveW1lbnQgcGlwZWxpbmUKcGFyc2VfcnVuX29wdGlvbnMoKSB7CiAgICAjIHNoZWxsY2hlY2sgZGlzYWJsZT1TQzIyMDYKICAgIGxvY2FsIC1hIG9wdGlvbnM9KCR7MTotfSkKICAgIGxvY2FsIC1uIHBrZ3NfdG9fZXhjbHVkZT0iJDIiCiAgICBsb2NhbCAtbiBwa2dzX3RvX2luc3RhbGw9IiQzIgogICAgbG9jYWwgLW4gcG9ydHNfdG9fZW5hYmxlPSIkNCIKICAgIGxvY2FsIC1uIHNlcnZpY2VzX3RvX2VuYWJsZT0iJDUiCiAgICBsb2NhbCAtbiBpbWFnZXNfdG9fcHVsbD0iJDYiCgogICAgaWYgWyAiJHsjb3B0aW9uc1tAXX0iIC1lcSAwIF07IHRoZW4KICAgICAgICBsb2cgIlJ1bm5pbmcgYWxsIHN0ZXBzIgogICAgICAgIHJldHVybiAwCiAgICBmaQoKICAgIGxvY2FsIE9QVElORAoJbG9jYWwgLXIgYWxsb3dlZF9vcHRpb25zPSJwZnVpIgogICAgd2hpbGUgZ2V0b3B0cyAke2FsbG93ZWRfb3B0aW9uc30gb3B0aW9uczsgZG8KICAgICAgICBjYXNlICIke29wdGlvbnN9IiBpbgogICAgICAgICAgICBwKQogICAgICAgICAgICAgICAgbG9nICJSdW5uaW5nIHN0ZXAgZG5mX3VwZGF0ZV9wa2dzIgogICAgICAgICAgICAgICAgZG5mX3VwZGF0ZV9wa2dzIHBrZ3NfdG9fZXhjbHVkZSByZXRyeV93YWl0X3RpbWUKCiAgICAgICAgICAgICAgICBsb2cgIlJ1bm5pbmcgc3RlcCBkbmZfaW5zdGFsbF9wa2dzIgogICAgICAgICAgICAgICAgZG5mX2luc3RhbGxfcGtncyBwa2dzX3RvX2luc3RhbGwgcmV0cnlfd2FpdF90aW1lCgogICAgICAgICAgICAgICAgbG9nICJSdW5uaW5nIHN0ZXAgY29uZmlndXJlX2RuZl9jcm9uX2pvYiIKICAgICAgICAgICAgICAgIGNvbmZpZ3VyZV9kbmZfY3Jvbl9qb2IKICAgICAgICAgICAgICAgIDs7CiAgICAgICAgICAgIGYpCiAgICAgICAgICAgICAgICBsb2cgIlJ1bm5pbmcgY29uZmlndXJlX2ZpcmV3YWxsZF9ydWxlcyIKICAgICAgICAgICAgICAgIGNvbmZpZ3VyZV9maXJld2FsbGRfcnVsZXMgcG9ydHNfdG9fZW5hYmxlCiAgICAgICAgICAgICAgICA7OwogICAgICAgICAgICB1KQogICAgICAgICAgICAgICAgbG9nICJSdW5uaW5nIHN0ZXAgY29uZmlndXJlX2RldnByb3h5X3NlcnZpY2VzIgogICAgICAgICAgICAgICAgY29uZmlndXJlX2RldnByb3h5X3NlcnZpY2VzCiAgICAgICAgICAgICAgICBlbmFibGVfc2VydmljZXMgc2VydmljZXNfdG9fZW5hYmxlCiAgICAgICAgICAgICAgICA7OwogICAgICAgICAgICBpKQogICAgICAgICAgICAgICAgbG9nICJSdW5uaW5nIHB1bGxfY29udGFpbmVyX2ltYWdlcyIKICAgICAgICAgICAgICAgIHB1bGxfY29udGFpbmVyX2ltYWdlcyBpbWFnZXNfdG9fcHVsbAogICAgICAgICAgICAgICAgOzsKICAgICAgICAgICAgKikKICAgICAgICAgICAgICAgIHVzYWdlIGFsbG93ZWRfb3B0aW9ucwogICAgICAgICAgICAgICAgYWJvcnQgIlVua293biBvcHRpb24gcHJvdmlkZWQiCiAgICAgICAgICAgICAgICA7OwogICAgICAgIGVzYWMKICAgIGRvbmUKICAgIAogICAgZXhpdCAwCn0KCiMgY29uZmlndXJlX3N5c3RlbV9zZXJ2aWNlcyBjcmVhdGVzLCBjb25maWd1cmVzLCBhbmQgZW5hYmxlcyB0aGUgZm9sbG93aW5nIHN5c3RlbWQgc2VydmljZXMgYW5kIHRpbWVycwojIHNlcnZpY2VzCiMJcHJveHkKY29uZmlndXJlX2RldnByb3h5X3NlcnZpY2VzKCkgewoJY29uZmlndXJlX3NlcnZpY2VfcHJveHkKfQoKIyBlbmFibGVfYXJvX3NlcnZpY2VzIGVuYWJsZXMgYWxsIHNlcnZpY2VzIHJlcXVpcmVkIGZvciBhcm8gcnAKZW5hYmxlX2Fyb19zZXJ2aWNlcygpIHsKICAgIGxvZyAic3RhcnRpbmciCgogICAgbG9nICJlbmFibGluZyBhcm8gc2VydmljZXMgJHthcm9fc2VydmljZXNbKl19IgogICAgIyBzaGVsbGNoZWNrIGRpc2FibGU9U0MyMDY4CiAgICBmb3Igc2VydmljZSBpbiAke2Fyb19zZXJ2aWNlc1tAXX07IGRvCiAgICAgICAgbG9nICJFbmFibGluZyAkc2VydmljZSBub3ciCiAgICAgICAgc3lzdGVtY3RsIGVuYWJsZSAiJHNlcnZpY2Uuc2VydmljZSIKICAgIGRvbmUKfQoKIyBjb25maWd1cmVfY2VydHMKY29uZmlndXJlX2NlcnRzKCkgewogICAgbG9nICJzdGFydGluZyIKCgliYXNlNjQgLWQgPDw8IiRQUk9YWUNFUlQiID4vZXRjL3Byb3h5L3Byb3h5LmNydAoJYmFzZTY0IC1kIDw8PCIkUFJPWFlLRVkiID4vZXRjL3Byb3h5L3Byb3h5LmtleQoJYmFzZTY0IC1kIDw8PCIkUFJPWFlDTElFTlRDRVJUIiA+L2V0Yy9wcm94eS9wcm94eS1jbGllbnQuY3J0CgljaG93biAtUiAxMDAwOjEwMDAgL2V0Yy9wcm94eQoJY2htb2QgMDYwMCAvZXRjL3Byb3h5L3Byb3h5LmtleQp9Cgpjb25maWd1cmVfc2VydmljZV9wcm94eSgpIHsKCWxvY2FsIC1yIHN5c2NvbmZpZ19wcm94eV9maWxlbmFtZT0nL2V0Yy9zeXNjb25maWcvcHJveHknCglsb2NhbCAtciBzeXNjb25maWdfcHJveHlfZmlsZT0iUFJPWFlfSU1BR0U9JyRQUk9YWUlNQUdFJyIKCgl3cml0ZV9maWxlIHN5c2NvbmZpZ19wcm94eV9maWxlbmFtZSBzeXNjb25maWdfcHJveHlfZmlsZSB0cnVlCgoJbG9jYWwgLXIgcHJveHlfc2VydmljZV9maWxlbmFtZT0nL2V0Yy9zeXN0ZW1kL3N5c3RlbS9wcm94eS5zZXJ2aWNlJwoJbG9jYWwgLXIgcHJveHlfc2VydmljZV9maWxlPSJbVW5pdF0KQWZ0ZXI9bmV0d29yay1vbmxpbmUudGFyZ2V0CldhbnRzPW5ldHdvcmstb25saW5lLnRhcmdldAoKW1NlcnZpY2VdCkVudmlyb25tZW50RmlsZT0vZXRjL3N5c2NvbmZpZy9wcm94eQpFeGVjU3RhcnRQcmU9LS91c3IvYmluL2RvY2tlciBybSAtZiAlbgpFeGVjU3RhcnQ9L3Vzci9iaW4vZG9ja2VyIHJ1biAtLXJtIC0tbmFtZSAlbiAtcCA0NDM6ODQ0MyAtdiAvZXRjL3Byb3h5Oi9zZWNyZXRzICRQUk9YWV9JTUFHRQpFeGVjU3RvcD0vdXNyL2Jpbi9kb2NrZXIgc3RvcCAlbgpSZXN0YXJ0PWFsd2F5cwpSZXN0YXJ0U2VjPTEKU3RhcnRMaW1pdEludGVydmFsPTAKCltJbnN0YWxsXQpXYW50ZWRCeT1tdWx0aS11c2VyLnRhcmdldCIKCglsb2NhbCAtciBjcm9uX3dlZWtseV9wdWxsX2ltYWdlX2ZpbGVuYW1lPScvZXRjL2Nyb24ud2Vla2x5L3B1bGwtaW1hZ2UnCglsb2NhbCAtciBjcm9uX3dlZWtseV9wdWxsX2ltYWdlX2ZpbGU9IiMhL2Jpbi9iYXNoCmRvY2tlciBwdWxsICRQUk9YWUlNQUdFCnN5c3RlbWN0bCByZXN0YXJ0IHByb3h5LnNlcnZpY2UiCgkKCXdyaXRlX2ZpbGUgY3Jvbl93ZWVrbHlfcHVsbF9pbWFnZV9maWxlbmFtZSBjcm9uX3dlZWtseV9wdWxsX2ltYWdlX2ZpbGUgdHJ1ZQoJY2htb2QgK3ggIiRjcm9uX3dlZWtseV9wdWxsX2ltYWdlX2ZpbGVuYW1lIgoKCWxvY2FsIC1yIGNyb25fZGFpbHlfcmVzdGFydF9wcm94eV9maWxlbmFtZT0nL2V0Yy9jcm9uLmRhaWx5L3Jlc3RhcnQtcHJveHknCglsb2NhbCAtciBjcm9uX2RhaWx5X3Jlc3RhcnRfcHJveHlfZmlsZT0iIyEvYmluL2Jhc2gKc3lzdGVtY3RsIHJlc3RhcnQgcHJveHkuc2VydmljZSIKCQoJd3JpdGVfZmlsZSBjcm9uX2RhaWx5X3Jlc3RhcnRfcHJveHlfZmlsZW5hbWUgY3Jvbl9kYWlseV9yZXN0YXJ0X3Byb3h5X2ZpbGUKCWNobW9kICt4ICIkY3Jvbl9kYWlseV9yZXN0YXJ0X3Byb3h5X2ZpbGVuYW1lIgp9CgpleHBvcnQgQVpVUkVfQ0xPVURfTkFNRT0iJHtBWlVSRUNMT1VETkFNRTo/IkZhaWxlZCB0byBjYXJyeSBvdmVyIHZhcmlhYmxlcyJ9IgoKbWFpbiAiJEAiCg==')))]" + "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'PROXYIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImage')),''')\n','PROXYIMAGEAUTH=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImageAuth')),''')\n','PROXYCERT=''',parameters('proxyCert'),'''\n','PROXYCLIENTCERT=''',parameters('proxyClientCert'),'''\n','PROXYKEY=''',parameters('proxyKey'),'''\n','\n',base64ToString('IyEvYmluL2Jhc2gKCnNldCAtbyBlcnJleGl0IFwKICAgIC1vIG5vdW5zZXQKCmlmIFsgIiR7REVCVUc6LWZhbHNlfSIgPT0gdHJ1ZSBdOyB0aGVuCiAgICBzZXQgLXgKZmkKCm1haW4oKSB7CiAgICAjIHRyYW5zYWN0aW9uIGF0dGVtcHQgcmV0cnkgdGltZSBpbiBzZWNvbmRzCiAgICBsb2NhbCAtcmkgcmV0cnlfd2FpdF90aW1lPTYwCgogICAgIyBzaGVsbGNoZWNrIHNvdXJjZT1jb21tb24uc2gKICAgIHNvdXJjZSBjb21tb24uc2gKCiAgICBsb2NhbCAtcmEgZW5hYmxlX3BvcnRzPSgKICAgICAgICAiNDQzL3RjcCIKICAgICkKCiAgICBsb2NhbCAtcmEgcHJveHlfaW1hZ2VzPSgiJFBST1hZSU1BR0UiKQoJbG9jYWwgLXIgcmVnaXN0cnlfY29uZmlnX2ZpbGU9InsKICAgIFwiYXV0aHNcIjogewogICAgICAgIFwiJHtwcm94eV9pbWFnZXNbMF0lJS8qfVwiOiB7CiAgICAgICAgICAgIFwiYXV0aFwiOiBcIiRQUk9YWUlNQUdFQVVUSFwiCiAgICAgICAgfQogICAgfSIKCiAgICBsb2NhbCAtYXIgZXhjbHVkZV9wa2dzPSgKICAgICAgICAiLXggV0FMaW51eEFnZW50IgogICAgICAgICIteCBXQUxpbnV4QWdlbnQtdWRldiIKICAgICkKCiAgICBsb2NhbCAtcmEgaW5zdGFsbF9wa2dzPSgKICAgICAgICBwb2RtYW4KICAgICAgICBwb2RtYW4tZG9ja2VyCiAgICApCgogICAgbG9jYWwgLXJhIHByb3h5X3NlcnZpY2VzPSgKCQlwcm94eQogICAgKQoKICAgIGxvY2FsIC1yYSB1c2VyX29wdGlvbnM9KCIkQCIpCiAgICBwYXJzZV9ydW5fb3B0aW9ucyB1c2VyX29wdGlvbnMgXAogICAgICAgICAgICAgICAgICAgICAgICBleGNsdWRlX3BrZ3MgXAogICAgICAgICAgICAgICAgICAgICAgICBpbnN0YWxsX3BrZ3MgXAogICAgICAgICAgICAgICAgICAgICAgICBlbmFibGVfcG9ydHMgXAogICAgICAgICAgICAgICAgICAgICAgICBwcm94eV9zZXJ2aWNlcyBcCiAgICAgICAgICAgICAgICAgICAgICAgIHByb3h5X2ltYWdlcwoKICAgIGRuZl91cGRhdGVfcGtncyBwa2dzX3RvX2V4Y2x1ZGUgcmV0cnlfd2FpdF90aW1lCiAgICBkbmZfaW5zdGFsbF9wa2dzIGluc3RhbGxfcGtncyByZXRyeV93YWl0X3RpbWUKICAgIGNvbmZpZ3VyZV9kbmZfY3Jvbl9qb2IKCiAgICBjb25maWd1cmVfZmlyZXdhbGxkX3J1bGVzIGVuYWJsZV9wb3J0cwogICAgcHVsbF9jb250YWluZXJfaW1hZ2VzIHByb3h5X2ltYWdlIHJlZ2lzdHJ5X2NvbmZpZ19maWxlCiAgICBjb25maWd1cmVfZGV2cHJveHlfc2VydmljZXMgcHJveHlfaW1hZ2VzCiAgICBlbmFibGVfc2VydmljZXMgcHJveHlfc2VydmljZXMKICAgIHJlYm9vdF92bQp9Cgp1c2FnZSgpIHsKICAgIGxvY2FsIC1uIG9wdGlvbnM9IiQxIgogICAgbG9nICIkKGJhc2VuYW1lICIkMCIpIFskb3B0aW9uc10KICAgICAgICAtcCBDb25maWd1cmUgcnBtIHJlcG9zaXRvcmllcywgaW1wb3J0IHJlcXVpcmVkIHJwbSBrZXlzLCB1cGRhdGUgJiBpbnN0YWxsIHBhY2thZ2VzIHdpdGggZG5mCiAgICAgICAgLWYgQ29uZmlndXJlIGZpcmV3YWxsZCBkZWZhdWx0IHpvbmUgcnVsZXMKICAgICAgICAtdSBDb25maWd1cmUgc3lzdGVtZCB1bml0IGZpbGVzCiAgICAgICAgLWkgUHVsbCBjb250YWluZXIgaW1hZ2VzCgogICAgICAgIE5vdGU6IHN0ZXBzIHdpbGwgYmUgZXhlY3V0ZWQgaW4gdGhlIG9yZGVyIHRoYXQgZmxhZ3MgYXJlIHByb3ZpZGVkCiAgICAiCn0KCiMgcGFyc2VfcnVuX29wdGlvbnMgdGFrZXMgYWxsIGFyZ3VlbWVudHMgcGFzc2VkIHRvIG1haW4gYW5kIHBhcnNlcyB0aGVtCiMgYWxsb3dpbmcgaW5kaXZpZHVhbCBzdGVwKHMpIHRvIGJlIHJhbiwgcmF0aGVyIHRoYW4gYWxsIHN0ZXBzCiMKIyBUaGlzIGlzIHVzZWZ1bCBmb3IgbG9jYWwgdGVzdGluZywgb3IgcG9zc2libHkgbW9kaWZ5aW5nIHRoZSBib290c3RyYXAgZXhlY3V0aW9uIHZpYSBlbnZpcm9ubWVudCB2YXJpYWJsZXMgaW4gdGhlIGRlcGxveW1lbnQgcGlwZWxpbmUKcGFyc2VfcnVuX29wdGlvbnMoKSB7CiAgICAjIHNoZWxsY2hlY2sgZGlzYWJsZT1TQzIyMDYKICAgIGxvY2FsIC1uIHJ1bl9vcHRpb25zPSIkMSIKICAgIGxvY2FsIC1uIHBrZ3NfdG9fZXhjbHVkZT0iJDIiCiAgICBsb2NhbCAtbiBwa2dzX3RvX2luc3RhbGw9IiQzIgogICAgbG9jYWwgLW4gcG9ydHNfdG9fZW5hYmxlPSIkNCIKICAgIGxvY2FsIC1uIHNlcnZpY2VzX3RvX2VuYWJsZT0iJDUiCiAgICBsb2NhbCAtbiBpbWFnZXNfdG9fcHVsbD0iJDYiCgogICAgaWYgWyAiJHsjcnVuX29wdGlvbnNbQF19IiAtZXEgMCBdOyB0aGVuCiAgICAgICAgbG9nICJSdW5uaW5nIGFsbCBzdGVwcyIKICAgICAgICByZXR1cm4gMAogICAgZmkKCiAgICBsb2NhbCBPUFRJTkQKCWxvY2FsIC1yIGFsbG93ZWRfb3B0aW9ucz0icGZ1aSIKICAgIHdoaWxlIGdldG9wdHMgJHthbGxvd2VkX29wdGlvbnN9IG9wdGlvbnM7IGRvCiAgICAgICAgY2FzZSAiJHtydW5fb3B0aW9uc30iIGluCiAgICAgICAgICAgIHApCiAgICAgICAgICAgICAgICBsb2cgIlJ1bm5pbmcgc3RlcCBkbmZfdXBkYXRlX3BrZ3MiCiAgICAgICAgICAgICAgICBkbmZfdXBkYXRlX3BrZ3MgcGtnc190b19leGNsdWRlIHJldHJ5X3dhaXRfdGltZQoKICAgICAgICAgICAgICAgIGxvZyAiUnVubmluZyBzdGVwIGRuZl9pbnN0YWxsX3BrZ3MiCiAgICAgICAgICAgICAgICBkbmZfaW5zdGFsbF9wa2dzIHBrZ3NfdG9faW5zdGFsbCByZXRyeV93YWl0X3RpbWUKCiAgICAgICAgICAgICAgICBsb2cgIlJ1bm5pbmcgc3RlcCBjb25maWd1cmVfZG5mX2Nyb25fam9iIgogICAgICAgICAgICAgICAgY29uZmlndXJlX2RuZl9jcm9uX2pvYgogICAgICAgICAgICAgICAgOzsKICAgICAgICAgICAgZikKICAgICAgICAgICAgICAgIGxvZyAiUnVubmluZyBjb25maWd1cmVfZmlyZXdhbGxkX3J1bGVzIgogICAgICAgICAgICAgICAgY29uZmlndXJlX2ZpcmV3YWxsZF9ydWxlcyBwb3J0c190b19lbmFibGUKICAgICAgICAgICAgICAgIDs7CiAgICAgICAgICAgIHUpCiAgICAgICAgICAgICAgICBsb2cgIlJ1bm5pbmcgc3RlcCBjb25maWd1cmVfZGV2cHJveHlfc2VydmljZXMiCiAgICAgICAgICAgICAgICBjb25maWd1cmVfZGV2cHJveHlfc2VydmljZXMgcHJveHlfaW1hZ2VzCiAgICAgICAgICAgICAgICBlbmFibGVfc2VydmljZXMgc2VydmljZXNfdG9fZW5hYmxlCiAgICAgICAgICAgICAgICA7OwogICAgICAgICAgICBpKQogICAgICAgICAgICAgICAgbG9nICJSdW5uaW5nIHB1bGxfY29udGFpbmVyX2ltYWdlcyIKICAgICAgICAgICAgICAgIHB1bGxfY29udGFpbmVyX2ltYWdlcyBpbWFnZXNfdG9fcHVsbAogICAgICAgICAgICAgICAgOzsKICAgICAgICAgICAgKikKICAgICAgICAgICAgICAgIHVzYWdlIGFsbG93ZWRfb3B0aW9ucwogICAgICAgICAgICAgICAgYWJvcnQgIlVua293biBvcHRpb24gcHJvdmlkZWQiCiAgICAgICAgICAgICAgICA7OwogICAgICAgIGVzYWMKICAgIGRvbmUKICAgIAogICAgZXhpdCAwCn0KCiMgY29uZmlndXJlX3N5c3RlbV9zZXJ2aWNlcyBjcmVhdGVzLCBjb25maWd1cmVzLCBhbmQgZW5hYmxlcyB0aGUgZm9sbG93aW5nIHN5c3RlbWQgc2VydmljZXMgYW5kIHRpbWVycwojIHNlcnZpY2VzCiMJcHJveHkKY29uZmlndXJlX2RldnByb3h5X3NlcnZpY2VzKCkgewoJY29uZmlndXJlX3NlcnZpY2VfcHJveHkgIiQxIgp9CgojIGVuYWJsZV9hcm9fc2VydmljZXMgZW5hYmxlcyBhbGwgc2VydmljZXMgcmVxdWlyZWQgZm9yIGFybyBycAplbmFibGVfYXJvX3NlcnZpY2VzKCkgewogICAgbG9nICJzdGFydGluZyIKCiAgICBsb2cgImVuYWJsaW5nIGFybyBzZXJ2aWNlcyAke2Fyb19zZXJ2aWNlc1sqXX0iCiAgICAjIHNoZWxsY2hlY2sgZGlzYWJsZT1TQzIwNjgKICAgIGZvciBzZXJ2aWNlIGluICR7YXJvX3NlcnZpY2VzW0BdfTsgZG8KICAgICAgICBsb2cgIkVuYWJsaW5nICRzZXJ2aWNlIG5vdyIKICAgICAgICBzeXN0ZW1jdGwgZW5hYmxlICIkc2VydmljZS5zZXJ2aWNlIgogICAgZG9uZQp9CgojIGNvbmZpZ3VyZV9jZXJ0cwpjb25maWd1cmVfY2VydHMoKSB7CiAgICBsb2cgInN0YXJ0aW5nIgoKCWJhc2U2NCAtZCA8PDwiJFBST1hZQ0VSVCIgPi9ldGMvcHJveHkvcHJveHkuY3J0CgliYXNlNjQgLWQgPDw8IiRQUk9YWUtFWSIgPi9ldGMvcHJveHkvcHJveHkua2V5CgliYXNlNjQgLWQgPDw8IiRQUk9YWUNMSUVOVENFUlQiID4vZXRjL3Byb3h5L3Byb3h5LWNsaWVudC5jcnQKCWNob3duIC1SIDEwMDA6MTAwMCAvZXRjL3Byb3h5CgljaG1vZCAwNjAwIC9ldGMvcHJveHkvcHJveHkua2V5Cn0KCmNvbmZpZ3VyZV9zZXJ2aWNlX3Byb3h5KCkgewoJbG9jYWwgLXIgc3lzY29uZmlnX3Byb3h5X2ZpbGVuYW1lPScvZXRjL3N5c2NvbmZpZy9wcm94eScKCWxvY2FsIC1yIHN5c2NvbmZpZ19wcm94eV9maWxlPSJQUk9YWV9JTUFHRT0nJDEnIgoKCXdyaXRlX2ZpbGUgc3lzY29uZmlnX3Byb3h5X2ZpbGVuYW1lIHN5c2NvbmZpZ19wcm94eV9maWxlIHRydWUKCglsb2NhbCAtciBwcm94eV9zZXJ2aWNlX2ZpbGVuYW1lPScvZXRjL3N5c3RlbWQvc3lzdGVtL3Byb3h5LnNlcnZpY2UnCglsb2NhbCAtciBwcm94eV9zZXJ2aWNlX2ZpbGU9IltVbml0XQpBZnRlcj1uZXR3b3JrLW9ubGluZS50YXJnZXQKV2FudHM9bmV0d29yay1vbmxpbmUudGFyZ2V0CgpbU2VydmljZV0KRW52aXJvbm1lbnRGaWxlPS9ldGMvc3lzY29uZmlnL3Byb3h5CkV4ZWNTdGFydFByZT0tL3Vzci9iaW4vZG9ja2VyIHJtIC1mICVuCkV4ZWNTdGFydD0vdXNyL2Jpbi9kb2NrZXIgcnVuIC0tcm0gLS1uYW1lICVuIC1wIDQ0Mzo4NDQzIC12IC9ldGMvcHJveHk6L3NlY3JldHMgJDEKRXhlY1N0b3A9L3Vzci9iaW4vZG9ja2VyIHN0b3AgJW4KUmVzdGFydD1hbHdheXMKUmVzdGFydFNlYz0xClN0YXJ0TGltaXRJbnRlcnZhbD0wCgpbSW5zdGFsbF0KV2FudGVkQnk9bXVsdGktdXNlci50YXJnZXQiCgogICAgd3JpdGVfZmlsZSBwcm94eV9zZXJ2aWNlX2ZpbGVuYW1lIHByb3h5X3NlcnZpY2VfZmlsZSB0cnVlCgoJbG9jYWwgLXIgY3Jvbl93ZWVrbHlfcHVsbF9pbWFnZV9maWxlbmFtZT0nL2V0Yy9jcm9uLndlZWtseS9wdWxsLWltYWdlJwoJbG9jYWwgLXIgY3Jvbl93ZWVrbHlfcHVsbF9pbWFnZV9maWxlPSIjIS9iaW4vYmFzaApkb2NrZXIgcHVsbCAkMQpzeXN0ZW1jdGwgcmVzdGFydCBwcm94eS5zZXJ2aWNlIgoJCgl3cml0ZV9maWxlIGNyb25fd2Vla2x5X3B1bGxfaW1hZ2VfZmlsZW5hbWUgY3Jvbl93ZWVrbHlfcHVsbF9pbWFnZV9maWxlIHRydWUKCWNobW9kICt4ICIkY3Jvbl93ZWVrbHlfcHVsbF9pbWFnZV9maWxlbmFtZSIKCglsb2NhbCAtciBjcm9uX2RhaWx5X3Jlc3RhcnRfcHJveHlfZmlsZW5hbWU9Jy9ldGMvY3Jvbi5kYWlseS9yZXN0YXJ0LXByb3h5JwoJbG9jYWwgLXIgY3Jvbl9kYWlseV9yZXN0YXJ0X3Byb3h5X2ZpbGU9IiMhL2Jpbi9iYXNoCnN5c3RlbWN0bCByZXN0YXJ0IHByb3h5LnNlcnZpY2UiCgkKCXdyaXRlX2ZpbGUgY3Jvbl9kYWlseV9yZXN0YXJ0X3Byb3h5X2ZpbGVuYW1lIGNyb25fZGFpbHlfcmVzdGFydF9wcm94eV9maWxlCgljaG1vZCAreCAiJGNyb25fZGFpbHlfcmVzdGFydF9wcm94eV9maWxlbmFtZSIKfQoKZXhwb3J0IEFaVVJFX0NMT1VEX05BTUU9IiR7QVpVUkVDTE9VRE5BTUU6PyJGYWlsZWQgdG8gY2Fycnkgb3ZlciB2YXJpYWJsZXMifSIKCm1haW4gIiRAIgo=')))]" }, "provisionAfterExtensions": [ "Microsoft.Azure.Monitor.AzureMonitorLinuxAgent", diff --git a/pkg/deploy/assets/rp-production.json b/pkg/deploy/assets/rp-production.json index 19c4eed5edc..7eb662209c2 100644 --- a/pkg/deploy/assets/rp-production.json +++ b/pkg/deploy/assets/rp-production.json @@ -516,7 +516,7 @@ "autoUpgradeMinorVersion": true, "settings": {}, "protectedSettings": { - "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','ADMINAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('adminApiClientCertCommonName')),''')\n','ARMAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armApiClientCertCommonName')),''')\n','ARMCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armClientId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','BILLINGE2ESTORAGEACCOUNTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('billingE2EStorageAccountId')),''')\n','CLUSTERMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdmAccount')),''')\n','CLUSTERMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdAccount')),''')\n','CLUSTERMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdConfigVersion')),''')\n','CLUSTERMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdNamespace')),''')\n','CLUSTERPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterParentDomainName')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','FPCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpClientId')),''')\n','FPSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpServicePrincipalId')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYRESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayResourceGroupName')),''')\n','GATEWAYSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayServicePrincipalId')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','PORTALACCESSGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalAccessGroupIds')),''')\n','PORTALCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalClientId')),''')\n','PORTALELEVATEDGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalElevatedGroupIds')),''')\n','RPFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpFeatures')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdConfigVersion')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','RPPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpParentDomainName')),''')\n','CLUSTERSINSTALLVIAHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersInstallViaHive')),''')\n','CLUSTERSADOPTBYHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersAdoptByHive')),''')\n','CLUSTERDEFAULTINSTALLERPULLSPEC=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterDefaultInstallerPullspec')),''')\n','USECHECKACCESS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('useCheckAccess')),''')\n','ADMINAPICABUNDLE=''',parameters('adminApiCaBundle'),'''\n','ARMAPICABUNDLE=''',parameters('armApiCaBundle'),'''\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

set -o errexit \
    -o nounset

if [ "${DEBUG:-false}" == true ]; then
    set -x
fi

main() {
    # transaction attempt retry time in seconds
    local -ri retry_wait_time=60

    # shellcheck source=common.sh
    source common.sh

    local -ar exclude_pkgs=(
        "-x WALinuxAgent"
        "-x WALinuxAgent-udev"
    )

    local -ra rpm_keys=(
        https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
        https://packages.microsoft.com/keys/microsoft.asc
    )

    local -ra repo_rpm_pkgs=(
        https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm
    )

    local -ra install_pkgs=(
        clamav
        azsec-clamav
        azsec-monitor
        azure-cli
        azure-mdsd
        azure-security
        podman
        podman-docker
        openssl-perl
        # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
        python3
    )

    MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
    local -ra images=(
        "$MDMIMAGE"
        "$RPIMAGE"
        "$FLUENTBITIMAGE"
    )

    local -ra enable_ports=(
        "443/tcp"
        "444/tcp"
        "445/tcp"
        "2222/tcp"
    )

    local -ra aro_services=(
        "aro-dbtoken"
        "aro-monitor"
        "aro-portal"
        "aro-rp"
        "auoms"
        "azsecd"
        "azsecmond"
        "mdsd"
        "mdm"
        "chronyd"
        "fluentbit"
    )

    parse_run_options "$@" \
                        retry_wait_time \
                        exclude_pkgs \
                        rpm_keys \
                        repo_rpm_pkgs \
                        install_pkgs \
                        images \
                        enable_ports \
                        aro_services

    configure_sshd
    configure_rpm_repos retry_wait_time

    dnf_update_pkgs exclude_pkgs retry_wait_time

    rpm_import_keys rpm_keys retry_wait_time

    dnf_install_pkgs repo_rpm_pkgs retry_wait_time
    dnf_install_pkgs install_pkgs retry_wait_time
    configure_dnf_cron_job

    configure_disk_partitions
    configure_logrotate
    configure_selinux

    mkdir -p /var/log/journal
    mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

    configure_firewalld_rules enable_ports

    pull_container_images images
    configure_aro_services
    enable_services

    enable_services aro_services

    reboot_vm
}

usage() {
    local -n options="$1"
    log "$(basename "$0") [$options]
        -d Configure Disk Partitions
        -p Configure rpm repositories, import required rpm keys, update & install packages with dnf
        -l Configure logrotate.conf
        -s Configure selinux
        -r Configure sshd - Allow password authenticaiton
        -f Configure firewalld default zone rules
        -u Configure systemd unit files
        -i Pull container images

        Note: steps will be executed in the order that flags are provided
    "
}

# parse_run_options takes all arguements passed to main and parses them
# allowing individual step(s) to be ran, rather than all steps
#
# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline
parse_run_options() {
    # shellcheck disable=SC2206
    local -a options=(${1:-})
    local -n retry_time="$2"
    local -n pkgs_to_exclude="$3"
    local -n keys_to_import="$4"
    local -n rpm_pkgs="$5"
    local -n pkgs_to_install="$6"
    local -n images_to_pull="$7"
    local -n ports_to_enable="$8"
    local -n services_to_enable="$9"

    if [ "${#options[@]}" -eq 0 ]; then
        log "Running all steps"
        return 0
    fi

    local OPTIND
    local -r allowed_options="dplsrfui"
    while getopts ${allowed_options} options; do
        case "${options}" in
            d)
                log "Running step configure_disk_partitions"
                configure_disk_partitions
                ;;
            p)
                log "Running step configure_rpm_repos"
                configure_rpm_repos keys_to_import

                log "Running step dnf_update_pkgs"
                dnf_update_pkgs pkgs_to_exclude retry_time

                log "Running step dnf_install_pkgs rpm_pkgs"
                dnf_install_pkgs rpm_pkgs retry_time

                log "Running step dnf_install_pkgs pkgs"
                dnf_install_pkgs pkgs_to_install retry_time
                
                log "Running step configure_dnf_crond_job"
                configure_dnf_cron_job
                ;;
            l)
                log "Running configure_logrotate"
                configure_logrotate
                ;;
            s)
                log "Running configure_selinux"
                configure_selinux
                ;;
            r)
                log "Running configure_sshd"
                configure_sshd
                ;;
            f)
                log "Running configure_firewalld_rules"
                configure_firewalld_rules ports_to_enable
                ;;
            u)
                log "Running pull_container_images & configure_system_services"
                configure_aro_services
                enable_services services_to_enable
                ;;
            i)
                log "Running pull_container_images"
                pull_container_images images_to_pull
                ;;
            *)
                usage allowed_options
                abort "Unkown option provided"
                ;;
        esac
    done
    
    exit 0
}

# configure_rpm_repos
configure_rpm_repos() {
    log "starting"

    configure_rhui_repo "$1"
    create_azure_rpm_repos "$1"
}

# configure_disk_partitions
configure_disk_partitions() {
    log "starting"
    log "extending partition table"

    # Linux block devices are inconsistently named
    # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
    physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
    growpart "$physical_disk" 2

    log "extending filesystems"
    log "extending root lvm"
    lvextend -l +20%FREE /dev/rootvg/rootlv
    log "growing root filesystem"
    xfs_growfs /

    log "extending var lvm"
    lvextend -l +100%FREE /dev/rootvg/varlv
    log "growing var filesystem"
    xfs_growfs /var
}

# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file
create_azure_rpm_repos() {
    log "starting"

    local -r azure_repo_filename='/etc/yum.repos.d/azure.repo'
    local -r azure_repo_file='[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no'

    write_file azure_repo_filename azure_repo_file true
}

# configure_aro_services creates, configures, and enables the following systemd services and timers
# services
#   fluentbit
#   mdm
#   mdsd
#   arp-rp
#   aro-dbtoken
#   aro-monitor
#   aro-portal
configure_aro_services() {
    configure_service_fluentbit
    configure_service_mdm
    configure_timers_mdm_mdsd
    configure_service_aro_rp
    configure_service_aro_dbtoken
    configure_service_aro_monitor
    configure_service_aro_portal
    configure_service_mdsd
}

# configure_service_fluentbit
configure_service_fluentbit() {
    log "starting"
    log "configuring fluentbit service"

    mkdir -p /etc/fluentbit/
    mkdir -p /var/lib/fluent

    local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf'
    local -r fluentbit_conf_file="[INPUT]
Name systemd
Tag journald
Systemd_Filter _COMM=aro
DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND asyncqos asyncqos true

[FILTER]
	Name modify
	Match asyncqos
	Remove CLIENT_PRINCIPAL_NAME
	Remove FILE
	Remove COMPONENT

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND ifxaudit ifxaudit false

[OUTPUT]
	Name forward
	Match *
	Port 29230"

    write_file fluentbit_conf_filename fluentbit_conf_file true

    local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit'
    local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE"

    write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true

    local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service'

    local -r fluentbit_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file fluentbit_service_filename fluentbit_service_file true
}

# configure_certs
configure_certs() {
    log "starting"

    mkdir /etc/aro-rp
    base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem
    if [[ -n "$ARMAPICABUNDLE" ]]; then
    base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem
    fi
    chown -R 1000:1000 /etc/aro-rp

    # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
    # to honour SSL_CERT_FILE any more, heaven only knows why.
    mkdir -p /usr/lib/ssl/certs
    csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null
    c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
    local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config"
    local -r nodescan_agent_file="{
    \"Nice\": 19,
    \"Timeout\": 10800,
    \"ClientId\": \"\",
    \"TenantId\": $AZURESECPACKVSATENANTID,
    \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL,
    \"ProcessTimeout\": 300,
    \"CommandDelay\": 0
  }"

    write_file nodescan_agent_filename nodescan_agent_file true
}

# configure_service_mdm
configure_service_mdm() {
    log "starting"
    log "configuring mdm service"

    local -r sysconfig_mdm_filename="/etc/sysconfig/mdm"
    local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=rp
MDMSOURCEROLEINSTANCE=\"$(hostname)\""

    write_file sysconfig_mdm_filename sysconfig_mdm_file true

    mkdir -p /var/etw
    local -r mdm_service_filename="/etc/systemd/system/mdm.service"
    local -r mdm_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file mdm_service_filename mdm_service_file true
}

# configure_timers_mdm_mdsd
configure_timers_mdm_mdsd() {
    log "starting"

    for var in "mdsd" "mdm"; do
        local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service"
        local download_creds_service_file="[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var"

        write_file download_creds_service_filename download_creds_service_file true

        local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer"
        local download_creds_timer_file="[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target"

        write_file download_creds_timer_filename download_creds_timer_file true
    done

    local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh"
    local -r download_creds_script_file="#!/bin/bash
set -eu

COMPONENT=\$1
echo \"Download \$COMPONENT credentials\"

TEMP_DIR=\"\$(mktemp -d)\"
export AZURE_CONFIG_DIR=\"\$(mktemp -d)\"

echo \"Logging into Azure...\"
RETRIES=3
while [[ \$RETRIES -gt 0 ]]; do
    if az login -i --allow-no-subscriptions
    then
        echo \"az login successful\"
        break
    else
        echo \"az login failed. Retrying...\"
        let RETRIES-=1
        sleep 5
    fi
done

trap \"cleanup\" EXIT

cleanup() {
  az logout
  [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [[ \$COMPONENT = \"mdm\" ]]; then
  CURRENT_CERT_FILE=\"/etc/mdm.pem\"
elif [[ \$COMPONENT\ = \"mdsd\" ]]; then
  CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME=\"rp-\${COMPONENT}\"
NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\"
for attempt in {1..5}; do
  az keyvault \
    secret \
    download \
    --file \"\$NEW_CERT_FILE\" \
    --id \"https://$KEYVAULTPREFIX-svc.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \
    && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [[ \$COMPONENT = \"mdsd\" ]]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi"

    write_file download_creds_script_filename download_creds_script_file true

    chmod u+x /usr/local/bin/download-credentials.sh

    systemctl enable download-mdsd-credentials.timer
    systemctl enable download-mdm-credentials.timer

    /usr/local/bin/download-credentials.sh mdsd
    /usr/local/bin/download-credentials.sh mdm

    local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')"
    local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service"
    local -r watch_mdm_creds_service_file="[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target"

    write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file true

    local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path'
    local -r watch_mdm_creds_path_file='[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target'

    write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file true

    local -r watch_mdm_creds='watch-mdm-credentials.path'
    systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds"
    systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds"
}

# configure_service_aro_rp
configure_service_aro_rp() {
    log "starting"

    local -r aro_rp_conf_filename='/etc/sysconfig/aro-rp'
    local -r aro_rp_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID'
ADMIN_API_CLIENT_CERT_COMMON_NAME='$ADMINAPICLIENTCERTCOMMONNAME'
ARM_API_CLIENT_CERT_COMMON_NAME='$ARMAPICLIENTCERTCOMMONNAME'
AZURE_ARM_CLIENT_ID='$ARMCLIENTID'
AZURE_FP_CLIENT_ID='$FPCLIENTID'
AZURE_FP_SERVICE_PRINCIPAL_ID='$FPSERVICEPRINCIPALID'
BILLING_E2E_STORAGE_ACCOUNT_ID='$BILLINGE2ESTORAGEACCOUNTID'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=RP
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=RP
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
RP_FEATURES='$RPFEATURES'
RPIMAGE='$RPIMAGE'
ARO_INSTALL_VIA_HIVE='$CLUSTERSINSTALLVIAHIVE'
ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC='$CLUSTERDEFAULTINSTALLERPULLSPEC'
ARO_ADOPT_BY_HIVE='$CLUSTERSADOPTBYHIVE'
USE_CHECKACCESS='$USECHECKACCESS'"

    write_file aro_rp_conf_filename aro_rp_conf_file true

    local -r aro_rp_service_filename='/etc/systemd/system/aro-rp.service'
    local -r aro_rp_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-rp
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e ADMIN_API_CLIENT_CERT_COMMON_NAME \
  -e ARM_API_CLIENT_CERT_COMMON_NAME \
  -e AZURE_ARM_CLIENT_ID \
  -e AZURE_FP_CLIENT_ID \
  -e BILLING_E2E_STORAGE_ACCOUNT_ID \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e CLUSTER_MDSD_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e DOMAIN_NAME \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e MDSD_ENVIRONMENT \
  -e RP_FEATURES \
  -e ARO_INSTALL_VIA_HIVE \
  -e ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC \
  -e ARO_ADOPT_BY_HIVE \
  -e USE_CHECKACCESS \
  -m 2g \
  -p 443:8443 \
  -v /etc/aro-rp:/etc/aro-rp \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  rp
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_rp_service_filename aro_rp_service_file true
}

# configure_service_aro_dbtoken
configure_service_aro_dbtoken() {
    log "starting"

    local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken'
    local -r aro_dbtoken_service_conf_file="DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=DBToken
RPIMAGE='$RPIMAGE'"

    write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file true

    local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service'
    local -r aro_dbtoken_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-dbtoken
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 445:8445 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  dbtoken
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_dbtoken_service_filename aro_dbtoken_service_file true
}

# configure_service_aro_monitor
configure_service_aro_monitor() {
    log "starting"
    log "configuring aro-monitor service"

    # DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE
    # are not used, but can't easily be refactored out. Should be revisited in the future.
    local -r aro_monitor_service_conf_filename='/etc/sysconfig/aro-monitor'
    local -r aro_monitor_service_conf_file="AZURE_FP_CLIENT_ID='$FPCLIENTID'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=BBM
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=BBM
RPIMAGE='$RPIMAGE'"

    write_file aro_monitor_service_conf_filename aro_monitor_service_conf_file true

    local -r aro_monitor_service_filename='/etc/systemd/system/aro-monitor.service'
    local -r aro_monitor_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-monitor
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_FP_CLIENT_ID \
  -e DOMAIN_NAME \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e MDSD_ENVIRONMENT \
  -e CLUSTER_MDSD_NAMESPACE \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2.5g \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  monitor
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_monitor_service_filename aro_monitor_service_file true
}

# configure_service_aro_portal
configure_service_aro_portal() {
    log "starting"

    local -r aro_portal_service_conf_filename='/etc/sysconfig/aro-portal'
    local -r aro_portal_service_conf_file="AZURE_PORTAL_ACCESS_GROUP_IDS='$PORTALACCESSGROUPIDS'
AZURE_PORTAL_CLIENT_ID='$PORTALCLIENTID'
AZURE_PORTAL_ELEVATED_GROUP_IDS='$PORTALELEVATEDGROUPIDS'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Portal
PORTAL_HOSTNAME='$LOCATION.admin.$RPPARENTDOMAINNAME'
RPIMAGE='$RPIMAGE'"

    write_file aro_portal_service_conf_filename aro_portal_service_conf_file true

    local -r aro_portal_service_filename='/etc/systemd/system/aro-portal.service'
    local -r aro_portal_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitInterval=0

[Service]
EnvironmentFile=/etc/sysconfig/aro-portal
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_PORTAL_ACCESS_GROUP_IDS \
  -e AZURE_PORTAL_CLIENT_ID \
  -e AZURE_PORTAL_ELEVATED_GROUP_IDS \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e PORTAL_HOSTNAME \
  -m 2g \
  -p 444:8444 \
  -p 2222:2222 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  portal
Restart=always
RestartSec=1

[Install]
WantedBy=multi-user.target"

    write_file aro_portal_service_filename aro_portal_service_file true
}

# configure_service_mdsd
configure_service_mdsd() {
    log "starting"

    local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d"
    mkdir -p "$mdsd_service_dir"

    local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf"
    local -r mdsd_override_conf_file="[Unit]
After=network-online.target"

    write_file mdsd_override_conf_filename mdsd_override_conf_file true

    local -r default_mdsd_filename="/etc/default/mdsd"
    local -r default_mdsd_file="MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS=\"-A -d -r \$MDSD_ROLE_PREFIX\"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$RPMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=rp
export MONITORING_ROLE_INSTANCE=\"$(hostname)\"

export MDSD_MSGPACK_SORT_COLUMNS=1\""

    write_file default_mdsd_filename default_mdsd_file true

}

# run_azsecd_config_scan
run_azsecd_config_scan() {
    log "starting"

    local -ar configs=(
        "baseline"
        "clamav"
        "software"
    )

    log "Scanning configuration files ${configs[*]}"
    # shellcheck disable=SC2068
    for scan in ${configs[@]}; do
        log "Scanning config file $scan now"
        /usr/local/bin/azsecd config -s "$scan" -d P1D
    done
}

export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}"

main "$@"
')))]" + "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','ADMINAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('adminApiClientCertCommonName')),''')\n','ARMAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armApiClientCertCommonName')),''')\n','ARMCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armClientId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','BILLINGE2ESTORAGEACCOUNTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('billingE2EStorageAccountId')),''')\n','CLUSTERMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdmAccount')),''')\n','CLUSTERMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdAccount')),''')\n','CLUSTERMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdConfigVersion')),''')\n','CLUSTERMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdNamespace')),''')\n','CLUSTERPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterParentDomainName')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','FPCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpClientId')),''')\n','FPSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpServicePrincipalId')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYRESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayResourceGroupName')),''')\n','GATEWAYSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayServicePrincipalId')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','PORTALACCESSGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalAccessGroupIds')),''')\n','PORTALCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalClientId')),''')\n','PORTALELEVATEDGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalElevatedGroupIds')),''')\n','RPFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpFeatures')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdConfigVersion')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','RPPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpParentDomainName')),''')\n','CLUSTERSINSTALLVIAHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersInstallViaHive')),''')\n','CLUSTERSADOPTBYHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersAdoptByHive')),''')\n','CLUSTERDEFAULTINSTALLERPULLSPEC=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterDefaultInstallerPullspec')),''')\n','USECHECKACCESS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('useCheckAccess')),''')\n','ADMINAPICABUNDLE=''',parameters('adminApiCaBundle'),'''\n','ARMAPICABUNDLE=''',parameters('armApiCaBundle'),'''\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

set -o errexit \
    -o nounset

if [ "${DEBUG:-false}" == true ]; then
    set -x
fi

main() {
    # transaction attempt retry time in seconds
    local -ri retry_wait_time=60

    # shellcheck source=common.sh
    source common.sh

    local -ar exclude_pkgs=(
        "-x WALinuxAgent"
        "-x WALinuxAgent-udev"
    )

    local -ra rpm_keys=(
        https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
        https://packages.microsoft.com/keys/microsoft.asc
    )

    local -ra repo_rpm_pkgs=(
        https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm
    )

    local -ra install_pkgs=(
        clamav
        azsec-clamav
        azsec-monitor
        azure-cli
        azure-mdsd
        azure-security
        podman
        podman-docker
        openssl-perl
        # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
        python3
    )

    MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
    local -ra images=(
        "$MDMIMAGE"
        "$RPIMAGE"
        "$FLUENTBITIMAGE"
    )

    local -ra enable_ports=(
        "443/tcp"
        "444/tcp"
        "445/tcp"
        "2222/tcp"
    )

    local -ra aro_services=(
        "aro-dbtoken"
        "aro-monitor"
        "aro-portal"
        "aro-rp"
        "auoms"
        "azsecd"
        "azsecmond"
        "mdsd"
        "mdm"
        "chronyd"
        "fluentbit"
    )

    local -ra user_options=("$@")
    parse_run_options user_options \
                        retry_wait_time \
                        exclude_pkgs \
                        rpm_keys \
                        repo_rpm_pkgs \
                        install_pkgs \
                        images \
                        enable_ports \
                        aro_services

    configure_sshd
    configure_rpm_repos retry_wait_time

    dnf_update_pkgs exclude_pkgs retry_wait_time

    rpm_import_keys rpm_keys retry_wait_time

    dnf_install_pkgs repo_rpm_pkgs retry_wait_time
    dnf_install_pkgs install_pkgs retry_wait_time
    configure_dnf_cron_job

    configure_disk_partitions
    configure_logrotate
    configure_selinux

    mkdir -p /var/log/journal
    mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

    configure_firewalld_rules enable_ports

    pull_container_images images
    configure_aro_services
    enable_services

    enable_services aro_services

    reboot_vm
}

usage() {
    local -n options="$1"
    log "$(basename "$0") [$options]
        -d Configure Disk Partitions
        -p Configure rpm repositories, import required rpm keys, update & install packages with dnf
        -l Configure logrotate.conf
        -s Configure selinux
        -r Configure sshd - Allow password authenticaiton
        -f Configure firewalld default zone rules
        -u Configure systemd unit files
        -i Pull container images

        Note: steps will be executed in the order that flags are provided
    "
}

# parse_run_options takes all arguements passed to main and parses them
# allowing individual step(s) to be ran, rather than all steps
#
# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline
parse_run_options() {
    # shellcheck disable=SC2206
    local -n run_options="$1"
    local -n retry_time="$2"
    local -n pkgs_to_exclude="$3"
    local -n keys_to_import="$4"
    local -n rpm_pkgs="$5"
    local -n pkgs_to_install="$6"
    local -n images_to_pull="$7"
    local -n ports_to_enable="$8"
    local -n services_to_enable="$9"

    if [ "${#run_options[@]}" -eq 0 ]; then
        log "Running all steps"
        return 0
    fi

    local OPTIND
    local -r allowed_options="dplsrfui"
    while getopts ${allowed_options} options; do
        case "${run_options}" in
            d)
                log "Running step configure_disk_partitions"
                configure_disk_partitions
                ;;
            p)
                log "Running step configure_rpm_repos"
                configure_rpm_repos keys_to_import

                log "Running step dnf_update_pkgs"
                dnf_update_pkgs pkgs_to_exclude retry_time

                log "Running step dnf_install_pkgs rpm_pkgs"
                dnf_install_pkgs rpm_pkgs retry_time

                log "Running step dnf_install_pkgs pkgs"
                dnf_install_pkgs pkgs_to_install retry_time
                
                log "Running step configure_dnf_crond_job"
                configure_dnf_cron_job
                ;;
            l)
                log "Running configure_logrotate"
                configure_logrotate
                ;;
            s)
                log "Running configure_selinux"
                configure_selinux
                ;;
            r)
                log "Running configure_sshd"
                configure_sshd
                ;;
            f)
                log "Running configure_firewalld_rules"
                configure_firewalld_rules ports_to_enable
                ;;
            u)
                log "Running pull_container_images & configure_system_services"
                configure_aro_services
                enable_services services_to_enable
                ;;
            i)
                log "Running pull_container_images"
                pull_container_images images_to_pull
                ;;
            *)
                usage allowed_options
                abort "Unkown option provided"
                ;;
        esac
    done
    
    exit 0
}

# configure_rpm_repos
configure_rpm_repos() {
    log "starting"

    configure_rhui_repo "$1"
    create_azure_rpm_repos "$1"
}

# configure_disk_partitions
configure_disk_partitions() {
    log "starting"
    log "extending partition table"

    # Linux block devices are inconsistently named
    # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
    physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
    growpart "$physical_disk" 2

    log "extending filesystems"
    log "extending root lvm"
    lvextend -l +20%FREE /dev/rootvg/rootlv
    log "growing root filesystem"
    xfs_growfs /

    log "extending var lvm"
    lvextend -l +100%FREE /dev/rootvg/varlv
    log "growing var filesystem"
    xfs_growfs /var
}

# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file
create_azure_rpm_repos() {
    log "starting"

    local -r azure_repo_filename='/etc/yum.repos.d/azure.repo'
    local -r azure_repo_file='[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no'

    write_file azure_repo_filename azure_repo_file true
}

# configure_aro_services creates, configures, and enables the following systemd services and timers
# services
#   fluentbit
#   mdm
#   mdsd
#   arp-rp
#   aro-dbtoken
#   aro-monitor
#   aro-portal
configure_aro_services() {
    configure_service_fluentbit
    configure_service_mdm
    configure_timers_mdm_mdsd
    configure_service_aro_rp
    configure_service_aro_dbtoken
    configure_service_aro_monitor
    configure_service_aro_portal
    configure_service_mdsd
}

# configure_service_fluentbit
configure_service_fluentbit() {
    log "starting"
    log "configuring fluentbit service"

    mkdir -p /etc/fluentbit/
    mkdir -p /var/lib/fluent

    local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf'
    local -r fluentbit_conf_file="[INPUT]
Name systemd
Tag journald
Systemd_Filter _COMM=aro
DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND asyncqos asyncqos true

[FILTER]
	Name modify
	Match asyncqos
	Remove CLIENT_PRINCIPAL_NAME
	Remove FILE
	Remove COMPONENT

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND ifxaudit ifxaudit false

[OUTPUT]
	Name forward
	Match *
	Port 29230"

    write_file fluentbit_conf_filename fluentbit_conf_file true

    local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit'
    local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE"

    write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true

    local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service'

    local -r fluentbit_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file fluentbit_service_filename fluentbit_service_file true
}

# configure_certs
configure_certs() {
    log "starting"

    mkdir /etc/aro-rp
    base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem
    if [[ -n "$ARMAPICABUNDLE" ]]; then
    base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem
    fi
    chown -R 1000:1000 /etc/aro-rp

    # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
    # to honour SSL_CERT_FILE any more, heaven only knows why.
    mkdir -p /usr/lib/ssl/certs
    csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null
    c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
    local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config"
    local -r nodescan_agent_file="{
    \"Nice\": 19,
    \"Timeout\": 10800,
    \"ClientId\": \"\",
    \"TenantId\": $AZURESECPACKVSATENANTID,
    \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL,
    \"ProcessTimeout\": 300,
    \"CommandDelay\": 0
  }"

    write_file nodescan_agent_filename nodescan_agent_file true
}

# configure_service_mdm
configure_service_mdm() {
    log "starting"
    log "configuring mdm service"

    local -r sysconfig_mdm_filename="/etc/sysconfig/mdm"
    local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=rp
MDMSOURCEROLEINSTANCE=\"$(hostname)\""

    write_file sysconfig_mdm_filename sysconfig_mdm_file true

    mkdir -p /var/etw
    local -r mdm_service_filename="/etc/systemd/system/mdm.service"
    local -r mdm_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file mdm_service_filename mdm_service_file true
}

# configure_timers_mdm_mdsd
configure_timers_mdm_mdsd() {
    log "starting"

    for var in "mdsd" "mdm"; do
        local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service"
        local download_creds_service_file="[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var"

        write_file download_creds_service_filename download_creds_service_file true

        local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer"
        local download_creds_timer_file="[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target"

        write_file download_creds_timer_filename download_creds_timer_file true
    done

    local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh"
    local -r download_creds_script_file="#!/bin/bash
set -eu

COMPONENT=\$1
echo \"Download \$COMPONENT credentials\"

TEMP_DIR=\"\$(mktemp -d)\"
export AZURE_CONFIG_DIR=\"\$(mktemp -d)\"

echo \"Logging into Azure...\"
RETRIES=3
while [[ \$RETRIES -gt 0 ]]; do
    if az login -i --allow-no-subscriptions
    then
        echo \"az login successful\"
        break
    else
        echo \"az login failed. Retrying...\"
        let RETRIES-=1
        sleep 5
    fi
done

trap \"cleanup\" EXIT

cleanup() {
  az logout
  [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [[ \$COMPONENT = \"mdm\" ]]; then
  CURRENT_CERT_FILE=\"/etc/mdm.pem\"
elif [[ \$COMPONENT\ = \"mdsd\" ]]; then
  CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME=\"rp-\${COMPONENT}\"
NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\"
for attempt in {1..5}; do
  az keyvault \
    secret \
    download \
    --file \"\$NEW_CERT_FILE\" \
    --id \"https://$KEYVAULTPREFIX-svc.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \
    && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [[ \$COMPONENT = \"mdsd\" ]]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi"

    write_file download_creds_script_filename download_creds_script_file true

    chmod u+x /usr/local/bin/download-credentials.sh

    systemctl enable download-mdsd-credentials.timer
    systemctl enable download-mdm-credentials.timer

    /usr/local/bin/download-credentials.sh mdsd
    /usr/local/bin/download-credentials.sh mdm

    local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')"
    local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service"
    local -r watch_mdm_creds_service_file="[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target"

    write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file true

    local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path'
    local -r watch_mdm_creds_path_file='[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target'

    write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file true

    local -r watch_mdm_creds='watch-mdm-credentials.path'
    systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds"
    systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds"
}

# configure_service_aro_rp
configure_service_aro_rp() {
    log "starting"

    local -r aro_rp_conf_filename='/etc/sysconfig/aro-rp'
    local -r aro_rp_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID'
ADMIN_API_CLIENT_CERT_COMMON_NAME='$ADMINAPICLIENTCERTCOMMONNAME'
ARM_API_CLIENT_CERT_COMMON_NAME='$ARMAPICLIENTCERTCOMMONNAME'
AZURE_ARM_CLIENT_ID='$ARMCLIENTID'
AZURE_FP_CLIENT_ID='$FPCLIENTID'
AZURE_FP_SERVICE_PRINCIPAL_ID='$FPSERVICEPRINCIPALID'
BILLING_E2E_STORAGE_ACCOUNT_ID='$BILLINGE2ESTORAGEACCOUNTID'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=RP
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=RP
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
RP_FEATURES='$RPFEATURES'
RPIMAGE='$RPIMAGE'
ARO_INSTALL_VIA_HIVE='$CLUSTERSINSTALLVIAHIVE'
ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC='$CLUSTERDEFAULTINSTALLERPULLSPEC'
ARO_ADOPT_BY_HIVE='$CLUSTERSADOPTBYHIVE'
USE_CHECKACCESS='$USECHECKACCESS'"

    write_file aro_rp_conf_filename aro_rp_conf_file true

    local -r aro_rp_service_filename='/etc/systemd/system/aro-rp.service'
    local -r aro_rp_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-rp
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e ADMIN_API_CLIENT_CERT_COMMON_NAME \
  -e ARM_API_CLIENT_CERT_COMMON_NAME \
  -e AZURE_ARM_CLIENT_ID \
  -e AZURE_FP_CLIENT_ID \
  -e BILLING_E2E_STORAGE_ACCOUNT_ID \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e CLUSTER_MDSD_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e DOMAIN_NAME \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e MDSD_ENVIRONMENT \
  -e RP_FEATURES \
  -e ARO_INSTALL_VIA_HIVE \
  -e ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC \
  -e ARO_ADOPT_BY_HIVE \
  -e USE_CHECKACCESS \
  -m 2g \
  -p 443:8443 \
  -v /etc/aro-rp:/etc/aro-rp \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  rp
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_rp_service_filename aro_rp_service_file true
}

# configure_service_aro_dbtoken
configure_service_aro_dbtoken() {
    log "starting"

    local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken'
    local -r aro_dbtoken_service_conf_file="DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=DBToken
RPIMAGE='$RPIMAGE'"

    write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file true

    local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service'
    local -r aro_dbtoken_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-dbtoken
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 445:8445 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  dbtoken
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_dbtoken_service_filename aro_dbtoken_service_file true
}

# configure_service_aro_monitor
configure_service_aro_monitor() {
    log "starting"
    log "configuring aro-monitor service"

    # DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE
    # are not used, but can't easily be refactored out. Should be revisited in the future.
    local -r aro_monitor_service_conf_filename='/etc/sysconfig/aro-monitor'
    local -r aro_monitor_service_conf_file="AZURE_FP_CLIENT_ID='$FPCLIENTID'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=BBM
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=BBM
RPIMAGE='$RPIMAGE'"

    write_file aro_monitor_service_conf_filename aro_monitor_service_conf_file true

    local -r aro_monitor_service_filename='/etc/systemd/system/aro-monitor.service'
    local -r aro_monitor_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-monitor
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_FP_CLIENT_ID \
  -e DOMAIN_NAME \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e MDSD_ENVIRONMENT \
  -e CLUSTER_MDSD_NAMESPACE \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2.5g \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  monitor
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_monitor_service_filename aro_monitor_service_file true
}

# configure_service_aro_portal
configure_service_aro_portal() {
    log "starting"

    local -r aro_portal_service_conf_filename='/etc/sysconfig/aro-portal'
    local -r aro_portal_service_conf_file="AZURE_PORTAL_ACCESS_GROUP_IDS='$PORTALACCESSGROUPIDS'
AZURE_PORTAL_CLIENT_ID='$PORTALCLIENTID'
AZURE_PORTAL_ELEVATED_GROUP_IDS='$PORTALELEVATEDGROUPIDS'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Portal
PORTAL_HOSTNAME='$LOCATION.admin.$RPPARENTDOMAINNAME'
RPIMAGE='$RPIMAGE'"

    write_file aro_portal_service_conf_filename aro_portal_service_conf_file true

    local -r aro_portal_service_filename='/etc/systemd/system/aro-portal.service'
    local -r aro_portal_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitInterval=0

[Service]
EnvironmentFile=/etc/sysconfig/aro-portal
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_PORTAL_ACCESS_GROUP_IDS \
  -e AZURE_PORTAL_CLIENT_ID \
  -e AZURE_PORTAL_ELEVATED_GROUP_IDS \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e PORTAL_HOSTNAME \
  -m 2g \
  -p 444:8444 \
  -p 2222:2222 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  portal
Restart=always
RestartSec=1

[Install]
WantedBy=multi-user.target"

    write_file aro_portal_service_filename aro_portal_service_file true
}

# configure_service_mdsd
configure_service_mdsd() {
    log "starting"

    local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d"
    mkdir -p "$mdsd_service_dir"

    local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf"
    local -r mdsd_override_conf_file="[Unit]
After=network-online.target"

    write_file mdsd_override_conf_filename mdsd_override_conf_file true

    local -r default_mdsd_filename="/etc/default/mdsd"
    local -r default_mdsd_file="MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS=\"-A -d -r \$MDSD_ROLE_PREFIX\"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$RPMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=rp
export MONITORING_ROLE_INSTANCE=\"$(hostname)\"

export MDSD_MSGPACK_SORT_COLUMNS=1\""

    write_file default_mdsd_filename default_mdsd_file true

}

# run_azsecd_config_scan
run_azsecd_config_scan() {
    log "starting"

    local -ar configs=(
        "baseline"
        "clamav"
        "software"
    )

    log "Scanning configuration files ${configs[*]}"
    # shellcheck disable=SC2068
    for scan in ${configs[@]}; do
        log "Scanning config file $scan now"
        /usr/local/bin/azsecd config -s "$scan" -d P1D
    done
}

export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}"

main "$@"
')))]" } } } diff --git a/pkg/deploy/generator/scripts/devProxyVMSS.sh b/pkg/deploy/generator/scripts/devProxyVMSS.sh index f7816f47294..b7ead0a35cf 100644 --- a/pkg/deploy/generator/scripts/devProxyVMSS.sh +++ b/pkg/deploy/generator/scripts/devProxyVMSS.sh @@ -133,18 +133,6 @@ configure_devproxy_services() { configure_service_proxy "$1" } -# enable_aro_services enables all services required for aro rp -enable_aro_services() { - log "starting" - - log "enabling aro services ${aro_services[*]}" - # shellcheck disable=SC2068 - for service in ${aro_services[@]}; do - log "Enabling $service now" - systemctl enable "$service.service" - done -} - # configure_certs configure_certs() { log "starting" @@ -157,8 +145,9 @@ configure_certs() { } configure_service_proxy() { + local -n proxy_image="$1" local -r sysconfig_proxy_filename='/etc/sysconfig/proxy' - local -r sysconfig_proxy_file="PROXY_IMAGE='$1'" + local -r sysconfig_proxy_file="PROXY_IMAGE='$proxy_image'" write_file sysconfig_proxy_filename sysconfig_proxy_file true @@ -170,7 +159,7 @@ Wants=network-online.target [Service] EnvironmentFile=/etc/sysconfig/proxy ExecStartPre=-/usr/bin/docker rm -f %n -ExecStart=/usr/bin/docker run --rm --name %n -p 443:8443 -v /etc/proxy:/secrets $1 +ExecStart=/usr/bin/docker run --rm --name %n -p 443:8443 -v /etc/proxy:/secrets $proxy_image ExecStop=/usr/bin/docker stop %n Restart=always RestartSec=1 @@ -183,7 +172,7 @@ WantedBy=multi-user.target" local -r cron_weekly_pull_image_filename='/etc/cron.weekly/pull-image' local -r cron_weekly_pull_image_file="#!/bin/bash -docker pull $1 +docker pull $proxy_image systemctl restart proxy.service" write_file cron_weekly_pull_image_filename cron_weekly_pull_image_file true From 8786bf160ba69bc42b33ecbf3c3388e9dcc77c57 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Thu, 18 Apr 2024 12:03:04 -0400 Subject: [PATCH 29/38] Correct docker json config file, overwrite daily proxy restart cron job --- pkg/deploy/generator/scripts/devProxyVMSS.sh | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/pkg/deploy/generator/scripts/devProxyVMSS.sh b/pkg/deploy/generator/scripts/devProxyVMSS.sh index b7ead0a35cf..04be87f9aa1 100644 --- a/pkg/deploy/generator/scripts/devProxyVMSS.sh +++ b/pkg/deploy/generator/scripts/devProxyVMSS.sh @@ -24,7 +24,8 @@ main() { \"${proxy_images[0]%%/*}\": { \"auth\": \"$PROXYIMAGEAUTH\" } - }" + } +}" local -ar exclude_pkgs=( "-x WALinuxAgent" @@ -182,7 +183,7 @@ systemctl restart proxy.service" local -r cron_daily_restart_proxy_file="#!/bin/bash systemctl restart proxy.service" - write_file cron_daily_restart_proxy_filename cron_daily_restart_proxy_file + write_file cron_daily_restart_proxy_filename cron_daily_restart_proxy_file true chmod +x "$cron_daily_restart_proxy_filename" } From 86036378a219f5524e15be124eb59da277c7d790 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Thu, 18 Apr 2024 15:20:59 -0400 Subject: [PATCH 30/38] WIP remove parse_run_options --- pkg/deploy/generator/scripts/common.sh | 2 +- pkg/deploy/generator/scripts/devProxyVMSS.sh | 112 +++---------- pkg/deploy/generator/scripts/rpVMSS.sh | 163 ++++--------------- 3 files changed, 50 insertions(+), 227 deletions(-) diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/common.sh index 436c89366a4..2f66da56789 100644 --- a/pkg/deploy/generator/scripts/common.sh +++ b/pkg/deploy/generator/scripts/common.sh @@ -120,7 +120,7 @@ configure_firewalld_rules() { sysctl --system - log "Enabling ports ${enable_ports[*]} on default firewalld zone" + log "Enabling ports ${ports[*]} on default firewalld zone" # shellcheck disable=SC2068 for port in ${ports[@]}; do log "Enabling port $port now" diff --git a/pkg/deploy/generator/scripts/devProxyVMSS.sh b/pkg/deploy/generator/scripts/devProxyVMSS.sh index 04be87f9aa1..9866313e007 100644 --- a/pkg/deploy/generator/scripts/devProxyVMSS.sh +++ b/pkg/deploy/generator/scripts/devProxyVMSS.sh @@ -14,10 +14,27 @@ main() { # shellcheck source=common.sh source common.sh + local -ar exclude_pkgs=( + "-x WALinuxAgent" + "-x WALinuxAgent-udev" + ) + + dnf_update_pkgs pkgs_to_exclude retry_wait_time + + local -ra install_pkgs=( + podman + podman-docker + ) + + dnf_install_pkgs install_pkgs retry_wait_time + configure_dnf_cron_job + local -ra enable_ports=( "443/tcp" ) + configure_firewalld_rules enable_ports + local -ra proxy_images=("$PROXYIMAGE") local -r registry_config_file="{ \"auths\": { @@ -27,106 +44,17 @@ main() { } }" - local -ar exclude_pkgs=( - "-x WALinuxAgent" - "-x WALinuxAgent-udev" - ) - - local -ra install_pkgs=( - podman - podman-docker - ) + pull_container_images proxy_image registry_config_file + configure_devproxy_services proxy_images local -ra proxy_services=( - proxy + proxy ) - local -ra user_options=("$@") - parse_run_options user_options \ - exclude_pkgs \ - install_pkgs \ - enable_ports \ - proxy_services \ - proxy_images - - dnf_update_pkgs pkgs_to_exclude retry_wait_time - dnf_install_pkgs install_pkgs retry_wait_time - configure_dnf_cron_job - - configure_firewalld_rules enable_ports - pull_container_images proxy_image registry_config_file - configure_devproxy_services proxy_images enable_services proxy_services reboot_vm } -usage() { - local -n options="$1" - log "$(basename "$0") [$options] - -p Configure rpm repositories, import required rpm keys, update & install packages with dnf - -f Configure firewalld default zone rules - -u Configure systemd unit files - -i Pull container images - - Note: steps will be executed in the order that flags are provided - " -} - -# parse_run_options takes all arguements passed to main and parses them -# allowing individual step(s) to be ran, rather than all steps -# -# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline -parse_run_options() { - # shellcheck disable=SC2206 - local -n run_options="$1" - local -n pkgs_to_exclude="$2" - local -n pkgs_to_install="$3" - local -n ports_to_enable="$4" - local -n services_to_enable="$5" - local -n images_to_pull="$6" - - if [ "${#run_options[@]}" -eq 0 ]; then - log "Running all steps" - return 0 - fi - - local OPTIND - local -r allowed_options="pfui" - while getopts ${allowed_options} options; do - case "${run_options}" in - p) - log "Running step dnf_update_pkgs" - dnf_update_pkgs pkgs_to_exclude retry_wait_time - - log "Running step dnf_install_pkgs" - dnf_install_pkgs pkgs_to_install retry_wait_time - - log "Running step configure_dnf_cron_job" - configure_dnf_cron_job - ;; - f) - log "Running configure_firewalld_rules" - configure_firewalld_rules ports_to_enable - ;; - u) - log "Running step configure_devproxy_services" - configure_devproxy_services proxy_images - enable_services services_to_enable - ;; - i) - log "Running pull_container_images" - pull_container_images images_to_pull - ;; - *) - usage allowed_options - abort "Unkown option provided" - ;; - esac - done - - exit 0 -} - # configure_system_services creates, configures, and enables the following systemd services and timers # services # proxy diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 906bdfd1cde..4f377a9d3fe 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -14,20 +14,29 @@ main() { # shellcheck source=common.sh source common.sh + configure_sshd + configure_rpm_repos retry_wait_time + local -ar exclude_pkgs=( "-x WALinuxAgent" "-x WALinuxAgent-udev" ) + dnf_update_pkgs exclude_pkgs retry_wait_time + local -ra rpm_keys=( https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 https://packages.microsoft.com/keys/microsoft.asc ) + rpm_import_keys rpm_keys retry_wait_time + local -ra repo_rpm_pkgs=( https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm ) + dnf_install_pkgs repo_rpm_pkgs retry_wait_time + local -ra install_pkgs=( clamav azsec-clamav @@ -42,12 +51,15 @@ main() { python3 ) - MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" - local -ra images=( - "$MDMIMAGE" - "$RPIMAGE" - "$FLUENTBITIMAGE" - ) + dnf_install_pkgs install_pkgs retry_wait_time + configure_dnf_cron_job + + configure_disk_partitions + configure_logrotate + configure_selinux + + mkdir -p /var/log/journal + mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store local -ra enable_ports=( "443/tcp" @@ -56,6 +68,17 @@ main() { "2222/tcp" ) + configure_firewalld_rules enable_ports + + MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" + local -ra images=( + "$MDMIMAGE" + "$RPIMAGE" + "$FLUENTBITIMAGE" + ) + + pull_container_images images + local -ra aro_services=( "aro-dbtoken" "aro-monitor" @@ -70,38 +93,6 @@ main() { "fluentbit" ) - local -ra user_options=("$@") - parse_run_options user_options \ - retry_wait_time \ - exclude_pkgs \ - rpm_keys \ - repo_rpm_pkgs \ - install_pkgs \ - images \ - enable_ports \ - aro_services - - configure_sshd - configure_rpm_repos retry_wait_time - - dnf_update_pkgs exclude_pkgs retry_wait_time - - rpm_import_keys rpm_keys retry_wait_time - - dnf_install_pkgs repo_rpm_pkgs retry_wait_time - dnf_install_pkgs install_pkgs retry_wait_time - configure_dnf_cron_job - - configure_disk_partitions - configure_logrotate - configure_selinux - - mkdir -p /var/log/journal - mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store - - configure_firewalld_rules enable_ports - - pull_container_images images configure_aro_services enable_services @@ -110,102 +101,6 @@ main() { reboot_vm } -usage() { - local -n options="$1" - log "$(basename "$0") [$options] - -d Configure Disk Partitions - -p Configure rpm repositories, import required rpm keys, update & install packages with dnf - -l Configure logrotate.conf - -s Configure selinux - -r Configure sshd - Allow password authenticaiton - -f Configure firewalld default zone rules - -u Configure systemd unit files - -i Pull container images - - Note: steps will be executed in the order that flags are provided - " -} - -# parse_run_options takes all arguements passed to main and parses them -# allowing individual step(s) to be ran, rather than all steps -# -# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline -parse_run_options() { - # shellcheck disable=SC2206 - local -n run_options="$1" - local -n retry_time="$2" - local -n pkgs_to_exclude="$3" - local -n keys_to_import="$4" - local -n rpm_pkgs="$5" - local -n pkgs_to_install="$6" - local -n images_to_pull="$7" - local -n ports_to_enable="$8" - local -n services_to_enable="$9" - - if [ "${#run_options[@]}" -eq 0 ]; then - log "Running all steps" - return 0 - fi - - local OPTIND - local -r allowed_options="dplsrfui" - while getopts ${allowed_options} options; do - case "${run_options}" in - d) - log "Running step configure_disk_partitions" - configure_disk_partitions - ;; - p) - log "Running step configure_rpm_repos" - configure_rpm_repos keys_to_import - - log "Running step dnf_update_pkgs" - dnf_update_pkgs pkgs_to_exclude retry_time - - log "Running step dnf_install_pkgs rpm_pkgs" - dnf_install_pkgs rpm_pkgs retry_time - - log "Running step dnf_install_pkgs pkgs" - dnf_install_pkgs pkgs_to_install retry_time - - log "Running step configure_dnf_crond_job" - configure_dnf_cron_job - ;; - l) - log "Running configure_logrotate" - configure_logrotate - ;; - s) - log "Running configure_selinux" - configure_selinux - ;; - r) - log "Running configure_sshd" - configure_sshd - ;; - f) - log "Running configure_firewalld_rules" - configure_firewalld_rules ports_to_enable - ;; - u) - log "Running pull_container_images & configure_system_services" - configure_aro_services - enable_services services_to_enable - ;; - i) - log "Running pull_container_images" - pull_container_images images_to_pull - ;; - *) - usage allowed_options - abort "Unkown option provided" - ;; - esac - done - - exit 0 -} - # configure_rpm_repos configure_rpm_repos() { log "starting" From f29f2fa9c655271596c7fc379420b9d69ee3c5b3 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Fri, 19 Apr 2024 09:55:23 -0400 Subject: [PATCH 31/38] WIP committing to restore changes from stash --- pkg/deploy/generator/scripts/gatewayVMSS.sh | 2 +- pkg/deploy/generator/scripts/rpVMSS.sh | 1 + 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/pkg/deploy/generator/scripts/gatewayVMSS.sh b/pkg/deploy/generator/scripts/gatewayVMSS.sh index 64b4232309f..83089fa3efe 100644 --- a/pkg/deploy/generator/scripts/gatewayVMSS.sh +++ b/pkg/deploy/generator/scripts/gatewayVMSS.sh @@ -757,7 +757,7 @@ WantedBy=multi-user.target' systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds" } -# configure_service_aro_rp +# configure_service_aro_gateway configure_service_aro_gateway() { local -n log_dir="$1" log "starting" diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 4f377a9d3fe..424c40af8bf 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -750,6 +750,7 @@ WantedBy=multi-user.target" # configure_service_mdsd configure_service_mdsd() { + local -n mdsd log "starting" local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d" From b0d90d613deaaffff6adb9d77cc444242a0da126 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Fri, 19 Apr 2024 10:02:54 -0400 Subject: [PATCH 32/38] Import stash --- pkg/deploy/generator/scripts/common.sh | 478 +++++++++++ pkg/deploy/generator/scripts/gatewayVMSS.sh | 832 ++------------------ pkg/deploy/generator/scripts/rpVMSS.sh | 522 ++---------- 3 files changed, 580 insertions(+), 1252 deletions(-) diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/common.sh index 2f66da56789..f69e30dbf2c 100644 --- a/pkg/deploy/generator/scripts/common.sh +++ b/pkg/deploy/generator/scripts/common.sh @@ -131,7 +131,9 @@ configure_firewalld_rules() { } # configure_logrotate clobbers /etc/logrotate.conf +# TODO add writing of dropin files configure_logrotate() { + local -n dropin_files="$1" log "starting" local -r logrotate_conf_filename='/etc/logrotate.conf' @@ -170,6 +172,13 @@ include /etc/logrotate.d }' write_file logrotate_conf_filename logrotate_conf_file true + + local -r logrotate_d="/etc/logrotate.d" + log "Writing logrotate files to $logrotate_d" + for dropin_name in "${!dropin_files[@]}"; do + local -r dropin_file="$logrotate_d/$dropin_name" + write_file "$dropin_file" "${dropin_files["$dropin_name"]}" + done } # pull_container_images @@ -291,3 +300,472 @@ dnf update -y" chmod +x "$cron_weekly_dnf_update_filename" } +# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file +create_azure_rpm_repos() { + log "starting" + + local -r azure_repo_filename='/etc/yum.repos.d/azure.repo' + local -r azure_repo_file='[azure-cli] +name=azure-cli +baseurl=https://packages.microsoft.com/yumrepos/azure-cli +enabled=yes +gpgcheck=yes + +[azurecore] +name=azurecore +baseurl=https://packages.microsoft.com/yumrepos/azurecore +enabled=yes +gpgcheck=no' + + write_file azure_repo_filename azure_repo_file true +} + +# configure_disk_partitions +configure_disk_partitions() { + log "starting" + log "extending partition table" + + # Linux block devices are inconsistently named + # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here + physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" + growpart "$physical_disk" 2 + + log "extending filesystems" + log "extending root lvm" + lvextend -l +20%FREE /dev/rootvg/rootlv + log "growing root filesystem" + xfs_growfs / + + log "extending var lvm" + lvextend -l +100%FREE /dev/rootvg/varlv + log "growing var filesystem" + xfs_growfs /var +} + +# configure_certs +configure_certs() { + log "starting" + + mkdir /etc/aro-rp + base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem + if [[ -n "$ARMAPICABUNDLE" ]]; then + base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem + fi + chown -R 1000:1000 /etc/aro-rp + + # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not + # to honour SSL_CERT_FILE any more, heaven only knows why. + mkdir -p /usr/lib/ssl/certs + csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null + c_rehash /usr/lib/ssl/certs + +# we leave clientId blank as long as only 1 managed identity assigned to vmss +# if we have more than 1, we will need to populate with clientId used for off-node scanning + local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config" + local -r nodescan_agent_file="{ + \"Nice\": 19, + \"Timeout\": 10800, + \"ClientId\": \"\", + \"TenantId\": $AZURESECPACKVSATENANTID, + \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL, + \"ProcessTimeout\": 300, + \"CommandDelay\": 0 + }" + + write_file nodescan_agent_filename nodescan_agent_file true +} + +# configure_service_mdm +configure_service_mdm() { + log "starting" + log "configuring mdm service" + + local -r sysconfig_mdm_filename="/etc/sysconfig/mdm" + local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL' +MDMIMAGE='$MDMIMAGE' +MDMSOURCEENVIRONMENT='$LOCATION' +MDMSOURCEROLE=gateway +MDMSOURCEROLEINSTANCE=\"$(hostname)\"" + + write_file sysconfig_mdm_filename sysconfig_mdm_file true + + mkdir -p /var/etw + local -r mdm_service_filename="/etc/systemd/system/mdm.service" + local -r mdm_service_file="[Unit] +After=network-online.target +Wants=network-online.target + +[Service] +EnvironmentFile=/etc/sysconfig/mdm +ExecStartPre=-/usr/bin/docker rm -f %N +ExecStart=/usr/bin/docker run \ + --entrypoint /usr/sbin/MetricsExtension \ + --hostname %H \ + --name %N \ + --rm \ + --cap-drop net_raw \ + -m 2g \ + -v /etc/mdm.pem:/etc/mdm.pem \ + -v /var/etw:/var/etw:z \ + $MDMIMAGE \ + -CertFile /etc/mdm.pem \ + -FrontEndUrl $MDMFRONTENDURL \ + -Logger Console \ + -LogLevel Warning \ + -PrivateKeyFile /etc/mdm.pem \ + -SourceEnvironment $MDMSOURCEENVIRONMENT \ + -SourceRole $MDMSOURCEROLE \ + -SourceRoleInstance $MDMSOURCEROLEINSTANCE +ExecStop=/usr/bin/docker stop %N +Restart=always +RestartSec=1 +StartLimitInterval=0 + +[Install] +WantedBy=multi-user.target" + + write_file mdm_service_filename mdm_service_file true +} + +# configure_timers_mdm_mdsd +configure_timers_mdm_mdsd() { + log "starting" + + for var in "mdsd" "mdm"; do + local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service" + local download_creds_service_file="[Unit] +Description=Periodic $var credentials refresh + +[Service] +Type=oneshot +ExecStart=/usr/local/bin/download-credentials.sh $var" + + write_file download_creds_service_filename download_creds_service_file true + + local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer" + local download_creds_timer_file="[Unit] +Description=Periodic $var credentials refresh +After=network-online.target +Wants=network-online.target + +[Timer] +OnBootSec=0min +OnCalendar=0/12:00:00 +AccuracySec=5s + +[Install] +WantedBy=timers.target" + + write_file download_creds_timer_filename download_creds_timer_file true + done + + local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh" + local -r download_creds_script_file="#!/bin/bash +set -eu + +COMPONENT=\$1 +echo \"Download \$COMPONENT credentials\" + +TEMP_DIR=\"\$(mktemp -d)\" +export AZURE_CONFIG_DIR=\"\$(mktemp -d)\" + +echo \"Logging into Azure...\" +RETRIES=3 +while [[ \$RETRIES -gt 0 ]]; do + if az login -i --allow-no-subscriptions + then + echo \"az login successful\" + break + else + echo \"az login failed. Retrying...\" + let RETRIES-=1 + sleep 5 + fi +done + +trap \"cleanup\" EXIT + +cleanup() { + az logout + [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR + [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR +} + +if [[ \$COMPONENT = \"mdm\" ]]; then + CURRENT_CERT_FILE=\"/etc/mdm.pem\" +elif [[ \$COMPONENT\ = \"mdsd\" ]]; then + CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\" +else + echo Invalid usage && exit 1 +fi + +SECRET_NAME=\"gwy-\${COMPONENT}\" +NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\" +for attempt in {1..5}; do + az keyvault \ + secret \ + download \ + --file \"\$NEW_CERT_FILE\" \ + --id \"https://$KEYVAULTPREFIX-gwy.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \ + && break + if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi +done + +if [ -f \$NEW_CERT_FILE ]; then + if [[ \$COMPONENT = \"mdsd\" ]]; then + chown syslog:syslog \$NEW_CERT_FILE + else + sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE + fi + + new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\" + current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\" + if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then + echo updating certificate for \$COMPONENT + chmod 0600 \$NEW_CERT_FILE + mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE + fi +else + echo Failed to refresh certificate for \$COMPONENT && exit 1 +fi" + + write_file download_creds_script_filename download_creds_script_file true + + chmod u+x /usr/local/bin/download-credentials.sh + + # TODO place this in enable services section + systemctl enable download-mdsd-credentials.timer + systemctl enable download-mdm-credentials.timer + + /usr/local/bin/download-credentials.sh mdsd + /usr/local/bin/download-credentials.sh mdm + + local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')" + local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service" + local -r watch_mdm_creds_service_file="[Unit] +Description=Watch for changes in mdm.pem and restarts the mdm service + +[Service] +Type=oneshot +ExecStart=/usr/bin/systemctl restart mdm.service + +[Install] +WantedBy=multi-user.target" + + write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file true + + local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path' + local -r watch_mdm_creds_path_file='[Path] +PathModified=/etc/mdm.pem + +[Install] +WantedBy=multi-user.target' + + write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file true + + local -r watch_mdm_creds='watch-mdm-credentials.path' + systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds" + systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds" +} + +# configure_service_fluentbit +configure_service_fluentbit() { + local -n fluentbit_conf_file="$1" + local -n fluentbit_image="$2" + log "starting" + log "configuring fluentbit service" + + if [[ -n $fluentbit_conf_file ]]; then + abort "$1 fluentbit config file cannot be empty" + elif [[ -n $fluentbit_image ]]; then + abort "$2 fluentbit image cannot be empty" + fi + + mkdir -p /etc/fluentbit/ + mkdir -p /var/lib/fluent + + local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf' + write_file fluentbit_conf_filename fluentbit_conf_file true + + local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit' + local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$fluentbit_image" + + write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true + + local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service' + + local -r fluentbit_service_file="[Unit] +After=network-online.target +Wants=network-online.target +StartLimitIntervalSec=0 + +[Service] +RestartSec=1s +EnvironmentFile=/etc/sysconfig/fluentbit +ExecStartPre=-/usr/bin/docker rm -f %N +ExecStart=/usr/bin/docker run \ + --security-opt label=disable \ + --entrypoint /opt/td-agent-bit/bin/td-agent-bit \ + --net=host \ + --hostname %H \ + --name %N \ + --rm \ + --cap-drop net_raw \ + -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \ + -v /var/lib/fluent:/var/lib/fluent:z \ + -v /var/log/journal:/var/log/journal:ro \ + -v /etc/machine-id:/etc/machine-id:ro \ + $fluentbit_image \ + -c /etc/fluentbit/fluentbit.conf + +ExecStop=/usr/bin/docker stop %N +Restart=always +RestartSec=5 +StartLimitInterval=0 + +[Install] +WantedBy=multi-user.target" + + write_file fluentbit_service_filename fluentbit_service_file true +} + +# configure_service_aro_dbtoken +configure_service_aro_dbtoken() { + local -n dbtoken_conf="$1" + local -n log_dir="${2:-}" + log "starting" + + local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken' + + write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file true + + local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service' + # TODO add test if log_dir is empty, else + local -r aro_dbtoken_service_file="[Unit] +After=network-online.target +Wants=network-online.target + +[Service] +EnvironmentFile=/etc/sysconfig/aro-dbtoken +ExecStartPre=-/usr/bin/docker rm -f %N +ExecStart=/usr/bin/docker run \ + --hostname %H \ + --name %N \ + --rm \ + --cap-drop net_raw \ + -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \ + -e DATABASE_ACCOUNT_NAME \ + -e AZURE_DBTOKEN_CLIENT_ID \ + -e KEYVAULT_PREFIX \ + -e MDM_ACCOUNT \ + -e MDM_NAMESPACE \ + -m 2g \ + -p 445:8445 \ + -v /run/systemd/journal:/run/systemd/journal \ + -v /var/etw:/var/etw:z \ + $RPIMAGE \ + dbtoken +ExecStop=/usr/bin/docker stop -t 3600 %N +TimeoutStopSec=3600 +Restart=always +RestartSec=1 +StartLimitInterval=0 + +[Install] +WantedBy=multi-user.target" + + local -r aro_dbtoken_service_file="[Unit] +After=network-online.target +Wants=network-online.target + +[Service] +EnvironmentFile=/etc/sysconfig/aro-gateway +ExecStartPre=-/usr/bin/docker rm -f %N +ExecStartPre=/usr/bin/mkdir -p ${gateway_logdir} +ExecStart=/usr/bin/docker run \ + --hostname %H \ + --name %N \ + --rm \ + --cap-drop net_raw \ + -e ACR_RESOURCE_ID \ + -e DATABASE_ACCOUNT_NAME \ + -e AZURE_DBTOKEN_CLIENT_ID \ + -e DBTOKEN_URL \ + -e GATEWAY_DOMAINS \ + -e GATEWAY_FEATURES \ + -e MDM_ACCOUNT \ + -e MDM_NAMESPACE \ + -m 2g \ + -p 80:8080 \ + -p 8081:8081 \ + -p 443:8443 \ + -v /run/systemd/journal:/run/systemd/journal \ + -v /var/etw:/var/etw:z \ + -v ${gateway_logdir}:/ctr.log:z \ + \$RPIMAGE \ + gateway +ExecStop=/usr/bin/docker stop -t 3600 %N +TimeoutStopSec=3600 +Restart=always +RestartSec=1 +StartLimitInterval=0 + +[Install] +WantedBy=multi-user.target" + + write_file aro_dbtoken_service_filename aro_dbtoken_service_file true +} + +# configure_service_mdsd +configure_service_mdsd() { + local -n monitor_config_version="$1" + log "starting" + + local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d" + mkdir -p "$mdsd_service_dir" + + local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf" + local -r mdsd_override_conf_file="[Unit] +After=network-online.target" + + write_file mdsd_override_conf_filename mdsd_override_conf_file true + + local -r default_mdsd_filename="/etc/default/mdsd" + local -r default_mdsd_file="MDSD_ROLE_PREFIX=/var/run/mdsd/default +MDSD_OPTIONS=\"-A -d -r \$MDSD_ROLE_PREFIX\" + +export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT' +export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT' +export MONITORING_GCS_REGION='$LOCATION' +export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault +export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN' +export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE' +export MONITORING_CONFIG_VERSION='$monitor_config_version' +export MONITORING_USE_GENEVA_CONFIG_SERVICE=true + +export MONITORING_TENANT='$LOCATION' +export MONITORING_ROLE=rp +export MONITORING_ROLE_INSTANCE=\"$(hostname)\" + +export MDSD_MSGPACK_SORT_COLUMNS=1\"" + + write_file default_mdsd_filename default_mdsd_file true +} + +# run_azsecd_config_scan +run_azsecd_config_scan() { + log "starting" + + local -ar configs=( + "baseline" + "clamav" + "software" + ) + + log "Scanning configuration files ${configs[*]}" + # shellcheck disable=SC2068 + for scan in ${configs[@]}; do + log "Scanning config file $scan now" + /usr/local/bin/azsecd config -s "$scan" -d P1D + done +} diff --git a/pkg/deploy/generator/scripts/gatewayVMSS.sh b/pkg/deploy/generator/scripts/gatewayVMSS.sh index 83089fa3efe..064bf18bd49 100644 --- a/pkg/deploy/generator/scripts/gatewayVMSS.sh +++ b/pkg/deploy/generator/scripts/gatewayVMSS.sh @@ -8,124 +8,14 @@ if [ "${DEBUG:-false}" == true ]; then fi main() { - local -r gateway_logdir='/var/log/aro-gateway' - parse_run_options "$@" gateway_logdir - - configure_sshd - configure_and_install_dnf_pkgs_repos - configure_disk_partitions - configure_logrotate gateway_logdir - configure_selinux - - mkdir -p /var/log/journal - mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store - - configure_firewalld_rules - pull_container_images - configure_system_services gateway_logdir - reboot_vm -} - -usage() { - local -n options="$1" - log "$(basename "$0") [$options] - -d Configure Disk Partitions - -p Configure rpm repositories, import required rpm keys, update & install packages with dnf - -l Configure logrotate.conf - -s Make selinux modifications required for ARO RP - -r Configure sshd - Allow password authenticaiton - -f Configure firewalld default zone rules - -u Configure systemd unit files for ARO RP - -i Pull container images - - Note: steps will be executed in the order that flags are provided - " -} - -# parse_run_options takes all arguements passed to main and parses them -# allowing individual step(s) to be ran, rather than all steps -# -# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline -parse_run_options() { - # shellcheck disable=SC2206 - local -a options=(${1:-}) - if [ "${#options[@]}" -eq 0 ]; then - log "Running all steps" - return 0 - fi - - local OPTIND - local -r allowed_options="dplsrfui" - while getopts ${allowed_options} options; do - case "${options}" in - d) - log "Running step configure_disk_partitions" - configure_disk_partitions - ;; - p) - log "Running step configure_and_install_dnf_pkgs_repos" - configure_and_install_dnf_pkgs_repos - ;; - l) - log "Running configure_logrotate" - configure_logrotate "$2" - ;; - s) - log "Running configure_selinux" - configure_selinux - ;; - r) - log "Running configure_sshd" - configure_sshd - ;; - f) - log "Running configure_firewalld_rules" - configure_firewalld_rules - ;; - u) - log "Running pull_container_images & configure_system_services" - configure_system_services "$2" - ;; - i) - log "Running pull_container_images" - pull_container_images - ;; - *) - usage allowed_options - abort "Unkown option provided" - ;; - esac - done - - exit 0 -} - -# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work -configure_sshd() { - log "starting" - log "setting ssh password authentication" - sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config - - systemctl reload sshd.service - systemctl is-active --quiet sshd || abort "sshd failed to reload" -} - -# configure_and_install_dnf_pkgs_repos -configure_and_install_dnf_pkgs_repos() { - log "starting" - - # transaction attempt retry time in seconds - local -ri retry_wait_time=60 - configure_rhui_repo retry_wait_time - create_azure_rpm_repos retry_wait_time local -ar exclude_pkgs=( "-x WALinuxAgent" "-x WALinuxAgent-udev" ) - dnf_update_pkgs exclude_pkgs retry_wait_time + dnf_update_pkgs pkgs_to_exclude retry_wait_time local -ra rpm_keys=( https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 @@ -138,6 +28,8 @@ configure_and_install_dnf_pkgs_repos() { https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm ) + dnf_install_pkgs repo_rpm_pkgs retry_wait_time + local -ra install_pkgs=( clamav azsec-clamav @@ -152,166 +44,15 @@ configure_and_install_dnf_pkgs_repos() { python3 ) - dnf_install_pkgs repo_rpm_pkgs retry_wait_time dnf_install_pkgs install_pkgs retry_wait_time -} - -# configure_rhui_repo -configure_rhui_repo() { - log "starting" - - local -ra cmd=( - dnf - update - -y - --disablerepo='*' - --enablerepo='rhui-microsoft-azure*' - ) - - log "running RHUI package updates" - retry cmd "$1" -} - -# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks -retry() { - local -n cmd_retry="$1" - local -n wait_time="$2" - - for attempt in {1..5}; do - log "attempt #${attempt} - ${FUNCNAME[2]}" - ${cmd_retry[@]} & - - wait $! && break - if [[ ${attempt} -lt 5 ]]; then - sleep "$wait_time" - else - abort "attempt #${attempt} - Failed to update packages" - fi - done -} - -# dnf_update_pkgs -dnf_update_pkgs() { - local -n excludes="$1" - log "starting" - - local -ra cmd=( - dnf - -y - ${excludes[@]} - update - --allowerasing - ) - - log "Updating all packages" - retry cmd "$2" -} - -# dnf_install_pkgs -dnf_install_pkgs() { - local -n pkgs="$1" - log "starting" - - local -ra cmd=( - dnf - -y - install - ${pkgs[@]} - ) - - log "Attempting to install packages: ${pkgs[*]}" - retry cmd "$2" -} - -# rpm_import_keys -rpm_import_keys() { - local -n keys="$1" - log "starting" - - - # shellcheck disable=SC2068 - for key in ${keys[@]}; do - if [ ${#keys[@]} -eq 0 ]; then - break - fi - local -a cmd=( - rpm - --import - -v - "$key" - ) - - log "attempt #$attempt - importing rpm repository key $key" - retry cmd "$2" && unset key - done -} - -# configure_disk_partitions -configure_disk_partitions() { - log "starting" - log "extending partition table" - - # Linux block devices are inconsistently named - # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here - physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" - growpart "$physical_disk" 2 - - log "extending filesystems" - log "extending root lvm" - lvextend -l +20%FREE /dev/rootvg/rootlv - log "growing root filesystem" - xfs_growfs / - - log "extending var lvm" - lvextend -l +100%FREE /dev/rootvg/varlv - log "growing var filesystem" - xfs_growfs /var -} - -# configure_logrotate clobbers /etc/logrotate.conf -configure_logrotate() { - local -n log_dir="$1" - log "starting" - - local -r logrotate_conf_filename='/etc/logrotate.conf' - local -r logrotate_conf_file="# see 'man logrotate' for details -# rotate log files weekly -weekly - -# keep 2 weeks worth of backlogs -rotate 2 - -# create new (empty) log files after rotating old ones -create - -# use date as a suffix of the rotated file -dateext - -# uncomment this if you want your log files compressed -compress - -# RPM packages drop log rotation information into this directory -include /etc/logrotate.d - -# no packages own wtmp and btmp -- we will rotate them here -/var/log/wtmp { - monthly - create 0664 root utmp - minsize 1M - rotate 1 -} -/var/log/btmp { - missingok - monthly - create 0600 root utmp - rotate 1 -} + configure_disk_partitions -# Maximum log directory size is 100G with this configuration + local -r gateway_logdir='/var/log/aro-gateway' + local -r gateway_log_file="# Maximum log directory size is 100G with this configuration # Setting limit to 100G to allow space for other logging services # copytruncate is a critical option used to prevent logs from being shipped twice -${log_dir} { +${gateway_logdir} { size 20G rotate 5 create 0600 root root @@ -320,131 +61,35 @@ ${log_dir} { compress }" - write_file logrotate_conf_filename logrotate_conf_file true -} - -# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file -create_azure_rpm_repos() { - log "starting" - - local -r azure_repo_filename='/etc/yum.repos.d/azure.repo' - local -r azure_repo_file='[azure-cli] -name=azure-cli -baseurl=https://packages.microsoft.com/yumrepos/azure-cli -enabled=yes -gpgcheck=yes - -[azurecore] -name=azurecore -baseurl=https://packages.microsoft.com/yumrepos/azurecore -enabled=yes -gpgcheck=no' - - write_file azure_repo_filename azure_repo_file true -} - -# configure_selinux -configure_selinux() { - log "starting" - - local -r relabel="${1:-false}" - - already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined" - semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error" - chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent - - if "$relabel"; then - restorecon -RF /var/log/* || log "$already_defined_ignore_error" - fi -} - -# configure_firewalld_rules -configure_firewalld_rules() { - log "starting" - - # https://access.redhat.com/security/cve/cve-2020-13401 - local -r prefix="/etc/sysctl.d" - local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf" - local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0" - - write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true + local -rA logrotate_dropins=( + ["gateway_log_config"]="$gateway_log_file" + ) - local -r disable_core_filename="$prefix/01-disable-core.conf" - local -r disable_core_file="kernel.core_pattern = |/bin/true - " - write_file disable_core_filename disable_core_file true + configure_logrotate logrotate_dropins + configure_selinux - sysctl --system + mkdir -p /var/log/journal + mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store local -ra enable_ports=( "80/tcp" "8081/tcp" "443/tcp" ) + configure_firewalld_rules enable_ports + + local -r mdmimage="${RPIMAGE%%/*}/${MDMIMAGE##*/}" + local -r rpimage="$RPIMAGE" + local -r fluentbit_image="$FLUENTBITIMAGE" + local -ra images=( + "$mdmimage" + "$rpimage" + "$fluentbit_image" + ) - log "Enabling ports ${enable_ports[*]} on default firewalld zone" - # shellcheck disable=SC2068 - for port in ${enable_ports[@]}; do - log "Enabling port $port now" - firewall-cmd "--add-port=$port" - done - - firewall-cmd --runtime-to-permanent -} - -# pull_container_images -pull_container_images() { - log "starting" - - # The managed identity that the VM runs as only has a single roleassignment. - # This role assignment is ACRPull which is not necessarily present in the - # subscription we're deploying into. If the identity does not have any - # role assignments scoped on the subscription we're deploying into, it will - # not show on az login -i, which is why the below line is commented. - # az account set -s "$SUBSCRIPTIONID" - az login -i --allow-no-subscriptions - - # Suppress emulation output for podman instead of docker for az acr compatability - mkdir -p /etc/containers/ - mkdir -p /root/.docker - touch /etc/containers/nodocker - - # This name is used in the case that az acr login searches for this in it's environment - local -r REGISTRY_AUTH_FILE="/root/.docker/config.json" - - log "logging into prod acr" - az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" - - MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" - docker pull "$MDMIMAGE" - docker pull "$RPIMAGE" - docker pull "$FLUENTBITIMAGE" - - az logout -} - -# configure_system_services creates, configures, and enables the following systemd services and timers -# services -# fluentbit -# mdm -# mdsd -# arp-rp -# aro-dbtoken -# aro-monitor -# aro-portal -configure_system_services() { - configure_service_fluentbit - configure_service_mdm - configure_timers_mdm_mdsd - configure_service_aro_gateway "$1" - configure_service_mdsd -} - -# enable_aro_services enables all services required for aro rp -enable_aro_services() { - log "starting" + pull_container_images images - local -ra aro_services=( + local -ra gateway_services=( aro-gateway auoms azsecd @@ -454,23 +99,7 @@ enable_aro_services() { chronyd fluentbit ) - log "enabling gateway services ${aro_services[*]}" - # shellcheck disable=SC2068 - for service in ${aro_services[@]}; do - log "Enabling $service now" - systemctl enable "$service.service" - done -} -# configure_service_fluentbit -configure_service_fluentbit() { - log "starting" - log "configuring fluentbit service" - - mkdir -p /etc/fluentbit/ - mkdir -p /var/lib/fluent - - local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf' local -r fluentbit_conf_file="[INPUT] Name systemd Tag journald @@ -488,277 +117,28 @@ DB /var/lib/fluent/journaldb Match * Port 29230" - write_file fluentbit_conf_filename fluentbit_conf_file true - - local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit' - local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE" - - write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true - - local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service' - - local -r fluentbit_service_file="[Unit] -After=network-online.target -Wants=network-online.target -StartLimitIntervalSec=0 - -[Service] -RestartSec=1s -EnvironmentFile=/etc/sysconfig/fluentbit -ExecStartPre=-/usr/bin/docker rm -f %N -ExecStart=/usr/bin/docker run \ - --security-opt label=disable \ - --entrypoint /opt/td-agent-bit/bin/td-agent-bit \ - --net=host \ - --hostname %H \ - --name %N \ - --rm \ - --cap-drop net_raw \ - -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \ - -v /var/lib/fluent:/var/lib/fluent:z \ - -v /var/log/journal:/var/log/journal:ro \ - -v /etc/machine-id:/etc/machine-id:ro \ - $FLUENTBITIMAGE \ - -c /etc/fluentbit/fluentbit.conf - -ExecStop=/usr/bin/docker stop %N -Restart=always -RestartSec=5 -StartLimitInterval=0 - -[Install] -WantedBy=multi-user.target" - - write_file fluentbit_conf_filename fluentbit_conf_file true -} - -# configure_certs -configure_certs() { - log "starting" - - mkdir /etc/aro-rp - base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem - if [[ -n "$ARMAPICABUNDLE" ]]; then - base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem - fi - chown -R 1000:1000 /etc/aro-rp - - # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not - # to honour SSL_CERT_FILE any more, heaven only knows why. - mkdir -p /usr/lib/ssl/certs - csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null - c_rehash /usr/lib/ssl/certs - -# we leave clientId blank as long as only 1 managed identity assigned to vmss -# if we have more than 1, we will need to populate with clientId used for off-node scanning - local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config" - local -r nodescan_agent_file="{ - \"Nice\": 19, - \"Timeout\": 10800, - \"ClientId\": \"\", - \"TenantId\": $AZURESECPACKVSATENANTID, - \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL, - \"ProcessTimeout\": 300, - \"CommandDelay\": 0 - }" - - write_file nodescan_agent_filename nodescan_agent_file true -} - -# configure_service_mdm -configure_service_mdm() { - log "starting" - log "configuring mdm service" - - local -r sysconfig_mdm_filename="/etc/sysconfig/mdm" - local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL' -MDMIMAGE='$MDMIMAGE' -MDMSOURCEENVIRONMENT='$LOCATION' -MDMSOURCEROLE=gateway -MDMSOURCEROLEINSTANCE=\"$(hostname)\"" - - write_file sysconfig_mdm_filename sysconfig_mdm_file true - - mkdir -p /var/etw - local -r mdm_service_filename="/etc/systemd/system/mdm.service" - local -r mdm_service_file="[Unit] -After=network-online.target -Wants=network-online.target - -[Service] -EnvironmentFile=/etc/sysconfig/mdm -ExecStartPre=-/usr/bin/docker rm -f %N -ExecStart=/usr/bin/docker run \ - --entrypoint /usr/sbin/MetricsExtension \ - --hostname %H \ - --name %N \ - --rm \ - --cap-drop net_raw \ - -m 2g \ - -v /etc/mdm.pem:/etc/mdm.pem \ - -v /var/etw:/var/etw:z \ - $MDMIMAGE \ - -CertFile /etc/mdm.pem \ - -FrontEndUrl $MDMFRONTENDURL \ - -Logger Console \ - -LogLevel Warning \ - -PrivateKeyFile /etc/mdm.pem \ - -SourceEnvironment $MDMSOURCEENVIRONMENT \ - -SourceRole $MDMSOURCEROLE \ - -SourceRoleInstance $MDMSOURCEROLEINSTANCE -ExecStop=/usr/bin/docker stop %N -Restart=always -RestartSec=1 -StartLimitInterval=0 - -[Install] -WantedBy=multi-user.target" - - write_file mdm_service_filename mdm_service_file true -} - -# configure_timers_mdm_mdsd -configure_timers_mdm_mdsd() { - log "starting" - - for var in "mdsd" "mdm"; do - local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service" - local download_creds_service_file="[Unit] -Description=Periodic $var credentials refresh - -[Service] -Type=oneshot -ExecStart=/usr/local/bin/download-credentials.sh $var" - - write_file download_creds_service_filename download_creds_service_file true - - local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer" - local download_creds_timer_file="[Unit] -Description=Periodic $var credentials refresh -After=network-online.target -Wants=network-online.target - -[Timer] -OnBootSec=0min -OnCalendar=0/12:00:00 -AccuracySec=5s - -[Install] -WantedBy=timers.target" - - write_file download_creds_timer_filename download_creds_timer_file true - done - - local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh" - local -r download_creds_script_file="#!/bin/bash -set -eu - -COMPONENT=\$1 -echo \"Download \$COMPONENT credentials\" - -TEMP_DIR=\"\$(mktemp -d)\" -export AZURE_CONFIG_DIR=\"\$(mktemp -d)\" - -echo \"Logging into Azure...\" -RETRIES=3 -while [[ \$RETRIES -gt 0 ]]; do - if az login -i --allow-no-subscriptions - then - echo \"az login successful\" - break - else - echo \"az login failed. Retrying...\" - let RETRIES-=1 - sleep 5 - fi -done - -trap \"cleanup\" EXIT - -cleanup() { - az logout - [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR - [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR -} - -if [[ \$COMPONENT = \"mdm\" ]]; then - CURRENT_CERT_FILE=\"/etc/mdm.pem\" -elif [[ \$COMPONENT\ = \"mdsd\" ]]; then - CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\" -else - echo Invalid usage && exit 1 -fi - -SECRET_NAME=\"gwy-\${COMPONENT}\" -NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\" -for attempt in {1..5}; do - az keyvault \ - secret \ - download \ - --file \"\$NEW_CERT_FILE\" \ - --id \"https://$KEYVAULTPREFIX-gwy.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \ - && break - if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi -done - -if [ -f \$NEW_CERT_FILE ]; then - if [[ \$COMPONENT = \"mdsd\" ]]; then - chown syslog:syslog \$NEW_CERT_FILE - else - sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE - fi - - new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\" - current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\" - if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then - echo updating certificate for \$COMPONENT - chmod 0600 \$NEW_CERT_FILE - mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE - fi -else - echo Failed to refresh certificate for \$COMPONENT && exit 1 -fi" - - write_file download_creds_script_filename download_creds_script_file true - - chmod u+x /usr/local/bin/download-credentials.sh - - systemctl enable download-mdsd-credentials.timer - systemctl enable download-mdm-credentials.timer - - /usr/local/bin/download-credentials.sh mdsd - /usr/local/bin/download-credentials.sh mdm - - local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')" - local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service" - local -r watch_mdm_creds_service_file="[Unit] -Description=Watch for changes in mdm.pem and restarts the mdm service - -[Service] -Type=oneshot -ExecStart=/usr/bin/systemctl restart mdm.service - -[Install] -WantedBy=multi-user.target" - - write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file true - - local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path' - local -r watch_mdm_creds_path_file='[Path] -PathModified=/etc/mdm.pem - -[Install] -WantedBy=multi-user.target' + local -r aro_dbtoken_service_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID' +DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME' +AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID' +DBTOKEN_URL='$DBTOKENURL' +MDM_ACCOUNT='$RPMDMACCOUNT' +MDM_NAMESPACE=Gateway +GATEWAY_DOMAINS='$GATEWAYDOMAINS' +GATEWAY_FEATURES='$GATEWAYFEATURES' +RPIMAGE='$RPIMAGE'" - write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file true + local -n mdsd_gateway_version="$GATEWAYMDSDCONFIGVERSION" - local -r watch_mdm_creds='watch-mdm-credentials.path' - systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds" - systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds" + configure_service_fluentbit fluentbit_conf_file fluentbit_image + configure_service_mdm + configure_timers_mdm_mdsd + configure_service_gateway gateway_log_file + configure_service_mdsd + reboot_vm } -# configure_service_aro_gateway -configure_service_aro_gateway() { +# configure_service_aro_rp +configure_service_gateway() { local -n log_dir="$1" log "starting" @@ -827,7 +207,7 @@ ExecStart=/usr/bin/docker run \ -v /run/systemd/journal:/run/systemd/journal \ -v /var/etw:/var/etw:z \ -v ${log_dir}:/ctr.log:z \ - \$RPIMAGE \ + $RPIMAGE \ gateway ExecStop=/usr/bin/docker stop -t 3600 %N TimeoutStopSec=3600 @@ -842,66 +222,6 @@ WantedBy=multi-user.target write_file aro_gateway_service_filename aro_gateway_service_file true } -# configure_service_aro_dbtoken -configure_service_aro_dbtoken() { - log "starting" - - local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken' - local -r aro_dbtoken_service_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID' -DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME' -AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID' -DBTOKEN_URL='$DBTOKENURL' -MDM_ACCOUNT='$RPMDMACCOUNT' -MDM_NAMESPACE=Gateway -GATEWAY_DOMAINS='$GATEWAYDOMAINS' -GATEWAY_FEATURES='$GATEWAYFEATURES' -RPIMAGE='$RPIMAGE'" - - write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file true - - local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service' - local -r aro_dbtoken_service_file="[Unit] -After=network-online.target -Wants=network-online.target - -[Service] -EnvironmentFile=/etc/sysconfig/aro-gateway -ExecStartPre=-/usr/bin/docker rm -f %N -ExecStartPre=/usr/bin/mkdir -p ${gateway_logdir} -ExecStart=/usr/bin/docker run \ - --hostname %H \ - --name %N \ - --rm \ - --cap-drop net_raw \ - -e ACR_RESOURCE_ID \ - -e DATABASE_ACCOUNT_NAME \ - -e AZURE_DBTOKEN_CLIENT_ID \ - -e DBTOKEN_URL \ - -e GATEWAY_DOMAINS \ - -e GATEWAY_FEATURES \ - -e MDM_ACCOUNT \ - -e MDM_NAMESPACE \ - -m 2g \ - -p 80:8080 \ - -p 8081:8081 \ - -p 443:8443 \ - -v /run/systemd/journal:/run/systemd/journal \ - -v /var/etw:/var/etw:z \ - -v ${gateway_logdir}:/ctr.log:z \ - \$RPIMAGE \ - gateway -ExecStop=/usr/bin/docker stop -t 3600 %N -TimeoutStopSec=3600 -Restart=always -RestartSec=1 -StartLimitInterval=0 - -[Install] -WantedBy=multi-user.target" - - write_file aro_dbtoken_service_filename aro_dbtoken_service_file true -} - # configure_service_mdsd configure_service_mdsd() { log "starting" @@ -925,7 +245,7 @@ export MONITORING_GCS_REGION='$LOCATION' export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN' export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE' -export MONITORING_CONFIG_VERSION='$GATEWAYMDSDCONFIGVERSION' +export MONITORING_CONFIG_VERSION='' export MONITORING_USE_GENEVA_CONFIG_SERVICE=true export MONITORING_TENANT='$LOCATION' @@ -938,66 +258,6 @@ export MDSD_MSGPACK_SORT_COLUMNS=1\"" } -# run_azsecd_config_scan -run_azsecd_config_scan() { - log "starting" - - local -ar configs=( - "baseline" - "clamav" - "software" - ) - - log "Scanning configuration files ${configs[*]}" - # shellcheck disable=SC2068 - for scan in ${configs[@]}; do - log "Scanning config file $scan now" - /usr/local/bin/azsecd config -s "$scan" -d P1D - done -} - -# write_file -# Args -# 1) filename - string -# 2) file_contents - string -# 3) clobber - boolean; optional - defaults to false -write_file() { - local -n filename="$1" - local -n file_contents="$2" - local -r clobber="${3:-false}" - - if $clobber; then - log "Overwriting file $filename" - echo "$file_contents" > "$filename" - else - log "Appending to $filename" - echo "$file_contents" >> "$filename" - fi -} - -# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots -reboot_vm() { - log "starting" - - configure_selinux "true" - (sleep 30 && log "rebooting vm now"; reboot) & -} - -# log is a wrapper for echo that includes the function name -log() { - local -r msg="${1:-"log message is empty"}" - local -r stack_level="${2:-1}" - echo "${FUNCNAME[${stack_level}]}: ${msg}" -} - -# abort is a wrapper for log that exits with an error code -abort() { - local -ri origin_stacklevel=2 - log "${1}" "$origin_stacklevel" - log "Exiting" - exit 1 -} - export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}" main "$@" diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 424c40af8bf..c7fd67f2d30 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -70,116 +70,16 @@ main() { configure_firewalld_rules enable_ports - MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" + local -r mdmimage="${RPIMAGE%%/*}/${MDMIMAGE##*/}" + local -r rpimage="$RPIMAGE" + local -r fluentbit_image="$FLUENTBITIMAGE" local -ra images=( - "$MDMIMAGE" - "$RPIMAGE" - "$FLUENTBITIMAGE" + "$mdmimage" + "$rpimage" + "$fluentbit_image" ) - pull_container_images images - local -ra aro_services=( - "aro-dbtoken" - "aro-monitor" - "aro-portal" - "aro-rp" - "auoms" - "azsecd" - "azsecmond" - "mdsd" - "mdm" - "chronyd" - "fluentbit" - ) - - configure_aro_services - enable_services - - enable_services aro_services - - reboot_vm -} - -# configure_rpm_repos -configure_rpm_repos() { - log "starting" - - configure_rhui_repo "$1" - create_azure_rpm_repos "$1" -} - -# configure_disk_partitions -configure_disk_partitions() { - log "starting" - log "extending partition table" - - # Linux block devices are inconsistently named - # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here - physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" - growpart "$physical_disk" 2 - - log "extending filesystems" - log "extending root lvm" - lvextend -l +20%FREE /dev/rootvg/rootlv - log "growing root filesystem" - xfs_growfs / - - log "extending var lvm" - lvextend -l +100%FREE /dev/rootvg/varlv - log "growing var filesystem" - xfs_growfs /var -} - -# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file -create_azure_rpm_repos() { - log "starting" - - local -r azure_repo_filename='/etc/yum.repos.d/azure.repo' - local -r azure_repo_file='[azure-cli] -name=azure-cli -baseurl=https://packages.microsoft.com/yumrepos/azure-cli -enabled=yes -gpgcheck=yes - -[azurecore] -name=azurecore -baseurl=https://packages.microsoft.com/yumrepos/azurecore -enabled=yes -gpgcheck=no' - - write_file azure_repo_filename azure_repo_file true -} - -# configure_aro_services creates, configures, and enables the following systemd services and timers -# services -# fluentbit -# mdm -# mdsd -# arp-rp -# aro-dbtoken -# aro-monitor -# aro-portal -configure_aro_services() { - configure_service_fluentbit - configure_service_mdm - configure_timers_mdm_mdsd - configure_service_aro_rp - configure_service_aro_dbtoken - configure_service_aro_monitor - configure_service_aro_portal - configure_service_mdsd -} - -# configure_service_fluentbit -configure_service_fluentbit() { - log "starting" - log "configuring fluentbit service" - - mkdir -p /etc/fluentbit/ - mkdir -p /var/lib/fluent - - local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf' local -r fluentbit_conf_file="[INPUT] Name systemd Tag journald @@ -214,273 +114,70 @@ DB /var/lib/fluent/journaldb Match * Port 29230" - write_file fluentbit_conf_filename fluentbit_conf_file true - - local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit' - local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE" - - write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true - - local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service' - - local -r fluentbit_service_file="[Unit] -After=network-online.target -Wants=network-online.target -StartLimitIntervalSec=0 - -[Service] -RestartSec=1s -EnvironmentFile=/etc/sysconfig/fluentbit -ExecStartPre=-/usr/bin/docker rm -f %N -ExecStart=/usr/bin/docker run \ - --security-opt label=disable \ - --entrypoint /opt/td-agent-bit/bin/td-agent-bit \ - --net=host \ - --hostname %H \ - --name %N \ - --rm \ - --cap-drop net_raw \ - -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \ - -v /var/lib/fluent:/var/lib/fluent:z \ - -v /var/log/journal:/var/log/journal:ro \ - -v /etc/machine-id:/etc/machine-id:ro \ - $FLUENTBITIMAGE \ - -c /etc/fluentbit/fluentbit.conf - -ExecStop=/usr/bin/docker stop %N -Restart=always -RestartSec=5 -StartLimitInterval=0 + local -r aro_dbtoken_service_conf_file="DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME' +AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID' +AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID' +KEYVAULT_PREFIX='$KEYVAULTPREFIX' +MDM_ACCOUNT='$RPMDMACCOUNT' +MDM_NAMESPACE=DBToken +RPIMAGE='$RPIMAGE'" -[Install] -WantedBy=multi-user.target" + # TODO pass this to mdsd service call + configure_service_fluentbit fluentbit_conf_file fluentbit_image + configure_service_mdm + configure_timers_mdm_mdsd + configure_service_aro_rp + configure_service_aro_dbtoken + configure_service_aro_monitor + configure_service_aro_portal + local -r mdsd_rp_version="$RPMDSDCONFIGVERSION" + configure_service_mdsd mdsd_rp_version - write_file fluentbit_service_filename fluentbit_service_file true -} + local -ra aro_services=( + "aro-dbtoken" + "aro-monitor" + "aro-portal" + "aro-rp" + "auoms" + "azsecd" + "azsecmond" + "mdsd" + "mdm" + "chronyd" + "fluentbit" + ) -# configure_certs -configure_certs() { - log "starting" + enable_services aro_services - mkdir /etc/aro-rp - base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem - if [[ -n "$ARMAPICABUNDLE" ]]; then - base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem - fi - chown -R 1000:1000 /etc/aro-rp - - # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not - # to honour SSL_CERT_FILE any more, heaven only knows why. - mkdir -p /usr/lib/ssl/certs - csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null - c_rehash /usr/lib/ssl/certs - -# we leave clientId blank as long as only 1 managed identity assigned to vmss -# if we have more than 1, we will need to populate with clientId used for off-node scanning - local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config" - local -r nodescan_agent_file="{ - \"Nice\": 19, - \"Timeout\": 10800, - \"ClientId\": \"\", - \"TenantId\": $AZURESECPACKVSATENANTID, - \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL, - \"ProcessTimeout\": 300, - \"CommandDelay\": 0 - }" - - write_file nodescan_agent_filename nodescan_agent_file true + reboot_vm } -# configure_service_mdm -configure_service_mdm() { +# configure_rpm_repos +configure_rpm_repos() { log "starting" - log "configuring mdm service" - - local -r sysconfig_mdm_filename="/etc/sysconfig/mdm" - local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL' -MDMIMAGE='$MDMIMAGE' -MDMSOURCEENVIRONMENT='$LOCATION' -MDMSOURCEROLE=rp -MDMSOURCEROLEINSTANCE=\"$(hostname)\"" - - write_file sysconfig_mdm_filename sysconfig_mdm_file true - mkdir -p /var/etw - local -r mdm_service_filename="/etc/systemd/system/mdm.service" - local -r mdm_service_file="[Unit] -After=network-online.target -Wants=network-online.target - -[Service] -EnvironmentFile=/etc/sysconfig/mdm -ExecStartPre=-/usr/bin/docker rm -f %N -ExecStart=/usr/bin/docker run \ - --entrypoint /usr/sbin/MetricsExtension \ - --hostname %H \ - --name %N \ - --rm \ - --cap-drop net_raw \ - -m 2g \ - -v /etc/mdm.pem:/etc/mdm.pem \ - -v /var/etw:/var/etw:z \ - $MDMIMAGE \ - -CertFile /etc/mdm.pem \ - -FrontEndUrl $MDMFRONTENDURL \ - -Logger Console \ - -LogLevel Warning \ - -PrivateKeyFile /etc/mdm.pem \ - -SourceEnvironment $MDMSOURCEENVIRONMENT \ - -SourceRole $MDMSOURCEROLE \ - -SourceRoleInstance $MDMSOURCEROLEINSTANCE -ExecStop=/usr/bin/docker stop %N -Restart=always -RestartSec=1 -StartLimitInterval=0 - -[Install] -WantedBy=multi-user.target" - - write_file mdm_service_filename mdm_service_file true + configure_rhui_repo "$1" + create_azure_rpm_repos } -# configure_timers_mdm_mdsd -configure_timers_mdm_mdsd() { +# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file +create_azure_rpm_repos() { log "starting" - for var in "mdsd" "mdm"; do - local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service" - local download_creds_service_file="[Unit] -Description=Periodic $var credentials refresh - -[Service] -Type=oneshot -ExecStart=/usr/local/bin/download-credentials.sh $var" - - write_file download_creds_service_filename download_creds_service_file true - - local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer" - local download_creds_timer_file="[Unit] -Description=Periodic $var credentials refresh -After=network-online.target -Wants=network-online.target - -[Timer] -OnBootSec=0min -OnCalendar=0/12:00:00 -AccuracySec=5s - -[Install] -WantedBy=timers.target" - - write_file download_creds_timer_filename download_creds_timer_file true - done - - local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh" - local -r download_creds_script_file="#!/bin/bash -set -eu - -COMPONENT=\$1 -echo \"Download \$COMPONENT credentials\" - -TEMP_DIR=\"\$(mktemp -d)\" -export AZURE_CONFIG_DIR=\"\$(mktemp -d)\" - -echo \"Logging into Azure...\" -RETRIES=3 -while [[ \$RETRIES -gt 0 ]]; do - if az login -i --allow-no-subscriptions - then - echo \"az login successful\" - break - else - echo \"az login failed. Retrying...\" - let RETRIES-=1 - sleep 5 - fi -done - -trap \"cleanup\" EXIT - -cleanup() { - az logout - [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR - [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR -} - -if [[ \$COMPONENT = \"mdm\" ]]; then - CURRENT_CERT_FILE=\"/etc/mdm.pem\" -elif [[ \$COMPONENT\ = \"mdsd\" ]]; then - CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\" -else - echo Invalid usage && exit 1 -fi - -SECRET_NAME=\"rp-\${COMPONENT}\" -NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\" -for attempt in {1..5}; do - az keyvault \ - secret \ - download \ - --file \"\$NEW_CERT_FILE\" \ - --id \"https://$KEYVAULTPREFIX-svc.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \ - && break - if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi -done - -if [ -f \$NEW_CERT_FILE ]; then - if [[ \$COMPONENT = \"mdsd\" ]]; then - chown syslog:syslog \$NEW_CERT_FILE - else - sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE - fi - - new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\" - current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\" - if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then - echo updating certificate for \$COMPONENT - chmod 0600 \$NEW_CERT_FILE - mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE - fi -else - echo Failed to refresh certificate for \$COMPONENT && exit 1 -fi" - - write_file download_creds_script_filename download_creds_script_file true - - chmod u+x /usr/local/bin/download-credentials.sh - - systemctl enable download-mdsd-credentials.timer - systemctl enable download-mdm-credentials.timer - - /usr/local/bin/download-credentials.sh mdsd - /usr/local/bin/download-credentials.sh mdm - - local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')" - local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service" - local -r watch_mdm_creds_service_file="[Unit] -Description=Watch for changes in mdm.pem and restarts the mdm service - -[Service] -Type=oneshot -ExecStart=/usr/bin/systemctl restart mdm.service - -[Install] -WantedBy=multi-user.target" - - write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file true - - local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path' - local -r watch_mdm_creds_path_file='[Path] -PathModified=/etc/mdm.pem - -[Install] -WantedBy=multi-user.target' + local -r azure_repo_filename='/etc/yum.repos.d/azure.repo' + local -r azure_repo_file='[azure-cli] +name=azure-cli +baseurl=https://packages.microsoft.com/yumrepos/azure-cli +enabled=yes +gpgcheck=yes - write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file true +[azurecore] +name=azurecore +baseurl=https://packages.microsoft.com/yumrepos/azurecore +enabled=yes +gpgcheck=no' - local -r watch_mdm_creds='watch-mdm-credentials.path' - systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds" - systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds" + write_file azure_repo_filename azure_repo_file true } # configure_service_aro_rp @@ -573,58 +270,6 @@ WantedBy=multi-user.target" write_file aro_rp_service_filename aro_rp_service_file true } -# configure_service_aro_dbtoken -configure_service_aro_dbtoken() { - log "starting" - - local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken' - local -r aro_dbtoken_service_conf_file="DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME' -AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID' -AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID' -KEYVAULT_PREFIX='$KEYVAULTPREFIX' -MDM_ACCOUNT='$RPMDMACCOUNT' -MDM_NAMESPACE=DBToken -RPIMAGE='$RPIMAGE'" - - write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file true - - local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service' - local -r aro_dbtoken_service_file="[Unit] -After=network-online.target -Wants=network-online.target - -[Service] -EnvironmentFile=/etc/sysconfig/aro-dbtoken -ExecStartPre=-/usr/bin/docker rm -f %N -ExecStart=/usr/bin/docker run \ - --hostname %H \ - --name %N \ - --rm \ - --cap-drop net_raw \ - -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \ - -e DATABASE_ACCOUNT_NAME \ - -e AZURE_DBTOKEN_CLIENT_ID \ - -e KEYVAULT_PREFIX \ - -e MDM_ACCOUNT \ - -e MDM_NAMESPACE \ - -m 2g \ - -p 445:8445 \ - -v /run/systemd/journal:/run/systemd/journal \ - -v /var/etw:/var/etw:z \ - $RPIMAGE \ - dbtoken -ExecStop=/usr/bin/docker stop -t 3600 %N -TimeoutStopSec=3600 -Restart=always -RestartSec=1 -StartLimitInterval=0 - -[Install] -WantedBy=multi-user.target" - - write_file aro_dbtoken_service_filename aro_dbtoken_service_file true -} - # configure_service_aro_monitor configure_service_aro_monitor() { log "starting" @@ -748,61 +393,6 @@ WantedBy=multi-user.target" write_file aro_portal_service_filename aro_portal_service_file true } -# configure_service_mdsd -configure_service_mdsd() { - local -n mdsd - log "starting" - - local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d" - mkdir -p "$mdsd_service_dir" - - local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf" - local -r mdsd_override_conf_file="[Unit] -After=network-online.target" - - write_file mdsd_override_conf_filename mdsd_override_conf_file true - - local -r default_mdsd_filename="/etc/default/mdsd" - local -r default_mdsd_file="MDSD_ROLE_PREFIX=/var/run/mdsd/default -MDSD_OPTIONS=\"-A -d -r \$MDSD_ROLE_PREFIX\" - -export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT' -export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT' -export MONITORING_GCS_REGION='$LOCATION' -export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault -export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN' -export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE' -export MONITORING_CONFIG_VERSION='$RPMDSDCONFIGVERSION' -export MONITORING_USE_GENEVA_CONFIG_SERVICE=true - -export MONITORING_TENANT='$LOCATION' -export MONITORING_ROLE=rp -export MONITORING_ROLE_INSTANCE=\"$(hostname)\" - -export MDSD_MSGPACK_SORT_COLUMNS=1\"" - - write_file default_mdsd_filename default_mdsd_file true - -} - -# run_azsecd_config_scan -run_azsecd_config_scan() { - log "starting" - - local -ar configs=( - "baseline" - "clamav" - "software" - ) - - log "Scanning configuration files ${configs[*]}" - # shellcheck disable=SC2068 - for scan in ${configs[@]}; do - log "Scanning config file $scan now" - /usr/local/bin/azsecd config -s "$scan" -d P1D - done -} - export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}" main "$@" From d914aef195e8970e18adcd1baba0df900c420875 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Fri, 19 Apr 2024 16:39:09 -0400 Subject: [PATCH 33/38] WIP Functional rpVMSS.sh and common.sh files --- pkg/deploy/generator/scripts/common.sh | 157 ++++++------------------- pkg/deploy/generator/scripts/rpVMSS.sh | 104 ++++++++++++---- 2 files changed, 117 insertions(+), 144 deletions(-) diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/common.sh index f69e30dbf2c..c1db1d0c2f6 100644 --- a/pkg/deploy/generator/scripts/common.sh +++ b/pkg/deploy/generator/scripts/common.sh @@ -131,7 +131,9 @@ configure_firewalld_rules() { } # configure_logrotate clobbers /etc/logrotate.conf -# TODO add writing of dropin files +# args: +# 1) dropin_files - associative array. Key name dictates filenames written to /etc/logrotate.d. +# If an empty array is provided, no files will be written configure_logrotate() { local -n dropin_files="$1" log "starting" @@ -228,7 +230,7 @@ enable_services() { # shellcheck disable=SC2068 for service in ${services[@]}; do log "Enabling $service now" - systemctl enable "$service.service" + systemctl enable "$service" done } @@ -377,14 +379,16 @@ configure_certs() { # configure_service_mdm configure_service_mdm() { + local -n role="$1" + local -n image="$2" log "starting" log "configuring mdm service" local -r sysconfig_mdm_filename="/etc/sysconfig/mdm" local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL' -MDMIMAGE='$MDMIMAGE' +MDMIMAGE='$image' MDMSOURCEENVIRONMENT='$LOCATION' -MDMSOURCEROLE=gateway +MDMSOURCEROLE='$role' MDMSOURCEROLEINSTANCE=\"$(hostname)\"" write_file sysconfig_mdm_filename sysconfig_mdm_file true @@ -407,7 +411,7 @@ ExecStart=/usr/bin/docker run \ -m 2g \ -v /etc/mdm.pem:/etc/mdm.pem \ -v /var/etw:/var/etw:z \ - $MDMIMAGE \ + $image \ -CertFile /etc/mdm.pem \ -FrontEndUrl $MDMFRONTENDURL \ -Logger Console \ @@ -429,6 +433,7 @@ WantedBy=multi-user.target" # configure_timers_mdm_mdsd configure_timers_mdm_mdsd() { + local -n component="$1" log "starting" for var in "mdsd" "mdm"; do @@ -493,20 +498,20 @@ cleanup() { if [[ \$COMPONENT = \"mdm\" ]]; then CURRENT_CERT_FILE=\"/etc/mdm.pem\" -elif [[ \$COMPONENT\ = \"mdsd\" ]]; then +elif [[ \$COMPONENT = \"mdsd\" ]]; then CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\" else echo Invalid usage && exit 1 fi -SECRET_NAME=\"gwy-\${COMPONENT}\" +SECRET_NAME=\"$component-\${COMPONENT}\" NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\" for attempt in {1..5}; do az keyvault \ secret \ download \ --file \"\$NEW_CERT_FILE\" \ - --id \"https://$KEYVAULTPREFIX-gwy.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \ + --id \"https://$KEYVAULTPREFIX-$component.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \ && break if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi done @@ -533,12 +538,8 @@ fi" chmod u+x /usr/local/bin/download-credentials.sh - # TODO place this in enable services section - systemctl enable download-mdsd-credentials.timer - systemctl enable download-mdm-credentials.timer - - /usr/local/bin/download-credentials.sh mdsd - /usr/local/bin/download-credentials.sh mdm + $download_creds_script_filename mdsd + $download_creds_script_filename mdm local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')" local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service" @@ -570,31 +571,30 @@ WantedBy=multi-user.target' # configure_service_fluentbit configure_service_fluentbit() { - local -n fluentbit_conf_file="$1" - local -n fluentbit_image="$2" + local -n conf_file="$1" + local -n image="$2" log "starting" log "configuring fluentbit service" - if [[ -n $fluentbit_conf_file ]]; then - abort "$1 fluentbit config file cannot be empty" - elif [[ -n $fluentbit_image ]]; then - abort "$2 fluentbit image cannot be empty" + if [ -z "$conf_file" ]; then + abort "$1 config file cannot be empty" + elif [ -z "$image" ]; then + abort "$2 image cannot be empty" fi mkdir -p /etc/fluentbit/ mkdir -p /var/lib/fluent - local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf' - write_file fluentbit_conf_filename fluentbit_conf_file true - - local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit' - local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$fluentbit_image" + local -r conf_filename='/etc/fluentbit/fluentbit.conf' + write_file conf_filename conf_file true - write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true + local -r sysconfig_filename='/etc/sysconfig/fluentbit' + local -r sysconfig_file="FLUENTBITIMAGE=$fluentbit_image" - local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service' + write_file sysconfig_filename sysconfig_file true - local -r fluentbit_service_file="[Unit] + local -r service_filename='/etc/systemd/system/fluentbit.service' + local -r service_file="[Unit] After=network-online.target Wants=network-online.target StartLimitIntervalSec=0 @@ -615,7 +615,7 @@ ExecStart=/usr/bin/docker run \ -v /var/lib/fluent:/var/lib/fluent:z \ -v /var/log/journal:/var/log/journal:ro \ -v /etc/machine-id:/etc/machine-id:ro \ - $fluentbit_image \ + $image \ -c /etc/fluentbit/fluentbit.conf ExecStop=/usr/bin/docker stop %N @@ -626,99 +626,13 @@ StartLimitInterval=0 [Install] WantedBy=multi-user.target" - write_file fluentbit_service_filename fluentbit_service_file true -} - -# configure_service_aro_dbtoken -configure_service_aro_dbtoken() { - local -n dbtoken_conf="$1" - local -n log_dir="${2:-}" - log "starting" - - local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken' - - write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file true - - local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service' - # TODO add test if log_dir is empty, else - local -r aro_dbtoken_service_file="[Unit] -After=network-online.target -Wants=network-online.target - -[Service] -EnvironmentFile=/etc/sysconfig/aro-dbtoken -ExecStartPre=-/usr/bin/docker rm -f %N -ExecStart=/usr/bin/docker run \ - --hostname %H \ - --name %N \ - --rm \ - --cap-drop net_raw \ - -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \ - -e DATABASE_ACCOUNT_NAME \ - -e AZURE_DBTOKEN_CLIENT_ID \ - -e KEYVAULT_PREFIX \ - -e MDM_ACCOUNT \ - -e MDM_NAMESPACE \ - -m 2g \ - -p 445:8445 \ - -v /run/systemd/journal:/run/systemd/journal \ - -v /var/etw:/var/etw:z \ - $RPIMAGE \ - dbtoken -ExecStop=/usr/bin/docker stop -t 3600 %N -TimeoutStopSec=3600 -Restart=always -RestartSec=1 -StartLimitInterval=0 - -[Install] -WantedBy=multi-user.target" - - local -r aro_dbtoken_service_file="[Unit] -After=network-online.target -Wants=network-online.target - -[Service] -EnvironmentFile=/etc/sysconfig/aro-gateway -ExecStartPre=-/usr/bin/docker rm -f %N -ExecStartPre=/usr/bin/mkdir -p ${gateway_logdir} -ExecStart=/usr/bin/docker run \ - --hostname %H \ - --name %N \ - --rm \ - --cap-drop net_raw \ - -e ACR_RESOURCE_ID \ - -e DATABASE_ACCOUNT_NAME \ - -e AZURE_DBTOKEN_CLIENT_ID \ - -e DBTOKEN_URL \ - -e GATEWAY_DOMAINS \ - -e GATEWAY_FEATURES \ - -e MDM_ACCOUNT \ - -e MDM_NAMESPACE \ - -m 2g \ - -p 80:8080 \ - -p 8081:8081 \ - -p 443:8443 \ - -v /run/systemd/journal:/run/systemd/journal \ - -v /var/etw:/var/etw:z \ - -v ${gateway_logdir}:/ctr.log:z \ - \$RPIMAGE \ - gateway -ExecStop=/usr/bin/docker stop -t 3600 %N -TimeoutStopSec=3600 -Restart=always -RestartSec=1 -StartLimitInterval=0 - -[Install] -WantedBy=multi-user.target" - - write_file aro_dbtoken_service_filename aro_dbtoken_service_file true + write_file service_filename service_file true } # configure_service_mdsd configure_service_mdsd() { - local -n monitor_config_version="$1" + local -n monitoring_role="$1" + local -n monitor_config_version="$2" log "starting" local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d" @@ -744,7 +658,7 @@ export MONITORING_CONFIG_VERSION='$monitor_config_version' export MONITORING_USE_GENEVA_CONFIG_SERVICE=true export MONITORING_TENANT='$LOCATION' -export MONITORING_ROLE=rp +export MONITORING_ROLE='$monitoring_role' export MONITORING_ROLE_INSTANCE=\"$(hostname)\" export MDSD_MSGPACK_SORT_COLUMNS=1\"" @@ -769,3 +683,8 @@ run_azsecd_config_scan() { /usr/local/bin/azsecd config -s "$scan" -d P1D done } + +create_required_dirs() { + mkdir -p /var/log/journal + mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store +} diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index c7fd67f2d30..730964d5ab7 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -53,13 +53,14 @@ main() { dnf_install_pkgs install_pkgs retry_wait_time configure_dnf_cron_job - configure_disk_partitions - configure_logrotate - configure_selinux - mkdir -p /var/log/journal - mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store + # Key dictates the filename written in /etc/logrotate.d + # Present for future dropin files, also is required for configure_logrotate + local -rA logrotate_dropins=() + configure_logrotate logrotate_dropins + configure_selinux + create_required_dirs local -ra enable_ports=( "443/tcp" @@ -78,7 +79,8 @@ main() { "$rpimage" "$fluentbit_image" ) - pull_container_images images + local -r registry_config_file="" + pull_container_images images registry_config_file local -r fluentbit_conf_file="[INPUT] Name systemd @@ -114,24 +116,17 @@ DB /var/lib/fluent/journaldb Match * Port 29230" - local -r aro_dbtoken_service_conf_file="DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME' -AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID' -AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID' -KEYVAULT_PREFIX='$KEYVAULTPREFIX' -MDM_ACCOUNT='$RPMDMACCOUNT' -MDM_NAMESPACE=DBToken -RPIMAGE='$RPIMAGE'" - - # TODO pass this to mdsd service call configure_service_fluentbit fluentbit_conf_file fluentbit_image - configure_service_mdm - configure_timers_mdm_mdsd + local -r monitor_role="rp" + configure_service_mdm monitor_role mdmimage + configure_timers_mdm_mdsd monitor_role configure_service_aro_rp - configure_service_aro_dbtoken - configure_service_aro_monitor - configure_service_aro_portal + + configure_service_dbtoken rpimage + configure_service_aro_monitor rpimage + configure_service_aro_portal rpimage local -r mdsd_rp_version="$RPMDSDCONFIGVERSION" - configure_service_mdsd mdsd_rp_version + configure_service_mdsd monitor_role mdsd_rp_version local -ra aro_services=( "aro-dbtoken" @@ -145,6 +140,8 @@ RPIMAGE='$RPIMAGE'" "mdm" "chronyd" "fluentbit" + "download-mdsd-credentials.timer" + "download-mdm-credentials.timer" ) enable_services aro_services @@ -272,6 +269,7 @@ WantedBy=multi-user.target" # configure_service_aro_monitor configure_service_aro_monitor() { + local -n image="$1" log "starting" log "configuring aro-monitor service" @@ -292,7 +290,7 @@ DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME' KEYVAULT_PREFIX='$KEYVAULTPREFIX' MDM_ACCOUNT='$RPMDMACCOUNT' MDM_NAMESPACE=BBM -RPIMAGE='$RPIMAGE'" +RPIMAGE='$image'" write_file aro_monitor_service_conf_filename aro_monitor_service_conf_file true @@ -326,7 +324,7 @@ ExecStart=/usr/bin/docker run \ -m 2.5g \ -v /run/systemd/journal:/run/systemd/journal \ -v /var/etw:/var/etw:z \ - $RPIMAGE \ + $image \ monitor Restart=always RestartSec=1 @@ -340,6 +338,7 @@ WantedBy=multi-user.target" # configure_service_aro_portal configure_service_aro_portal() { + local -n image="$1" log "starting" local -r aro_portal_service_conf_filename='/etc/sysconfig/aro-portal' @@ -351,7 +350,7 @@ KEYVAULT_PREFIX='$KEYVAULTPREFIX' MDM_ACCOUNT='$RPMDMACCOUNT' MDM_NAMESPACE=Portal PORTAL_HOSTNAME='$LOCATION.admin.$RPPARENTDOMAINNAME' -RPIMAGE='$RPIMAGE'" +RPIMAGE='$image'" write_file aro_portal_service_conf_filename aro_portal_service_conf_file true @@ -382,7 +381,7 @@ ExecStart=/usr/bin/docker run \ -p 2222:2222 \ -v /run/systemd/journal:/run/systemd/journal \ -v /var/etw:/var/etw:z \ - $RPIMAGE \ + $image \ portal Restart=always RestartSec=1 @@ -393,6 +392,61 @@ WantedBy=multi-user.target" write_file aro_portal_service_filename aro_portal_service_file true } +# configure_service_aro_dbtoken +configure_service_dbtoken() { + local -n image="$1" + log "starting" + + local -r conf_file="DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME' +AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID' +AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID' +KEYVAULT_PREFIX='$KEYVAULTPREFIX' +MDM_ACCOUNT='$RPMDMACCOUNT' +MDM_NAMESPACE=DBToken +RPIMAGE='$image'" + + local -r conf_filename='/etc/sysconfig/aro-dbtoken' + + write_file conf_filename conf_file true + + local -r service_file="[Unit] +After=network-online.target +Wants=network-online.target + +[Service] +EnvironmentFile=/etc/sysconfig/aro-dbtoken +ExecStartPre=-/usr/bin/docker rm -f %N +ExecStart=/usr/bin/docker run \ + --hostname %H \ + --name %N \ + --rm \ + --cap-drop net_raw \ + -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \ + -e DATABASE_ACCOUNT_NAME \ + -e AZURE_DBTOKEN_CLIENT_ID \ + -e KEYVAULT_PREFIX \ + -e MDM_ACCOUNT \ + -e MDM_NAMESPACE \ + -m 2g \ + -p 445:8445 \ + -v /run/systemd/journal:/run/systemd/journal \ + -v /var/etw:/var/etw:z \ + $image \ + dbtoken +ExecStop=/usr/bin/docker stop -t 3600 %N +TimeoutStopSec=3600 +Restart=always +RestartSec=1 +StartLimitInterval=0 + +[Install] +WantedBy=multi-user.target" + + local -r service_filename='/etc/systemd/system/aro-dbtoken.service' + write_file service_filename service_file true +} + + export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}" main "$@" From 429c281ee140247f342dce477126923a5d5ffd17 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Tue, 23 Apr 2024 16:08:27 -0400 Subject: [PATCH 34/38] WIP Functional gatewayVMSS.sh, moved repo functions into common.sh --- pkg/deploy/generator/scripts/common.sh | 72 ++++++++++++--------- pkg/deploy/generator/scripts/gatewayVMSS.sh | 60 ++++++++++------- pkg/deploy/generator/scripts/rpVMSS.sh | 28 -------- 3 files changed, 78 insertions(+), 82 deletions(-) diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/common.sh index c1db1d0c2f6..fbae20b34d3 100644 --- a/pkg/deploy/generator/scripts/common.sh +++ b/pkg/deploy/generator/scripts/common.sh @@ -178,8 +178,9 @@ include /etc/logrotate.d local -r logrotate_d="/etc/logrotate.d" log "Writing logrotate files to $logrotate_d" for dropin_name in "${!dropin_files[@]}"; do - local -r dropin_file="$logrotate_d/$dropin_name" - write_file "$dropin_file" "${dropin_files["$dropin_name"]}" + local -r dropin_filename="$logrotate_d/$dropin_name" + local -r dropin_file="${dropin_files["$dropin_name"]}" + write_file dropin_filename dropin_file true done } @@ -226,6 +227,8 @@ enable_services() { local -n services="$1" log "starting" + systemctl daemon-reload + log "enabling services ${services[*]}" # shellcheck disable=SC2068 for service in ${services[@]}; do @@ -276,7 +279,40 @@ abort() { exit 1 } -# configure_rhui_repo +# configure_rpm_repos +# New repositories should be added in their own functions, and called here +# args: +# 1) retry_wait_time - nameref +configure_rpm_repos() { + log "starting" + + configure_rhui_repo "$1" + create_azure_rpm_repos +} + +# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file +create_azure_rpm_repos() { + log "starting" + + local -r azure_repo_filename='/etc/yum.repos.d/azure.repo' + local -r azure_repo_file='[azure-cli] +name=azure-cli +baseurl=https://packages.microsoft.com/yumrepos/azure-cli +enabled=yes +gpgcheck=yes + +[azurecore] +name=azurecore +baseurl=https://packages.microsoft.com/yumrepos/azurecore +enabled=yes +gpgcheck=no' + + write_file azure_repo_filename azure_repo_file true +} + +# configure_rhui_repo enables all rhui-microsoft-azure* repos +# args: +# 1) retry_wait_time - nameref configure_rhui_repo() { log "starting" @@ -302,26 +338,6 @@ dnf update -y" chmod +x "$cron_weekly_dnf_update_filename" } -# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file -create_azure_rpm_repos() { - log "starting" - - local -r azure_repo_filename='/etc/yum.repos.d/azure.repo' - local -r azure_repo_file='[azure-cli] -name=azure-cli -baseurl=https://packages.microsoft.com/yumrepos/azure-cli -enabled=yes -gpgcheck=yes - -[azurecore] -name=azurecore -baseurl=https://packages.microsoft.com/yumrepos/azurecore -enabled=yes -gpgcheck=no' - - write_file azure_repo_filename azure_repo_file true -} - # configure_disk_partitions configure_disk_partitions() { log "starting" @@ -361,8 +377,8 @@ configure_certs() { csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null c_rehash /usr/lib/ssl/certs -# we leave clientId blank as long as only 1 managed identity assigned to vmss -# if we have more than 1, we will need to populate with clientId used for off-node scanning + # we leave clientId blank as long as only 1 managed identity assigned to vmss + # if we have more than 1, we will need to populate with clientId used for off-node scanning local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config" local -r nodescan_agent_file="{ \"Nice\": 19, @@ -576,12 +592,6 @@ configure_service_fluentbit() { log "starting" log "configuring fluentbit service" - if [ -z "$conf_file" ]; then - abort "$1 config file cannot be empty" - elif [ -z "$image" ]; then - abort "$2 image cannot be empty" - fi - mkdir -p /etc/fluentbit/ mkdir -p /var/lib/fluent diff --git a/pkg/deploy/generator/scripts/gatewayVMSS.sh b/pkg/deploy/generator/scripts/gatewayVMSS.sh index 064bf18bd49..edc219928cd 100644 --- a/pkg/deploy/generator/scripts/gatewayVMSS.sh +++ b/pkg/deploy/generator/scripts/gatewayVMSS.sh @@ -8,7 +8,14 @@ if [ "${DEBUG:-false}" == true ]; then fi main() { + # transaction attempt retry time in seconds + local -ri retry_wait_time=60 + + # shellcheck source=common.sh + source common.sh + configure_sshd + configure_rpm_repos retry_wait_time local -ar exclude_pkgs=( "-x WALinuxAgent" @@ -29,6 +36,7 @@ main() { ) dnf_install_pkgs repo_rpm_pkgs retry_wait_time + configure_dnf_cron_job local -ra install_pkgs=( clamav @@ -61,15 +69,14 @@ ${gateway_logdir} { compress }" + # Key dictates the filename written in /etc/logrotate.d local -rA logrotate_dropins=( - ["gateway_log_config"]="$gateway_log_file" + ["gateway"]="$gateway_log_file" ) configure_logrotate logrotate_dropins configure_selinux - - mkdir -p /var/log/journal - mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store + create_required_dirs local -ra enable_ports=( "80/tcp" @@ -87,18 +94,7 @@ ${gateway_logdir} { "$fluentbit_image" ) - pull_container_images images - - local -ra gateway_services=( - aro-gateway - auoms - azsecd - azsecmond - mdsd - mdm - chronyd - fluentbit - ) + pull_container_images images registry_config_file local -r fluentbit_conf_file="[INPUT] Name systemd @@ -117,7 +113,11 @@ DB /var/lib/fluent/journaldb Match * Port 29230" - local -r aro_dbtoken_service_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID' + configure_service_fluentbit fluentbit_conf_file fluentbit_image + local -r mdm_role="gateway" + configure_service_mdm mdm_role mdmimage + + local -r gwy_dbtoken_service_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID' DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME' AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID' DBTOKEN_URL='$DBTOKENURL' @@ -126,14 +126,28 @@ MDM_NAMESPACE=Gateway GATEWAY_DOMAINS='$GATEWAYDOMAINS' GATEWAY_FEATURES='$GATEWAYFEATURES' RPIMAGE='$RPIMAGE'" + configure_service_gateway gateway_logdir - local -n mdsd_gateway_version="$GATEWAYMDSDCONFIGVERSION" + local -r mdsd_config_version="$GATEWAYMDSDCONFIGVERSION" + configure_service_mdsd mdm_role mdsd_config_version + local -r mdsd_role="gwy" + configure_timers_mdm_mdsd mdsd_role + + local -ra gateway_services=( + "aro-gateway" + "auoms" + "azsecd" + "azsecmond" + "mdsd" + "mdm" + "chronyd" + "fluentbit" + "download-mdsd-credentials.timer" + "download-mdm-credentials.timer" + ) + + enable_services gateway_services - configure_service_fluentbit fluentbit_conf_file fluentbit_image - configure_service_mdm - configure_timers_mdm_mdsd - configure_service_gateway gateway_log_file - configure_service_mdsd reboot_vm } diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 730964d5ab7..406e8273042 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -149,34 +149,6 @@ DB /var/lib/fluent/journaldb reboot_vm } -# configure_rpm_repos -configure_rpm_repos() { - log "starting" - - configure_rhui_repo "$1" - create_azure_rpm_repos -} - -# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file -create_azure_rpm_repos() { - log "starting" - - local -r azure_repo_filename='/etc/yum.repos.d/azure.repo' - local -r azure_repo_file='[azure-cli] -name=azure-cli -baseurl=https://packages.microsoft.com/yumrepos/azure-cli -enabled=yes -gpgcheck=yes - -[azurecore] -name=azurecore -baseurl=https://packages.microsoft.com/yumrepos/azurecore -enabled=yes -gpgcheck=no' - - write_file azure_repo_filename azure_repo_file true -} - # configure_service_aro_rp configure_service_aro_rp() { log "starting" From 5a3ab70f1ad95069bfbc0008c79f6fa255da13d1 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Tue, 23 Apr 2024 17:12:36 -0400 Subject: [PATCH 35/38] Consolidate configure_certs by adding arguement determining certs to configure --- pkg/deploy/generator/scripts/common.sh | 23 ++++++++++++++++++----- 1 file changed, 18 insertions(+), 5 deletions(-) diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/common.sh index fbae20b34d3..1de8b773786 100644 --- a/pkg/deploy/generator/scripts/common.sh +++ b/pkg/deploy/generator/scripts/common.sh @@ -362,14 +362,27 @@ configure_disk_partitions() { # configure_certs configure_certs() { + local -n role="$1" log "starting" + log "Configuring certificates for $role" + + if [ "$role" == "devproxy" ]; then + base64 -d <<<"$PROXYCERT" >/etc/proxy/proxy.crt + base64 -d <<<"$PROXYKEY" >/etc/proxy/proxy.key + base64 -d <<<"$PROXYCLIENTCERT" >/etc/proxy/proxy-client.crt + chown -R 1000:1000 /etc/proxy + chmod 0600 /etc/proxy/proxy.key + return 0 + fi - mkdir /etc/aro-rp - base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem - if [[ -n "$ARMAPICABUNDLE" ]]; then - base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem + if [ "$role" == "rp" ]; then + mkdir -p /etc/aro-rp + base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem + if [[ -n "$ARMAPICABUNDLE" ]]; then + base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem + fi + chown -R 1000:1000 /etc/aro-rp fi - chown -R 1000:1000 /etc/aro-rp # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not # to honour SSL_CERT_FILE any more, heaven only knows why. From f289e16e4cca13ae0473d458ee1f4d4ff0700ba6 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Tue, 23 Apr 2024 17:12:58 -0400 Subject: [PATCH 36/38] WIP configure certificates on gateway, rp, devProxy VMSSes Move create_required_dirs to be the first step that runs, to ensure they exist when needed. This was mostly for the devProxyVMSS --- pkg/deploy/generator/scripts/common.sh | 43 +++++++++++++------- pkg/deploy/generator/scripts/devProxyVMSS.sh | 18 +++----- pkg/deploy/generator/scripts/gatewayVMSS.sh | 4 +- pkg/deploy/generator/scripts/rpVMSS.sh | 4 +- 4 files changed, 40 insertions(+), 29 deletions(-) diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/common.sh index 1de8b773786..6f54ced7354 100644 --- a/pkg/deploy/generator/scripts/common.sh +++ b/pkg/deploy/generator/scripts/common.sh @@ -187,7 +187,8 @@ include /etc/logrotate.d # pull_container_images pull_container_images() { local -n pull_images="$1" - local -n registry_conf="${2:-}" + local -n registry_conf="${2:-empty}" + local -r az_login="${3:-true}" log "starting" # The managed identity that the VM runs as only has a single roleassignment. @@ -196,7 +197,9 @@ pull_container_images() { # role assignments scoped on the subscription we're deploying into, it will # not show on az login -i, which is why the below line is commented. # az account set -s "$SUBSCRIPTIONID" - az login -i --allow-no-subscriptions + if $az_login; then + az login -i --allow-no-subscriptions + fi # Suppress emulation output for podman instead of docker for az acr compatability mkdir -p /etc/containers/ @@ -211,7 +214,9 @@ pull_container_images() { fi log "logging into prod acr" - az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" + if $az_login; then + az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" + fi # shellcheck disable=SC2068 for i in ${pull_images[@]}; do @@ -219,7 +224,9 @@ pull_container_images() { podman pull "$i" done - az logout + if $az_login; then + az logout + fi } # enable_services enables all services required for aro rp @@ -367,28 +374,32 @@ configure_certs() { log "Configuring certificates for $role" if [ "$role" == "devproxy" ]; then - base64 -d <<<"$PROXYCERT" >/etc/proxy/proxy.crt - base64 -d <<<"$PROXYKEY" >/etc/proxy/proxy.key - base64 -d <<<"$PROXYCLIENTCERT" >/etc/proxy/proxy-client.crt + local -r proxy_certs_basedir="/etc/proxy" + mkdir -p "$proxy_certs_basedir" + base64 -d <<<"$PROXYCERT" > "$proxy_certs_basedir/proxy.crt" + base64 -d <<<"$PROXYKEY" > "$proxy_certs_basedir/proxy.key" + base64 -d <<<"$PROXYCLIENTCERT" > "$proxy_certs_basedir/proxy-client.crt" chown -R 1000:1000 /etc/proxy - chmod 0600 /etc/proxy/proxy.key + chmod 0600 "$proxy_certs_basedir/proxy.key" return 0 fi if [ "$role" == "rp" ]; then - mkdir -p /etc/aro-rp - base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem + local -r rp_certs_basedir="/etc/aro-rp" + mkdir -p + base64 -d <<<"$ADMINAPICABUNDLE" > "$rp_certs_basedir/admin-ca-bundle.pem" if [[ -n "$ARMAPICABUNDLE" ]]; then - base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem + base64 -d <<<"$ARMAPICABUNDLE" > "$rp_certs_basedir/arm-ca-bundle.pem" fi - chown -R 1000:1000 /etc/aro-rp + chown -R 1000:1000 "$rp_certs_basedir" fi # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not # to honour SSL_CERT_FILE any more, heaven only knows why. - mkdir -p /usr/lib/ssl/certs - csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null - c_rehash /usr/lib/ssl/certs + local -r ssl_certs_basedir="/usr/lib/ssl/certs" + mkdir -p + csplit -f "$ssl_certs_basedir/cert-" -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null + c_rehash "$ssl_certs_basedir" # we leave clientId blank as long as only 1 managed identity assigned to vmss # if we have more than 1, we will need to populate with clientId used for off-node scanning @@ -710,4 +721,6 @@ run_azsecd_config_scan() { create_required_dirs() { mkdir -p /var/log/journal mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store + # Does not exist on devProxyVMSS + mkdir -p /var/opt/microsoft/linuxmonagent } diff --git a/pkg/deploy/generator/scripts/devProxyVMSS.sh b/pkg/deploy/generator/scripts/devProxyVMSS.sh index 9866313e007..af727a11155 100644 --- a/pkg/deploy/generator/scripts/devProxyVMSS.sh +++ b/pkg/deploy/generator/scripts/devProxyVMSS.sh @@ -14,6 +14,8 @@ main() { # shellcheck source=common.sh source common.sh + create_required_dirs + local -ar exclude_pkgs=( "-x WALinuxAgent" "-x WALinuxAgent-udev" @@ -44,9 +46,12 @@ main() { } }" - pull_container_images proxy_image registry_config_file + pull_container_images proxy_image registry_config_file false configure_devproxy_services proxy_images + local -r vmss_role="devproxy" + configure_certs vmss_role + local -ra proxy_services=( proxy ) @@ -62,17 +67,6 @@ configure_devproxy_services() { configure_service_proxy "$1" } -# configure_certs -configure_certs() { - log "starting" - - base64 -d <<<"$PROXYCERT" >/etc/proxy/proxy.crt - base64 -d <<<"$PROXYKEY" >/etc/proxy/proxy.key - base64 -d <<<"$PROXYCLIENTCERT" >/etc/proxy/proxy-client.crt - chown -R 1000:1000 /etc/proxy - chmod 0600 /etc/proxy/proxy.key -} - configure_service_proxy() { local -n proxy_image="$1" local -r sysconfig_proxy_filename='/etc/sysconfig/proxy' diff --git a/pkg/deploy/generator/scripts/gatewayVMSS.sh b/pkg/deploy/generator/scripts/gatewayVMSS.sh index edc219928cd..bb0e12e7137 100644 --- a/pkg/deploy/generator/scripts/gatewayVMSS.sh +++ b/pkg/deploy/generator/scripts/gatewayVMSS.sh @@ -14,6 +14,7 @@ main() { # shellcheck source=common.sh source common.sh + create_required_dirs configure_sshd configure_rpm_repos retry_wait_time @@ -76,7 +77,6 @@ ${gateway_logdir} { configure_logrotate logrotate_dropins configure_selinux - create_required_dirs local -ra enable_ports=( "80/tcp" @@ -133,6 +133,8 @@ RPIMAGE='$RPIMAGE'" local -r mdsd_role="gwy" configure_timers_mdm_mdsd mdsd_role + configure_certs mdm_role + local -ra gateway_services=( "aro-gateway" "auoms" diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 406e8273042..2d9f16b717d 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -14,6 +14,7 @@ main() { # shellcheck source=common.sh source common.sh + create_required_dirs configure_sshd configure_rpm_repos retry_wait_time @@ -60,7 +61,6 @@ main() { local -rA logrotate_dropins=() configure_logrotate logrotate_dropins configure_selinux - create_required_dirs local -ra enable_ports=( "443/tcp" @@ -128,6 +128,8 @@ DB /var/lib/fluent/journaldb local -r mdsd_rp_version="$RPMDSDCONFIGVERSION" configure_service_mdsd monitor_role mdsd_rp_version + configure_certs monitor_role + local -ra aro_services=( "aro-dbtoken" "aro-monitor" From 63867bb55e0b637c3eeaa154b65414c3de890c30 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Tue, 23 Apr 2024 18:02:52 -0400 Subject: [PATCH 37/38] rename common.sh to commonVMSS.sh to show it's common to \*VMSS.sh scripts --- pkg/deploy/generator/scripts/{common.sh => commonVMSS.sh} | 0 pkg/deploy/generator/scripts/devProxyVMSS.sh | 4 ++-- pkg/deploy/generator/scripts/gatewayVMSS.sh | 4 ++-- pkg/deploy/generator/scripts/rpVMSS.sh | 4 ++-- 4 files changed, 6 insertions(+), 6 deletions(-) rename pkg/deploy/generator/scripts/{common.sh => commonVMSS.sh} (100%) diff --git a/pkg/deploy/generator/scripts/common.sh b/pkg/deploy/generator/scripts/commonVMSS.sh similarity index 100% rename from pkg/deploy/generator/scripts/common.sh rename to pkg/deploy/generator/scripts/commonVMSS.sh diff --git a/pkg/deploy/generator/scripts/devProxyVMSS.sh b/pkg/deploy/generator/scripts/devProxyVMSS.sh index af727a11155..23aab382c85 100644 --- a/pkg/deploy/generator/scripts/devProxyVMSS.sh +++ b/pkg/deploy/generator/scripts/devProxyVMSS.sh @@ -11,8 +11,8 @@ main() { # transaction attempt retry time in seconds local -ri retry_wait_time=60 - # shellcheck source=common.sh - source common.sh + # shellcheck source=commonVMSS.sh + source commonVMSS.sh create_required_dirs diff --git a/pkg/deploy/generator/scripts/gatewayVMSS.sh b/pkg/deploy/generator/scripts/gatewayVMSS.sh index bb0e12e7137..8b382698977 100644 --- a/pkg/deploy/generator/scripts/gatewayVMSS.sh +++ b/pkg/deploy/generator/scripts/gatewayVMSS.sh @@ -11,8 +11,8 @@ main() { # transaction attempt retry time in seconds local -ri retry_wait_time=60 - # shellcheck source=common.sh - source common.sh + # shellcheck source=commonVMSS.sh + source commonVMSS.sh create_required_dirs configure_sshd diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 2d9f16b717d..dfe02052521 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -11,8 +11,8 @@ main() { # transaction attempt retry time in seconds local -ri retry_wait_time=60 - # shellcheck source=common.sh - source common.sh + # shellcheck source=commonVMSS.sh + source commonVMSS.sh create_required_dirs configure_sshd From bdf8d12b053faa89f6bbae09f3205e986cbf03b1 Mon Sep 17 00:00:00 2001 From: Steven Fairchild Date: Wed, 10 Apr 2024 11:24:40 -0400 Subject: [PATCH 38/38] Move systemd service configurations into functions Move dnf package and repo operations into function, move all service configuration into a function Move repository configuration higher in sequence of events, make unchanging variables readonly Add write_file function to cleanup creation of new files, appending to existing files move packages to install and rpm keys to import into arrays, this will make adding new packages and keys easier Add retry loop for rpm repo key imports, remove erroneous package from install_pkgs array Pass dnf packages and rpm keys to function calls via nameref to allow reuse, This also allows for function reuse. Add wait for all rpm related transactions to avoid rpm database corruption Add starting log message for each function call rpm database corruption has been seen in testing, and Prod deployments due to concurrent rpm database operations between rpm and dnf. wait is needed due to this. remove ERR trap, we aren't attempting to trap any specific errors yet. Increase dnf & rpm retry time to 1 minute, 5 minutes total Pass wait time as a nameref variable to allow easier modification Add parse_run_options to run individual steps for testing Add az login -i comment found in gatewayVMSS.sh, change variable syntex to snake case for consistency Port changes made in rpVMSS.sh to gatewayVMSS.sh Make gateway log directory to be passed in to functions where it is needed, this allows the value to be set in one location. Move retry steps into a single retry function call This is to reduce code duplication Move configure_fiewall_rules file creation to use write_file Correct accept_ra_conf variable name spelling Pass usage options via nameref variable that is also used by getops Move docker file creation to more logical location --- pkg/deploy/assets/env-development.json | 2 +- pkg/deploy/assets/gateway-production.json | 2 +- pkg/deploy/assets/rp-production.json | 2 +- pkg/deploy/generator/scripts/devProxyVMSS.sh | 440 ++++++-- pkg/deploy/generator/scripts/gatewayVMSS.sh | 1031 ++++++++++++----- pkg/deploy/generator/scripts/rpVMSS.sh | 1058 +++++++++++++----- 6 files changed, 1892 insertions(+), 643 deletions(-) diff --git a/pkg/deploy/assets/env-development.json b/pkg/deploy/assets/env-development.json index 10057c04528..1da1cb9fb5b 100644 --- a/pkg/deploy/assets/env-development.json +++ b/pkg/deploy/assets/env-development.json @@ -296,7 +296,7 @@ "autoUpgradeMinorVersion": true, "settings": {}, "protectedSettings": { - "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'PROXYIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImage')),''')\n','PROXYIMAGEAUTH=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImageAuth')),''')\n','PROXYCERT=''',parameters('proxyCert'),'''\n','PROXYCLIENTCERT=''',parameters('proxyClientCert'),'''\n','PROXYKEY=''',parameters('proxyKey'),'''\n','\n',base64ToString('I0FkZGluZyByZXRyeSBsb2dpYyB0byB5dW0gY29tbWFuZHMgaW4gb3JkZXIgdG8gYXZvaWQgc3RhbGxpbmcgb3V0IG9uIHJlc291cmNlIGxvY2tzCmVjaG8gInJ1bm5pbmcgUkhVSSBmaXgiCmZvciBhdHRlbXB0IGluIHsxLi41fTsgZG8KICB5dW0gdXBkYXRlIC15IC0tZGlzYWJsZXJlcG89JyonIC0tZW5hYmxlcmVwbz0ncmh1aS1taWNyb3NvZnQtYXp1cmUqJyAmJiBicmVhawogIGlmIFtbICR7YXR0ZW1wdH0gLWx0IDUgXV07IHRoZW4gc2xlZXAgMTA7IGVsc2UgZXhpdCAxOyBmaQpkb25lCgplY2hvICJydW5uaW5nIHl1bSB1cGRhdGUiCmZvciBhdHRlbXB0IGluIHsxLi41fTsgZG8KICB5dW0gLXkgLXggV0FMaW51eEFnZW50IC14IFdBTGludXhBZ2VudC11ZGV2IHVwZGF0ZSAtLWFsbG93ZXJhc2luZyAmJiBicmVhawogIGlmIFtbICR7YXR0ZW1wdH0gLWx0IDUgXV07IHRoZW4gc2xlZXAgMTA7IGVsc2UgZXhpdCAxOyBmaQpkb25lCgplY2hvICJpbnN0YWxsaW5nIHBvZG1hbi1kb2NrZXIiCmZvciBhdHRlbXB0IGluIHsxLi41fTsgZG8KICB5dW0gLXkgaW5zdGFsbCBwb2RtYW4tZG9ja2VyICYmIGJyZWFrCiAgaWYgW1sgJHthdHRlbXB0fSAtbHQgNSBdXTsgdGhlbiBzbGVlcCAxMDsgZWxzZSBleGl0IDE7IGZpCmRvbmUKCmZpcmV3YWxsLWNtZCAtLWFkZC1wb3J0PTQ0My90Y3AgLS1wZXJtYW5lbnQKCm1rZGlyIC9yb290Ly5kb2NrZXIKY2F0ID4vcm9vdC8uZG9ja2VyL2NvbmZpZy5qc29uIDw8RU9GCnsKCSJhdXRocyI6IHsKCQkiJHtQUk9YWUlNQUdFJSUvKn0iOiB7CgkJCSJhdXRoIjogIiRQUk9YWUlNQUdFQVVUSCIKCQl9Cgl9Cn0KRU9GCgpta2RpciAtcCAvZXRjL2NvbnRhaW5lcnMvCnRvdWNoIC9ldGMvY29udGFpbmVycy9ub2RvY2tlcgoKZG9ja2VyIHB1bGwgIiRQUk9YWUlNQUdFIgoKbWtkaXIgL2V0Yy9wcm94eQpiYXNlNjQgLWQgPDw8IiRQUk9YWUNFUlQiID4vZXRjL3Byb3h5L3Byb3h5LmNydApiYXNlNjQgLWQgPDw8IiRQUk9YWUtFWSIgPi9ldGMvcHJveHkvcHJveHkua2V5CmJhc2U2NCAtZCA8PDwiJFBST1hZQ0xJRU5UQ0VSVCIgPi9ldGMvcHJveHkvcHJveHktY2xpZW50LmNydApjaG93biAtUiAxMDAwOjEwMDAgL2V0Yy9wcm94eQpjaG1vZCAwNjAwIC9ldGMvcHJveHkvcHJveHkua2V5CgpjYXQgPi9ldGMvc3lzY29uZmlnL3Byb3h5IDw8RU9GClBST1hZX0lNQUdFPSckUFJPWFlJTUFHRScKRU9GCgpjYXQgPi9ldGMvc3lzdGVtZC9zeXN0ZW0vcHJveHkuc2VydmljZSA8PCdFT0YnCltVbml0XQpBZnRlcj1uZXR3b3JrLW9ubGluZS50YXJnZXQKV2FudHM9bmV0d29yay1vbmxpbmUudGFyZ2V0CgpbU2VydmljZV0KRW52aXJvbm1lbnRGaWxlPS9ldGMvc3lzY29uZmlnL3Byb3h5CkV4ZWNTdGFydFByZT0tL3Vzci9iaW4vZG9ja2VyIHJtIC1mICVuCkV4ZWNTdGFydD0vdXNyL2Jpbi9kb2NrZXIgcnVuIC0tcm0gLS1uYW1lICVuIC1wIDQ0Mzo4NDQzIC12IC9ldGMvcHJveHk6L3NlY3JldHMgJFBST1hZX0lNQUdFCkV4ZWNTdG9wPS91c3IvYmluL2RvY2tlciBzdG9wICVuClJlc3RhcnQ9YWx3YXlzClJlc3RhcnRTZWM9MQpTdGFydExpbWl0SW50ZXJ2YWw9MAoKW0luc3RhbGxdCldhbnRlZEJ5PW11bHRpLXVzZXIudGFyZ2V0CkVPRgoKc3lzdGVtY3RsIGVuYWJsZSBwcm94eS5zZXJ2aWNlCgpjYXQgPi9ldGMvY3Jvbi53ZWVrbHkvcHVsbC1pbWFnZSA8PCdFT0YnCiMhL2Jpbi9iYXNoCgpkb2NrZXIgcHVsbCAkUFJPWFlJTUFHRQpzeXN0ZW1jdGwgcmVzdGFydCBwcm94eS5zZXJ2aWNlCkVPRgpjaG1vZCAreCAvZXRjL2Nyb24ud2Vla2x5L3B1bGwtaW1hZ2UKCmNhdCA+L2V0Yy9jcm9uLndlZWtseS95dW11cGRhdGUgPDwnRU9GJwojIS9iaW4vYmFzaAoKeXVtIHVwZGF0ZSAteQpFT0YKY2htb2QgK3ggL2V0Yy9jcm9uLndlZWtseS95dW11cGRhdGUKCmNhdCA+L2V0Yy9jcm9uLmRhaWx5L3Jlc3RhcnQtcHJveHkgPDwnRU9GJwojIS9iaW4vYmFzaAoKc3lzdGVtY3RsIHJlc3RhcnQgcHJveHkuc2VydmljZQpFT0YKY2htb2QgK3ggL2V0Yy9jcm9uLmRhaWx5L3Jlc3RhcnQtcHJveHkKCigKCXNsZWVwIDMwCglyZWJvb3QKKSAmCg==')))]" + "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'PROXYIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImage')),''')\n','PROXYIMAGEAUTH=$(base64 -d \u003c\u003c\u003c''',base64(parameters('proxyImageAuth')),''')\n','PROXYCERT=''',parameters('proxyCert'),'''\n','PROXYCLIENTCERT=''',parameters('proxyClientCert'),'''\n','PROXYKEY=''',parameters('proxyKey'),'''\n','\n',base64ToString('#!/bin/bash

set -o errexit \
    -o nounset

if [ "${DEBUG:-false}" == true ]; then
    set -x
fi

main() {
    parse_run_options "$@"

    configure_and_install_dnf_pkgs_repos

    configure_firewalld_rules
    pull_container_images
    configure_system_services
    reboot_vm
}

usage() {
    local -n options="$1"
    log "$(basename "$0") [$options]
        -p Configure rpm repositories, import required rpm keys, update & install packages with dnf
        -f Configure firewalld default zone rules
        -u Configure systemd unit files for ARO RP
        -i Pull container images

        Note: steps will be executed in the order that flags are provided
    "
}

# parse_run_options takes all arguements passed to main and parses them
# allowing individual step(s) to be ran, rather than all steps
#
# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline
parse_run_options() {
    # shellcheck disable=SC2206
    local -a options=(${1:-})
    if [ "${#options[@]}" -eq 0 ]; then
        log "Running all steps"
        return 0
    fi

    local OPTIND
	local -r allowed_options="pfui"
    while getopts ${allowed_options} options; do
        case "${options}" in
            p)
                log "Running step configure_and_install_dnf_pkgs_repos"
                configure_and_install_dnf_pkgs_repos
                ;;
            f)
                log "Running configure_firewalld_rules"
                configure_firewalld_rules
                ;;
            u)
                log "Running pull_container_images & configure_system_services"
                configure_system_services
                ;;
            i)
                log "Running pull_container_images"
                pull_container_images 
                ;;
            *)
                usage allowed_options
                abort "Unkown option provided"
                ;;
        esac
    done
    
    exit 0
}

# configure_and_install_dnf_pkgs_repos
configure_and_install_dnf_pkgs_repos() {
    log "starting"

    # transaction attempt retry time in seconds
    local -ri retry_wait_time=60
    configure_rhui_repo retry_wait_time

    local -ar exclude_pkgs=(
        "-x WALinuxAgent"
        "-x WALinuxAgent-udev"
    )

    dnf_update_pkgs exclude_pkgs retry_wait_time

    local -ra repo_rpm_pkgs=(
        https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm
    )

    local -ra install_pkgs=(
        podman
        podman-docker
    )

    dnf_install_pkgs repo_rpm_pkgs retry_wait_time
    dnf_install_pkgs install_pkgs retry_wait_time

	local -r cron_weekly_dnf_update_filename='/etc/cron.weekly/dnfupdate'
	local -r cron_weekly_dnf_update_file="#!/bin/bash
dnf update -y"

	write_file cron_weekly_dnf_update_filename cron_weekly_dnf_update_file true
	chmod +x "$cron_weekly_dnf_update_filename"
}

# configure_rhui_repo
configure_rhui_repo() {
    log "starting"

    local -ra cmd=(
        dnf
        update
        -y
        --disablerepo='*'
        --enablerepo='rhui-microsoft-azure*'
    )

    log "running RHUI package updates"
    retry cmd "$1"
}

# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks
retry() {
    local -n cmd_retry="$1"
    local -n wait_time="$2"

    for attempt in {1..5}; do
        log "attempt #${attempt} - ${FUNCNAME[2]}"
        ${cmd_retry[@]} &

        wait $! && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep "$wait_time"
        else
            abort "attempt #${attempt} - Failed to update packages"
        fi
    done
}

# dnf_update_pkgs
dnf_update_pkgs() {
    local -n excludes="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        ${excludes[@]}
        update
        --allowerasing
    )

    log "Updating all packages"
    retry cmd "$2"
}

# dnf_install_pkgs
dnf_install_pkgs() {
    local -n pkgs="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        install
        ${pkgs[@]}
    )

    log "Attempting to install packages: ${pkgs[*]}"
    retry cmd "$2"
}

# configure_logrotate clobbers /etc/logrotate.conf
configure_logrotate() {
    log "starting"

    local -r logrotate_conf_filename='/etc/logrotate.conf'
    local -r logrotate_conf_file='# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we will rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}'

    write_file logrotate_conf_filename logrotate_conf_file true
}

# configure_firewalld_rules
configure_firewalld_rules() {
    log "starting"

    # https://access.redhat.com/security/cve/cve-2020-13401
    local -r prefix="/etc/sysctl.d"
    local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf"
    local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0"

    write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true

    local -r disable_core_filename="$prefix/01-disable-core.conf"
    local -r disable_core_file="kernel.core_pattern = |/bin/true
    "
    write_file disable_core_filename disable_core_file true

    sysctl --system

    local -ra enable_ports=(
        "443/tcp"
    )

    log "Enabling ports ${enable_ports[*]} on default firewalld zone"
    # shellcheck disable=SC2068
    for port in ${enable_ports[@]}; do
        log "Enabling port $port now"
        firewall-cmd "--add-port=$port"
    done

    firewall-cmd --runtime-to-permanent
}

# pull_container_images
pull_container_images() {
    log "starting"

    # The managed identity that the VM runs as only has a single roleassignment.
    # This role assignment is ACRPull which is not necessarily present in the
    # subscription we're deploying into.  If the identity does not have any
    # role assignments scoped on the subscription we're deploying into, it will
    # not show on az login -i, which is why the below line is commented.
    # az account set -s "$SUBSCRIPTIONID"
    az login -i --allow-no-subscriptions

    # Suppress emulation output for podman instead of docker for az acr compatability
    mkdir -p /etc/containers/
    mkdir -p /root/.docker
    touch /etc/containers/nodocker

	# This name is used in the case that az acr login searches for this in it's environment
    local -r REGISTRY_AUTH_FILE="/root/.docker/config.json"
	local -r registry_config_file="{
	"auths": {
		\"${PROXYIMAGE%%/*}\": {
			\"auth\": \"$PROXYIMAGEAUTH\"
		}
	}"

	write_file REGISTRY_AUTH_FILE registry_config_file true

    log "logging into prod acr"

    az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

    docker pull "$PROXYIMAGE"

    az logout
}

# configure_system_services creates, configures, and enables the following systemd services and timers
# services
#	proxy
configure_system_services() {
	configure_service_proxy
}

# enable_aro_services enables all services required for aro rp
enable_aro_services() {
    log "starting"

    local -ra aro_services=(
		proxy
    )
    log "enabling aro services ${aro_services[*]}"
    # shellcheck disable=SC2068
    for service in ${aro_services[@]}; do
        log "Enabling $service now"
        systemctl enable "$service.service"
    done
}

# configure_certs
configure_certs() {
    log "starting"

	base64 -d <<<"$PROXYCERT" >/etc/proxy/proxy.crt
	base64 -d <<<"$PROXYKEY" >/etc/proxy/proxy.key
	base64 -d <<<"$PROXYCLIENTCERT" >/etc/proxy/proxy-client.crt
	chown -R 1000:1000 /etc/proxy
	chmod 0600 /etc/proxy/proxy.key
}

configure_service_proxy() {
	local -r sysconfig_proxy_filename='/etc/sysconfig/proxy'
	local -r sysconfig_proxy_file="PROXY_IMAGE='$PROXYIMAGE'"

	write_file sysconfig_proxy_filename sysconfig_proxy_file true

	local -r proxy_service_filename='/etc/systemd/system/proxy.service'
	local -r proxy_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/proxy
ExecStartPre=-/usr/bin/docker rm -f %n
ExecStart=/usr/bin/docker run --rm --name %n -p 443:8443 -v /etc/proxy:/secrets $PROXY_IMAGE
ExecStop=/usr/bin/docker stop %n
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

	local -r cron_weekly_pull_image_filename='/etc/cron.weekly/pull-image'
	local -r cron_weekly_pull_image_file="#!/bin/bash
docker pull $PROXYIMAGE
systemctl restart proxy.service"
	
	write_file cron_weekly_pull_image_filename cron_weekly_pull_image_file true
	chmod +x "$cron_weekly_pull_image_filename"

	local -r cron_daily_restart_proxy_filename='/etc/cron.daily/restart-proxy'
	local -r cron_daily_restart_proxy_file="#!/bin/bash
systemctl restart proxy.service"
	
	write_file cron_daily_restart_proxy_filename cron_daily_restart_proxy_file
	chmod +x "$cron_daily_restart_proxy_filename"
}

# write_file
# Args
# 1) filename - string
# 2) file_contents - string
# 3) clobber - boolean; optional - defaults to false
write_file() {
    local -n filename="$1"
    local -n file_contents="$2"
    local -r clobber="${3:-false}"

    if $clobber; then
        log "Overwriting file $filename"
        echo "$file_contents" > "$filename"
    else
        log "Appending to $filename"
        echo "$file_contents" >> "$filename"
    fi
}

# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots
reboot_vm() {
    log "starting"

    configure_selinux "true"
    (sleep 30 && log "rebooting vm now"; reboot) &
}

# log is a wrapper for echo that includes the function name
log() {
    local -r msg="${1:-"log message is empty"}"
    local -r stack_level="${2:-1}"
    echo "${FUNCNAME[${stack_level}]}: ${msg}"
}

# abort is a wrapper for log that exits with an error code
abort() {
    local -ri origin_stacklevel=2
    log "${1}" "$origin_stacklevel"
    log "Exiting"
    exit 1
}

export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}"

main "$@"
')))]" }, "provisionAfterExtensions": [ "Microsoft.Azure.Monitor.AzureMonitorLinuxAgent", diff --git a/pkg/deploy/assets/gateway-production.json b/pkg/deploy/assets/gateway-production.json index 1a3296cd889..ecbbe148c12 100644 --- a/pkg/deploy/assets/gateway-production.json +++ b/pkg/deploy/assets/gateway-production.json @@ -309,7 +309,7 @@ "autoUpgradeMinorVersion": true, "settings": {}, "protectedSettings": { - "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','DBTOKENURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenUrl')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','GATEWAYMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayMdsdConfigVersion')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayFeatures')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

echo "setting ssh password authentication"
# We need to manually set PasswordAuthentication to true in order for the VMSS Access JIT to work
sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config
systemctl reload sshd.service

#Adding retry logic to yum commands in order to avoid stalling out on resource locks
echo "running RHUI fix"
for attempt in {1..5}; do
  yum update -y --disablerepo='*' --enablerepo='rhui-microsoft-azure*' && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "running yum update"
for attempt in {1..5}; do
  yum -y -x WALinuxAgent -x WALinuxAgent-udev update --allowerasing && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "extending partition table"
# Linux block devices are inconsistently named
# it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
growpart "$physical_disk" 2

echo "extending filesystems"
lvextend -l +20%FREE /dev/rootvg/rootlv
xfs_growfs /

lvextend -l +100%FREE /dev/rootvg/varlv
xfs_growfs /var

rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
rpm --import https://packages.microsoft.com/keys/microsoft.asc

for attempt in {1..5}; do
  yum -y install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "configuring logrotate"

# gateway_logdir is a readonly variable that specifies the host path mount point for the gateway container log file
# for the purpose of rotating the gateway logs
declare -r gateway_logdir='/var/log/aro-gateway'

cat >/etc/logrotate.conf <<EOF
# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we'll rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}

# Maximum log directory size is 100G with this configuration
# Setting limit to 100G to allow space for other logging services
# copytruncate is a critical option used to prevent logs from being shipped twice
${gateway_logdir} {
    size 20G
    rotate 5
    create 0600 root root
    copytruncate
    noolddir
    compress
}
EOF

echo "configuring yum repository and running yum update"
cat >/etc/yum.repos.d/azure.repo <<'EOF'
[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no
EOF

semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?"
mkdir -p /var/log/journal

for attempt in {1..5}; do
  yum -y install clamav azsec-clamav azsec-monitor azure-cli azure-mdsd azure-security podman-docker openssl-perl python3 && break
  # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "applying firewall rules"
# https://access.redhat.com/security/cve/cve-2020-13401
cat >/etc/sysctl.d/02-disable-accept-ra.conf <<'EOF'
net.ipv6.conf.all.accept_ra=0
EOF

cat >/etc/sysctl.d/01-disable-core.conf <<'EOF'
kernel.core_pattern = |/bin/true
EOF
sysctl --system

firewall-cmd --add-port=80/tcp --permanent
firewall-cmd --add-port=8081/tcp --permanent
firewall-cmd --add-port=443/tcp --permanent

echo "logging into prod acr"
export AZURE_CLOUD_NAME=$AZURECLOUDNAME
az login -i --allow-no-subscriptions

# The managed identity that the VM runs as only has a single roleassignment.
# This role assignment is ACRPull which is not necessarily present in the
# subscription we're deploying into.  If the identity does not have any
# role assignments scoped on the subscription we're deploying into, it will
# not show on az login -i, which is why the below line is commented.
# az account set -s "$SUBSCRIPTIONID"

# Suppress emulation output for podman instead of docker for az acr compatability
mkdir -p /etc/containers/
touch /etc/containers/nodocker

mkdir -p /root/.docker
REGISTRY_AUTH_FILE=/root/.docker/config.json az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
docker pull "$MDMIMAGE"
docker pull "$RPIMAGE"
docker pull "$FLUENTBITIMAGE"

az logout

echo "configuring fluentbit service"
mkdir -p /etc/fluentbit/
mkdir -p /var/lib/fluent

cat >/etc/fluentbit/fluentbit.conf <<'EOF'
[INPUT]
	Name systemd
	Tag journald
	Systemd_Filter _COMM=aro
	DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[OUTPUT]
	Name forward
	Match *
	Port 29230
EOF

echo "FLUENTBITIMAGE=$FLUENTBITIMAGE" >/etc/sysconfig/fluentbit

cat >/etc/systemd/system/fluentbit.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring mdm service"
cat >/etc/sysconfig/mdm <<EOF
MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=gateway
MDMSOURCEROLEINSTANCE='$(hostname)'
EOF

mkdir /var/etw
cat >/etc/systemd/system/mdm.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring aro-gateway service"
cat >/etc/sysconfig/aro-gateway <<EOF
ACR_RESOURCE_ID='$ACRRESOURCEID'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
DBTOKEN_URL='$DBTOKENURL'
MDM_ACCOUNT="$RPMDMACCOUNT"
MDM_NAMESPACE=Gateway
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_FEATURES='$GATEWAYFEATURES'
RPIMAGE='$RPIMAGE'
EOF

cat >/etc/systemd/system/aro-gateway.service <<EOF
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-gateway
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStartPre=/usr/bin/mkdir -p ${gateway_logdir}
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e DBTOKEN_URL \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_FEATURES \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 80:8080 \
  -p 8081:8081 \
  -p 443:8443 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  -v ${gateway_logdir}:/ctr.log:z \
  \$RPIMAGE \
  gateway
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent

mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

echo "configuring mdsd and mdm services"
for var in "mdsd" "mdm"; do
cat >/etc/systemd/system/download-$var-credentials.service <<EOF
[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var
EOF

cat >/etc/systemd/system/download-$var-credentials.timer <<EOF
[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target
EOF
done

cat >/usr/local/bin/download-credentials.sh <<EOF
#!/bin/bash
set -eu

COMPONENT="\$1"
echo "Download \$COMPONENT credentials"

TEMP_DIR=\$(mktemp -d)
export AZURE_CONFIG_DIR=\$(mktemp -d)

echo "Logging into Azure..."
RETRIES=3
while [ "\$RETRIES" -gt 0 ]; do
    if az login -i --allow-no-subscriptions
    then
        echo "az login successful"
        break
    else
        echo "az login failed. Retrying..."
        let RETRIES-=1
        sleep 5
    fi
done

trap "cleanup" EXIT

cleanup() {
  az logout
  [[ "\$TEMP_DIR" =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ "\$AZURE_CONFIG_DIR" =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [ "\$COMPONENT" = "mdm" ]; then
  CURRENT_CERT_FILE="/etc/mdm.pem"
elif [ "\$COMPONENT" = "mdsd" ]; then
  CURRENT_CERT_FILE="/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME="gwy-\${COMPONENT}"
NEW_CERT_FILE="\$TEMP_DIR/\$COMPONENT.pem"
for attempt in {1..5}; do
  az keyvault secret download --file \$NEW_CERT_FILE --id "https://$KEYVAULTPREFIX-gwy.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME" && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [ "\$COMPONENT" = "mdsd" ]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn="\$(openssl x509 -in "\$NEW_CERT_FILE" -noout -serial | awk -F= '{print \$2}')"
  current_cert_sn="\$(openssl x509 -in "\$CURRENT_CERT_FILE" -noout -serial | awk -F= '{print \$2}')"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != "\$current_cert_sn" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi
EOF

chmod u+x /usr/local/bin/download-credentials.sh

systemctl enable download-mdsd-credentials.timer
systemctl enable download-mdm-credentials.timer

/usr/local/bin/download-credentials.sh mdsd
/usr/local/bin/download-credentials.sh mdm
MDSDCERTIFICATESAN=$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')

cat >/etc/systemd/system/watch-mdm-credentials.service <<EOF
[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target
EOF

cat >/etc/systemd/system/watch-mdm-credentials.path <<EOF
[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target
EOF

systemctl enable watch-mdm-credentials.path
systemctl start watch-mdm-credentials.path

mkdir /etc/systemd/system/mdsd.service.d
cat >/etc/systemd/system/mdsd.service.d/override.conf <<'EOF'
[Unit]
After=network-online.target
EOF

cat >/etc/default/mdsd <<EOF
MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS="-A -d -r \$MDSD_ROLE_PREFIX"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$GATEWAYMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=gateway
export MONITORING_ROLE_INSTANCE='$(hostname)'

export MDSD_MSGPACK_SORT_COLUMNS=1
EOF

# setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
# to honour SSL_CERT_FILE any more, heaven only knows why.
mkdir -p /usr/lib/ssl/certs
csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 {*} >/dev/null
c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
cat >/etc/default/vsa-nodescan-agent.config <<EOF
{
    "Nice": 19,
    "Timeout": 10800,
    "ClientId": "",
    "TenantId": "$AZURESECPACKVSATENANTID",
    "QualysStoreBaseUrl": "$AZURESECPACKQUALYSURL",
    "ProcessTimeout": 300,
    "CommandDelay": 0
  }
EOF

echo "enabling aro services"
for service in aro-gateway auoms azsecd azsecmond mdsd mdm chronyd fluentbit; do
  systemctl enable $service.service
done

for scan in baseline clamav software; do
  /usr/local/bin/azsecd config -s $scan -d P1D
done

echo "rebooting"
restorecon -RF /var/log/*
(sleep 30; reboot) &
')))]" + "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','DBTOKENURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenUrl')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','GATEWAYMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayMdsdConfigVersion')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayFeatures')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

set -o errexit \
    -o nounset

if [ "${DEBUG:-false}" == true ]; then
    set -x
fi

main() {
    local -r gateway_logdir='/var/log/aro-gateway'
    parse_run_options "$@" gateway_logdir


    configure_sshd
    configure_and_install_dnf_pkgs_repos
    configure_disk_partitions
    configure_logrotate gateway_logdir
    configure_selinux

    mkdir -p /var/log/journal
    mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

    configure_firewalld_rules
    pull_container_images
    configure_system_services gateway_logdir
    reboot_vm
}

usage() {
    local -n options="$1"
    log "$(basename "$0") [$options]
        -d Configure Disk Partitions
        -p Configure rpm repositories, import required rpm keys, update & install packages with dnf
        -l Configure logrotate.conf
        -s Make selinux modifications required for ARO RP
        -r Configure sshd - Allow password authenticaiton
        -f Configure firewalld default zone rules
        -u Configure systemd unit files for ARO RP
        -i Pull container images

        Note: steps will be executed in the order that flags are provided
    "
}

# parse_run_options takes all arguements passed to main and parses them
# allowing individual step(s) to be ran, rather than all steps
#
# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline
parse_run_options() {
    # shellcheck disable=SC2206
    local -a options=(${1:-})
    if [ "${#options[@]}" -eq 0 ]; then
        log "Running all steps"
        return 0
    fi

    local OPTIND
    local -r allowed_options="dplsrfui"
    while getopts ${allowed_options} options; do
        case "${options}" in
            d)
                log "Running step configure_disk_partitions"
                configure_disk_partitions
                ;;
            p)
                log "Running step configure_and_install_dnf_pkgs_repos"
                configure_and_install_dnf_pkgs_repos
                ;;
            l)
                log "Running configure_logrotate"
                configure_logrotate "$2"
                ;;
            s)
                log "Running configure_selinux"
                configure_selinux
                ;;
            r)
                log "Running configure_sshd"
                configure_sshd
                ;;
            f)
                log "Running configure_firewalld_rules"
                configure_firewalld_rules
                ;;
            u)
                log "Running pull_container_images & configure_system_services"
                configure_system_services "$2"
                ;;
            i)
                log "Running pull_container_images"
                pull_container_images 
                ;;
            *)
                usage allowed_options
                abort "Unkown option provided"
                ;;
        esac
    done
    
    exit 0
}

# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work
configure_sshd() {
    log "starting"
    log "setting ssh password authentication"
    sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config

    systemctl reload sshd.service
    systemctl is-active --quiet sshd || abort "sshd failed to reload"
}

# configure_and_install_dnf_pkgs_repos
configure_and_install_dnf_pkgs_repos() {
    log "starting"

    # transaction attempt retry time in seconds
    local -ri retry_wait_time=60
    configure_rhui_repo retry_wait_time
    create_azure_rpm_repos retry_wait_time

    local -ar exclude_pkgs=(
        "-x WALinuxAgent"
        "-x WALinuxAgent-udev"
    )

    dnf_update_pkgs exclude_pkgs retry_wait_time

    local -ra rpm_keys=(
        https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
        https://packages.microsoft.com/keys/microsoft.asc
    )

    rpm_import_keys rpm_keys retry_wait_time

    local -ra repo_rpm_pkgs=(
        https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm
    )

    local -ra install_pkgs=(
        clamav
        azsec-clamav
        azsec-monitor
        azure-cli
        azure-mdsd
        azure-security
        podman
        podman-docker
        openssl-perl
        # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
        python3
    )

    dnf_install_pkgs repo_rpm_pkgs retry_wait_time
    dnf_install_pkgs install_pkgs retry_wait_time
}

# configure_rhui_repo
configure_rhui_repo() {
    log "starting"

    local -ra cmd=(
        dnf
        update
        -y
        --disablerepo='*'
        --enablerepo='rhui-microsoft-azure*'
    )

    log "running RHUI package updates"
    retry cmd "$1"
}

# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks
retry() {
    local -n cmd_retry="$1"
    local -n wait_time="$2"

    for attempt in {1..5}; do
        log "attempt #${attempt} - ${FUNCNAME[2]}"
        ${cmd_retry[@]} &

        wait $! && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep "$wait_time"
        else
            abort "attempt #${attempt} - Failed to update packages"
        fi
    done
}

# dnf_update_pkgs
dnf_update_pkgs() {
    local -n excludes="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        ${excludes[@]}
        update
        --allowerasing
    )

    log "Updating all packages"
    retry cmd "$2"
}

# dnf_install_pkgs
dnf_install_pkgs() {
    local -n pkgs="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        install
        ${pkgs[@]}
    )

    log "Attempting to install packages: ${pkgs[*]}"
    retry cmd "$2"
}

# rpm_import_keys
rpm_import_keys() {
    local -n keys="$1"
    log "starting"


    # shellcheck disable=SC2068
    for key in ${keys[@]}; do
        if [ ${#keys[@]} -eq 0 ]; then
            break
        fi
            local -a cmd=(
                rpm
                --import
                -v
                "$key"
            )

            log "attempt #$attempt - importing rpm repository key $key"
            retry cmd "$2" && unset key
    done
}

# configure_disk_partitions
configure_disk_partitions() {
    log "starting"
    log "extending partition table"

    # Linux block devices are inconsistently named
    # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
    physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
    growpart "$physical_disk" 2

    log "extending filesystems"
    log "extending root lvm"
    lvextend -l +20%FREE /dev/rootvg/rootlv
    log "growing root filesystem"
    xfs_growfs /

    log "extending var lvm"
    lvextend -l +100%FREE /dev/rootvg/varlv
    log "growing var filesystem"
    xfs_growfs /var
}

# configure_logrotate clobbers /etc/logrotate.conf
configure_logrotate() {
    local -n log_dir="$1"
    log "starting"

    local -r logrotate_conf_filename='/etc/logrotate.conf'
    local -r logrotate_conf_file="# see 'man logrotate' for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we will rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}

# Maximum log directory size is 100G with this configuration
# Setting limit to 100G to allow space for other logging services
# copytruncate is a critical option used to prevent logs from being shipped twice
${log_dir} {
    size 20G
    rotate 5
    create 0600 root root
    copytruncate
    noolddir
    compress
}"

    write_file logrotate_conf_filename logrotate_conf_file true
}

# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file
create_azure_rpm_repos() {
    log "starting"

    local -r azure_repo_filename='/etc/yum.repos.d/azure.repo'
    local -r azure_repo_file='[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no'

    write_file azure_repo_filename azure_repo_file true
}

# configure_selinux
configure_selinux() {
    log "starting"

    local -r relabel="${1:-false}"

    already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined"
    semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error"
    chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent

    if "$relabel"; then
        restorecon -RF /var/log/* || log "$already_defined_ignore_error"
    fi
}

# configure_firewalld_rules
configure_firewalld_rules() {
    log "starting"

    # https://access.redhat.com/security/cve/cve-2020-13401
    local -r prefix="/etc/sysctl.d"
    local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf"
    local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0"

    write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true

    local -r disable_core_filename="$prefix/01-disable-core.conf"
    local -r disable_core_file="kernel.core_pattern = |/bin/true
    "
    write_file disable_core_filename disable_core_file true

    sysctl --system

    local -ra enable_ports=(
        "80/tcp"
        "8081/tcp"
        "443/tcp"
    )

    log "Enabling ports ${enable_ports[*]} on default firewalld zone"
    # shellcheck disable=SC2068
    for port in ${enable_ports[@]}; do
        log "Enabling port $port now"
        firewall-cmd "--add-port=$port"
    done

    firewall-cmd --runtime-to-permanent
}

# pull_container_images
pull_container_images() {
    log "starting"

    # The managed identity that the VM runs as only has a single roleassignment.
    # This role assignment is ACRPull which is not necessarily present in the
    # subscription we're deploying into.  If the identity does not have any
    # role assignments scoped on the subscription we're deploying into, it will
    # not show on az login -i, which is why the below line is commented.
    # az account set -s "$SUBSCRIPTIONID"
    az login -i --allow-no-subscriptions

    # Suppress emulation output for podman instead of docker for az acr compatability
    mkdir -p /etc/containers/
    mkdir -p /root/.docker
    touch /etc/containers/nodocker

	# This name is used in the case that az acr login searches for this in it's environment
    local -r REGISTRY_AUTH_FILE="/root/.docker/config.json"
    
    log "logging into prod acr"
    az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

    MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
    docker pull "$MDMIMAGE"
    docker pull "$RPIMAGE"
    docker pull "$FLUENTBITIMAGE"

    az logout
}

# configure_system_services creates, configures, and enables the following systemd services and timers
# services
#   fluentbit
#   mdm
#   mdsd
#   arp-rp
#   aro-dbtoken
#   aro-monitor
#   aro-portal
configure_system_services() {
    configure_service_fluentbit
    configure_service_mdm
    configure_timers_mdm_mdsd
    configure_service_aro_gateway "$1"
    configure_service_mdsd
}

# enable_aro_services enables all services required for aro rp
enable_aro_services() {
    log "starting"

    local -ra aro_services=(
      aro-gateway
      auoms
      azsecd
      azsecmond
      mdsd
      mdm
      chronyd
      fluentbit
    )
    log "enabling gateway services ${aro_services[*]}"
    # shellcheck disable=SC2068
    for service in ${aro_services[@]}; do
        log "Enabling $service now"
        systemctl enable "$service.service"
    done
}

# configure_service_fluentbit
configure_service_fluentbit() {
    log "starting"
    log "configuring fluentbit service"

    mkdir -p /etc/fluentbit/
    mkdir -p /var/lib/fluent

    local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf'
    local -r fluentbit_conf_file="[INPUT]
Name systemd
Tag journald
Systemd_Filter _COMM=aro
DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[OUTPUT]
	Name forward
	Match *
	Port 29230"

    write_file fluentbit_conf_filename fluentbit_conf_file true

    local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit'
    local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE"

    write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true

    local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service'

    local -r fluentbit_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file fluentbit_conf_filename fluentbit_conf_file true
}

# configure_certs
configure_certs() {
    log "starting"

    mkdir /etc/aro-rp
    base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem
    if [[ -n "$ARMAPICABUNDLE" ]]; then
    base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem
    fi
    chown -R 1000:1000 /etc/aro-rp

    # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
    # to honour SSL_CERT_FILE any more, heaven only knows why.
    mkdir -p /usr/lib/ssl/certs
    csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null
    c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
    local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config"
    local -r nodescan_agent_file="{
    \"Nice\": 19,
    \"Timeout\": 10800,
    \"ClientId\": \"\",
    \"TenantId\": $AZURESECPACKVSATENANTID,
    \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL,
    \"ProcessTimeout\": 300,
    \"CommandDelay\": 0
  }"

    write_file nodescan_agent_filename nodescan_agent_file true
}

# configure_service_mdm
configure_service_mdm() {
    log "starting"
    log "configuring mdm service"

    local -r sysconfig_mdm_filename="/etc/sysconfig/mdm"
    local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=gateway
MDMSOURCEROLEINSTANCE=\"$(hostname)\""

    write_file sysconfig_mdm_filename sysconfig_mdm_file true

    mkdir -p /var/etw
    local -r mdm_service_filename="/etc/systemd/system/mdm.service"
    local -r mdm_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file mdm_service_filename mdm_service_file true
}

# configure_timers_mdm_mdsd
configure_timers_mdm_mdsd() {
    log "starting"

    for var in "mdsd" "mdm"; do
        local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service"
        local download_creds_service_file="[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var"

        write_file download_creds_service_filename download_creds_service_file true

        local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer"
        local download_creds_timer_file="[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target"

        write_file download_creds_timer_filename download_creds_timer_file true
    done

    local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh"
    local -r download_creds_script_file="#!/bin/bash
set -eu

COMPONENT=\$1
echo \"Download \$COMPONENT credentials\"

TEMP_DIR=\"\$(mktemp -d)\"
export AZURE_CONFIG_DIR=\"\$(mktemp -d)\"

echo \"Logging into Azure...\"
RETRIES=3
while [[ \$RETRIES -gt 0 ]]; do
    if az login -i --allow-no-subscriptions
    then
        echo \"az login successful\"
        break
    else
        echo \"az login failed. Retrying...\"
        let RETRIES-=1
        sleep 5
    fi
done

trap \"cleanup\" EXIT

cleanup() {
  az logout
  [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [[ \$COMPONENT = \"mdm\" ]]; then
  CURRENT_CERT_FILE=\"/etc/mdm.pem\"
elif [[ \$COMPONENT\ = \"mdsd\" ]]; then
  CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME=\"gwy-\${COMPONENT}\"
NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\"
for attempt in {1..5}; do
  az keyvault \
    secret \
    download \
    --file \"\$NEW_CERT_FILE\" \
    --id \"https://$KEYVAULTPREFIX-gwy.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \
    && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [[ \$COMPONENT = \"mdsd\" ]]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi"

    write_file download_creds_script_filename download_creds_script_file true

    chmod u+x /usr/local/bin/download-credentials.sh

    systemctl enable download-mdsd-credentials.timer
    systemctl enable download-mdm-credentials.timer

    /usr/local/bin/download-credentials.sh mdsd
    /usr/local/bin/download-credentials.sh mdm

    local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')"
    local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service"
    local -r watch_mdm_creds_service_file="[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target"

    write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file true

    local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path'
    local -r watch_mdm_creds_path_file='[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target'

    write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file true

    local -r watch_mdm_creds='watch-mdm-credentials.path'
    systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds"
    systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds"
}

# configure_service_aro_rp
configure_service_aro_gateway() {
    local -n log_dir="$1"
    log "starting"

    local -r aro_gateway_conf_filename='/etc/sysconfig/aro-gateway'
    local -r aro_gateway_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID'
ADMIN_API_CLIENT_CERT_COMMON_NAME='$ADMINAPICLIENTCERTCOMMONNAME'
ARM_API_CLIENT_CERT_COMMON_NAME='$ARMAPICLIENTCERTCOMMONNAME'
AZURE_ARM_CLIENT_ID='$ARMCLIENTID'
AZURE_FP_CLIENT_ID='$FPCLIENTID'
AZURE_FP_SERVICE_PRINCIPAL_ID='$FPSERVICEPRINCIPALID'
BILLING_E2E_STORAGE_ACCOUNT_ID='$BILLINGE2ESTORAGEACCOUNTID'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=RP
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
DBTOKEN_URL='$DBTOKENURL'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Gateway
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_FEATURES='$GATEWAYFEATURES'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=RP
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
RP_FEATURES='$RPFEATURES'
RPIMAGE='$RPIMAGE'
ARO_INSTALL_VIA_HIVE='$CLUSTERSINSTALLVIAHIVE'
ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC='$CLUSTERDEFAULTINSTALLERPULLSPEC'
ARO_ADOPT_BY_HIVE='$CLUSTERSADOPTBYHIVE'
USE_CHECKACCESS='$USECHECKACCESS'"

    write_file aro_gateway_conf_filename aro_gateway_conf_file true

    local -r aro_gateway_service_filename='/etc/systemd/system/aro-gateway.service'

    local -r aro_gateway_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-gateway
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStartPre=/usr/bin/mkdir -p ${log_dir}
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e DBTOKEN_URL \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_FEATURES \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 80:8080 \
  -p 8081:8081 \
  -p 443:8443 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  -v ${log_dir}:/ctr.log:z \
  \$RPIMAGE \
  gateway
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
    "

    write_file aro_gateway_service_filename aro_gateway_service_file true
}

# configure_service_aro_dbtoken
configure_service_aro_dbtoken() {
    log "starting"

    local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken'
    local -r aro_dbtoken_service_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
DBTOKEN_URL='$DBTOKENURL'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Gateway
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_FEATURES='$GATEWAYFEATURES'
RPIMAGE='$RPIMAGE'"

    write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file true

    local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service'
    local -r aro_dbtoken_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-gateway
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStartPre=/usr/bin/mkdir -p ${gateway_logdir}
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e DBTOKEN_URL \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_FEATURES \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 80:8080 \
  -p 8081:8081 \
  -p 443:8443 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  -v ${gateway_logdir}:/ctr.log:z \
  \$RPIMAGE \
  gateway
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_dbtoken_service_filename aro_dbtoken_service_file true
}

# configure_service_mdsd
configure_service_mdsd() {
    log "starting"

    local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d"
    mkdir "$mdsd_service_dir"

    local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf"
    local -r mdsd_override_conf_file="[Unit]
After=network-online.target"

    write_file mdsd_override_conf_filename mdsd_override_conf_file true

    local -r default_mdsd_filename="/etc/default/mdsd"
    local -r default_mdsd_file="MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS=\"-A -d -r \$MDSD_ROLE_PREFIX\"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$GATEWAYMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=gateway
export MONITORING_ROLE_INSTANCE=\"$(hostname)\"

export MDSD_MSGPACK_SORT_COLUMNS=1\""

    write_file default_mdsd_filename default_mdsd_file true

}

# run_azsecd_config_scan
run_azsecd_config_scan() {
    log "starting"

    local -ar configs=(
        "baseline"
        "clamav"
        "software"
    )

    log "Scanning configuration files ${configs[*]}"
    # shellcheck disable=SC2068
    for scan in ${configs[@]}; do
        log "Scanning config file $scan now"
        /usr/local/bin/azsecd config -s "$scan" -d P1D
    done
}

# write_file
# Args
# 1) filename - string
# 2) file_contents - string
# 3) clobber - boolean; optional - defaults to false
write_file() {
    local -n filename="$1"
    local -n file_contents="$2"
    local -r clobber="${3:-false}"

    if $clobber; then
        log "Overwriting file $filename"
        echo "$file_contents" > "$filename"
    else
        log "Appending to $filename"
        echo "$file_contents" >> "$filename"
    fi
}

# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots
reboot_vm() {
    log "starting"

    configure_selinux "true"
    (sleep 30 && log "rebooting vm now"; reboot) &
}

# log is a wrapper for echo that includes the function name
log() {
    local -r msg="${1:-"log message is empty"}"
    local -r stack_level="${2:-1}"
    echo "${FUNCNAME[${stack_level}]}: ${msg}"
}

# abort is a wrapper for log that exits with an error code
abort() {
    local -ri origin_stacklevel=2
    log "${1}" "$origin_stacklevel"
    log "Exiting"
    exit 1
}

export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}"

main "$@"
')))]" } } } diff --git a/pkg/deploy/assets/rp-production.json b/pkg/deploy/assets/rp-production.json index 7b80cdb2236..99f72f4d6ff 100644 --- a/pkg/deploy/assets/rp-production.json +++ b/pkg/deploy/assets/rp-production.json @@ -516,7 +516,7 @@ "autoUpgradeMinorVersion": true, "settings": {}, "protectedSettings": { - "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','ADMINAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('adminApiClientCertCommonName')),''')\n','ARMAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armApiClientCertCommonName')),''')\n','ARMCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armClientId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','BILLINGE2ESTORAGEACCOUNTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('billingE2EStorageAccountId')),''')\n','CLUSTERMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdmAccount')),''')\n','CLUSTERMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdAccount')),''')\n','CLUSTERMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdConfigVersion')),''')\n','CLUSTERMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdNamespace')),''')\n','CLUSTERPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterParentDomainName')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','FPCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpClientId')),''')\n','FPSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpServicePrincipalId')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYRESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayResourceGroupName')),''')\n','GATEWAYSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayServicePrincipalId')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','PORTALACCESSGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalAccessGroupIds')),''')\n','PORTALCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalClientId')),''')\n','PORTALELEVATEDGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalElevatedGroupIds')),''')\n','RPFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpFeatures')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdConfigVersion')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','RPPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpParentDomainName')),''')\n','CLUSTERSINSTALLVIAHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersInstallViaHive')),''')\n','CLUSTERSADOPTBYHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersAdoptByHive')),''')\n','CLUSTERDEFAULTINSTALLERPULLSPEC=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterDefaultInstallerPullspec')),''')\n','USECHECKACCESS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('useCheckAccess')),''')\n','ADMINAPICABUNDLE=''',parameters('adminApiCaBundle'),'''\n','ARMAPICABUNDLE=''',parameters('armApiCaBundle'),'''\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

echo "setting ssh password authentication"
# We need to manually set PasswordAuthentication to true in order for the VMSS Access JIT to work
sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config
systemctl reload sshd.service

#Adding retry logic to yum commands in order to avoid stalling out on resource locks
echo "running RHUI fix"
for attempt in {1..5}; do
  yum update -y --disablerepo='*' --enablerepo='rhui-microsoft-azure*' && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "running yum update"
for attempt in {1..5}; do
  yum -y -x WALinuxAgent -x WALinuxAgent-udev update --allowerasing && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "extending partition table"
# Linux block devices are inconsistently named
# it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
physicalDisk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
growpart "$physicalDisk" 2

echo "extending filesystems"
lvextend -l +20%FREE /dev/rootvg/rootlv
xfs_growfs /

lvextend -l +100%FREE /dev/rootvg/varlv
xfs_growfs /var

echo "importing rpm repositories"
rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
rpm --import https://packages.microsoft.com/keys/microsoft.asc

for attempt in {1..5}; do
  yum -y install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm && break
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

echo "configuring logrotate"
cat >/etc/logrotate.conf <<'EOF'
# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we'll rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}
EOF

echo "configuring yum repository and running yum update"
cat >/etc/yum.repos.d/azure.repo <<'EOF'
[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no
EOF

semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?"
mkdir -p /var/log/journal

for attempt in {1..5}; do
yum -y install clamav azsec-clamav azsec-monitor azure-cli azure-mdsd azure-security podman podman-docker openssl-perl python3 && break
  # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
  if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi
done

# https://access.redhat.com/security/cve/cve-2020-13401
echo "applying firewall rules"
cat >/etc/sysctl.d/02-disable-accept-ra.conf <<'EOF'
net.ipv6.conf.all.accept_ra=0
EOF

cat >/etc/sysctl.d/01-disable-core.conf <<'EOF'
kernel.core_pattern = |/bin/true
EOF
sysctl --system

firewall-cmd --add-port=443/tcp --permanent
firewall-cmd --add-port=444/tcp --permanent
firewall-cmd --add-port=445/tcp --permanent
firewall-cmd --add-port=2222/tcp --permanent

export AZURE_CLOUD_NAME=$AZURECLOUDNAME

echo "logging into prod acr"
az login -i --allow-no-subscriptions

# Suppress emulation output for podman instead of docker for az acr compatability
mkdir -p /etc/containers/
touch /etc/containers/nodocker

mkdir -p /root/.docker
REGISTRY_AUTH_FILE=/root/.docker/config.json az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
docker pull "$MDMIMAGE"
docker pull "$RPIMAGE"
docker pull "$FLUENTBITIMAGE"

az logout

echo "configuring fluentbit service"
mkdir -p /etc/fluentbit/
mkdir -p /var/lib/fluent

cat >/etc/fluentbit/fluentbit.conf <<'EOF'
[INPUT]
	Name systemd
	Tag journald
	Systemd_Filter _COMM=aro
	DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND asyncqos asyncqos true

[FILTER]
	Name modify
	Match asyncqos
	Remove CLIENT_PRINCIPAL_NAME
	Remove FILE
	Remove COMPONENT

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND ifxaudit ifxaudit false

[OUTPUT]
	Name forward
	Match *
	Port 29230
EOF

echo "FLUENTBITIMAGE=$FLUENTBITIMAGE" >/etc/sysconfig/fluentbit

cat >/etc/systemd/system/fluentbit.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

mkdir /etc/aro-rp
base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem
if [[ -n "$ARMAPICABUNDLE" ]]; then
  base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem
fi
chown -R 1000:1000 /etc/aro-rp

echo "configuring mdm service"
cat >/etc/sysconfig/mdm <<EOF
MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=rp
MDMSOURCEROLEINSTANCE='$(hostname)'
EOF

mkdir /var/etw
cat >/etc/systemd/system/mdm.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring aro-rp service"
cat >/etc/sysconfig/aro-rp <<EOF
ACR_RESOURCE_ID='$ACRRESOURCEID'
ADMIN_API_CLIENT_CERT_COMMON_NAME='$ADMINAPICLIENTCERTCOMMONNAME'
ARM_API_CLIENT_CERT_COMMON_NAME='$ARMAPICLIENTCERTCOMMONNAME'
AZURE_ARM_CLIENT_ID='$ARMCLIENTID'
AZURE_FP_CLIENT_ID='$FPCLIENTID'
AZURE_FP_SERVICE_PRINCIPAL_ID='$FPSERVICEPRINCIPALID'
BILLING_E2E_STORAGE_ACCOUNT_ID='$BILLINGE2ESTORAGEACCOUNTID'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=RP
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=RP
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
RP_FEATURES='$RPFEATURES'
RPIMAGE='$RPIMAGE'
ARO_INSTALL_VIA_HIVE='$CLUSTERSINSTALLVIAHIVE'
ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC='$CLUSTERDEFAULTINSTALLERPULLSPEC'
ARO_ADOPT_BY_HIVE='$CLUSTERSADOPTBYHIVE'
USE_CHECKACCESS='$USECHECKACCESS'
EOF

cat >/etc/systemd/system/aro-rp.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-rp
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e ADMIN_API_CLIENT_CERT_COMMON_NAME \
  -e ARM_API_CLIENT_CERT_COMMON_NAME \
  -e AZURE_ARM_CLIENT_ID \
  -e AZURE_FP_CLIENT_ID \
  -e BILLING_E2E_STORAGE_ACCOUNT_ID \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e CLUSTER_MDSD_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e DOMAIN_NAME \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e MDSD_ENVIRONMENT \
  -e RP_FEATURES \
  -e ARO_INSTALL_VIA_HIVE \
  -e ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC \
  -e ARO_ADOPT_BY_HIVE \
  -e USE_CHECKACCESS \
  -m 2g \
  -p 443:8443 \
  -v /etc/aro-rp:/etc/aro-rp \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  rp
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring aro-dbtoken service"
cat >/etc/sysconfig/aro-dbtoken <<EOF
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=DBToken
RPIMAGE='$RPIMAGE'
EOF

cat >/etc/systemd/system/aro-dbtoken.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-dbtoken
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 445:8445 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  dbtoken
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

# DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE
# are not used, but can't easily be refactored out. Should be revisited in the future.
echo "configuring aro-monitor service"
cat >/etc/sysconfig/aro-monitor <<EOF
AZURE_FP_CLIENT_ID='$FPCLIENTID'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=BBM
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=BBM
RPIMAGE='$RPIMAGE'
EOF

cat >/etc/systemd/system/aro-monitor.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-monitor
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_FP_CLIENT_ID \
  -e DOMAIN_NAME \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e MDSD_ENVIRONMENT \
  -e CLUSTER_MDSD_NAMESPACE \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2.5g \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  monitor
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target
EOF

echo "configuring aro-portal service"
cat >/etc/sysconfig/aro-portal <<EOF
AZURE_PORTAL_ACCESS_GROUP_IDS='$PORTALACCESSGROUPIDS'
AZURE_PORTAL_CLIENT_ID='$PORTALCLIENTID'
AZURE_PORTAL_ELEVATED_GROUP_IDS='$PORTALELEVATEDGROUPIDS'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Portal
PORTAL_HOSTNAME='$LOCATION.admin.$RPPARENTDOMAINNAME'
RPIMAGE='$RPIMAGE'
EOF

cat >/etc/systemd/system/aro-portal.service <<'EOF'
[Unit]
After=network-online.target
Wants=network-online.target
StartLimitInterval=0

[Service]
EnvironmentFile=/etc/sysconfig/aro-portal
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_PORTAL_ACCESS_GROUP_IDS \
  -e AZURE_PORTAL_CLIENT_ID \
  -e AZURE_PORTAL_ELEVATED_GROUP_IDS \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e PORTAL_HOSTNAME \
  -m 2g \
  -p 444:8444 \
  -p 2222:2222 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  portal
Restart=always
RestartSec=1

[Install]
WantedBy=multi-user.target
EOF

echo "configuring mdsd and mdm services"
chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent

mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

for var in "mdsd" "mdm"; do
cat >/etc/systemd/system/download-$var-credentials.service <<EOF
[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var
EOF

cat >/etc/systemd/system/download-$var-credentials.timer <<EOF
[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target
EOF
done

cat >/usr/local/bin/download-credentials.sh <<EOF
#!/bin/bash
set -eu

COMPONENT="\$1"
echo "Download \$COMPONENT credentials"

TEMP_DIR=\$(mktemp -d)
export AZURE_CONFIG_DIR=\$(mktemp -d)

echo "Logging into Azure..."
RETRIES=3
while [ "\$RETRIES" -gt 0 ]; do
    if az login -i --allow-no-subscriptions
    then
        echo "az login successful"
        break
    else
        echo "az login failed. Retrying..."
        let RETRIES-=1
        sleep 5
    fi
done

trap "cleanup" EXIT

cleanup() {
  az logout
  [[ "\$TEMP_DIR" =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ "\$AZURE_CONFIG_DIR" =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [ "\$COMPONENT" = "mdm" ]; then
  CURRENT_CERT_FILE="/etc/mdm.pem"
elif [ "\$COMPONENT" = "mdsd" ]; then
  CURRENT_CERT_FILE="/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME="rp-\${COMPONENT}"
NEW_CERT_FILE="\$TEMP_DIR/\$COMPONENT.pem"
for attempt in {1..5}; do
  az keyvault secret download --file \$NEW_CERT_FILE --id "https://$KEYVAULTPREFIX-svc.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME" && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [ "\$COMPONENT" = "mdsd" ]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn="\$(openssl x509 -in "\$NEW_CERT_FILE" -noout -serial | awk -F= '{print \$2}')"
  current_cert_sn="\$(openssl x509 -in "\$CURRENT_CERT_FILE" -noout -serial | awk -F= '{print \$2}')"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != "\$current_cert_sn" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi
EOF

chmod u+x /usr/local/bin/download-credentials.sh

systemctl enable download-mdsd-credentials.timer
systemctl enable download-mdm-credentials.timer

/usr/local/bin/download-credentials.sh mdsd
/usr/local/bin/download-credentials.sh mdm
MDSDCERTIFICATESAN=$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')

cat >/etc/systemd/system/watch-mdm-credentials.service <<EOF
[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target
EOF

cat >/etc/systemd/system/watch-mdm-credentials.path <<EOF
[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target
EOF

systemctl enable watch-mdm-credentials.path
systemctl start watch-mdm-credentials.path

mkdir /etc/systemd/system/mdsd.service.d
cat >/etc/systemd/system/mdsd.service.d/override.conf <<'EOF'
[Unit]
After=network-online.target
EOF

cat >/etc/default/mdsd <<EOF
MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS="-A -d -r \$MDSD_ROLE_PREFIX"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$RPMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=rp
export MONITORING_ROLE_INSTANCE='$(hostname)'

export MDSD_MSGPACK_SORT_COLUMNS=1
EOF

# setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
# to honour SSL_CERT_FILE any more, heaven only knows why.
mkdir -p /usr/lib/ssl/certs
csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 {*} >/dev/null
c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
cat >/etc/default/vsa-nodescan-agent.config <<EOF
{
    "Nice": 19,
    "Timeout": 10800,
    "ClientId": "",
    "TenantId": "$AZURESECPACKVSATENANTID",
    "QualysStoreBaseUrl": "$AZURESECPACKQUALYSURL",
    "ProcessTimeout": 300,
    "CommandDelay": 0
  }
EOF

echo "enabling aro services"
for service in aro-dbtoken aro-monitor aro-portal aro-rp auoms azsecd azsecmond mdsd mdm chronyd fluentbit; do
  systemctl enable $service.service
done

for scan in baseline clamav software; do
  /usr/local/bin/azsecd config -s $scan -d P1D
done

echo "rebooting"
restorecon -RF /var/log/*
(sleep 30; reboot) &
')))]" + "script": "[base64(concat(base64ToString('c2V0IC1leAoK'),'ACRRESOURCEID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('acrResourceId')),''')\n','ADMINAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('adminApiClientCertCommonName')),''')\n','ARMAPICLIENTCERTCOMMONNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armApiClientCertCommonName')),''')\n','ARMCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('armClientId')),''')\n','AZURECLOUDNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureCloudName')),''')\n','AZURESECPACKQUALYSURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackQualysUrl')),''')\n','AZURESECPACKVSATENANTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('azureSecPackVSATenantId')),''')\n','BILLINGE2ESTORAGEACCOUNTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('billingE2EStorageAccountId')),''')\n','CLUSTERMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdmAccount')),''')\n','CLUSTERMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdAccount')),''')\n','CLUSTERMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdConfigVersion')),''')\n','CLUSTERMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterMdsdNamespace')),''')\n','CLUSTERPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterParentDomainName')),''')\n','DATABASEACCOUNTNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('databaseAccountName')),''')\n','DBTOKENCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('dbtokenClientId')),''')\n','FLUENTBITIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fluentbitImage')),''')\n','FPCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpClientId')),''')\n','FPSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('fpServicePrincipalId')),''')\n','GATEWAYDOMAINS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayDomains')),''')\n','GATEWAYRESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayResourceGroupName')),''')\n','GATEWAYSERVICEPRINCIPALID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('gatewayServicePrincipalId')),''')\n','KEYVAULTDNSSUFFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultDNSSuffix')),''')\n','KEYVAULTPREFIX=$(base64 -d \u003c\u003c\u003c''',base64(parameters('keyvaultPrefix')),''')\n','MDMFRONTENDURL=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdmFrontendUrl')),''')\n','MDSDENVIRONMENT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('mdsdEnvironment')),''')\n','PORTALACCESSGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalAccessGroupIds')),''')\n','PORTALCLIENTID=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalClientId')),''')\n','PORTALELEVATEDGROUPIDS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('portalElevatedGroupIds')),''')\n','RPFEATURES=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpFeatures')),''')\n','RPIMAGE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpImage')),''')\n','RPMDMACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdmAccount')),''')\n','RPMDSDACCOUNT=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdAccount')),''')\n','RPMDSDCONFIGVERSION=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdConfigVersion')),''')\n','RPMDSDNAMESPACE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpMdsdNamespace')),''')\n','RPPARENTDOMAINNAME=$(base64 -d \u003c\u003c\u003c''',base64(parameters('rpParentDomainName')),''')\n','CLUSTERSINSTALLVIAHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersInstallViaHive')),''')\n','CLUSTERSADOPTBYHIVE=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clustersAdoptByHive')),''')\n','CLUSTERDEFAULTINSTALLERPULLSPEC=$(base64 -d \u003c\u003c\u003c''',base64(parameters('clusterDefaultInstallerPullspec')),''')\n','USECHECKACCESS=$(base64 -d \u003c\u003c\u003c''',base64(parameters('useCheckAccess')),''')\n','ADMINAPICABUNDLE=''',parameters('adminApiCaBundle'),'''\n','ARMAPICABUNDLE=''',parameters('armApiCaBundle'),'''\n','MDMIMAGE=''/genevamdm:2.2024.328.1744-c5fb79-20240328t1935''\n','LOCATION=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().location),''')\n','SUBSCRIPTIONID=$(base64 -d \u003c\u003c\u003c''',base64(subscription().subscriptionId),''')\n','RESOURCEGROUPNAME=$(base64 -d \u003c\u003c\u003c''',base64(resourceGroup().name),''')\n','\n',base64ToString('#!/bin/bash

set -o errexit \
    -o nounset

if [ "${DEBUG:-false}" == true ]; then
    set -x
fi

main() {
    parse_run_options "$@"


    configure_sshd
    configure_and_install_dnf_pkgs_repos
    configure_disk_partitions
    configure_logrotate
    configure_selinux

    mkdir -p /var/log/journal
    mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store

    configure_firewalld_rules
    pull_container_images
    configure_system_services
    reboot_vm
}

usage() {
    local -n options="$1"
    log "$(basename "$0") [$options]
        -d Configure Disk Partitions
        -p Configure rpm repositories, import required rpm keys, update & install packages with dnf
        -l Configure logrotate.conf
        -s Make selinux modifications required for ARO RP
        -r Configure sshd - Allow password authenticaiton
        -f Configure firewalld default zone rules
        -u Configure systemd unit files for ARO RP
        -i Pull container images

        Note: steps will be executed in the order that flags are provided
    "
}

# parse_run_options takes all arguements passed to main and parses them
# allowing individual step(s) to be ran, rather than all steps
#
# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline
parse_run_options() {
    # shellcheck disable=SC2206
    local -a options=(${1:-})
    if [ "${#options[@]}" -eq 0 ]; then
        log "Running all steps"
        return 0
    fi

    local OPTIND
    local -r allowed_options="dplsrfui"
    while getopts ${allowed_options} options; do
        case "${options}" in
            d)
                log "Running step configure_disk_partitions"
                configure_disk_partitions
                ;;
            p)
                log "Running step configure_and_install_dnf_pkgs_repos"
                configure_and_install_dnf_pkgs_repos
                ;;
            l)
                log "Running configure_logrotate"
                configure_logrotate
                ;;
            s)
                log "Running configure_selinux"
                configure_selinux
                ;;
            r)
                log "Running configure_sshd"
                configure_sshd
                ;;
            f)
                log "Running configure_firewalld_rules"
                configure_firewalld_rules
                ;;
            u)
                log "Running pull_container_images & configure_system_services"
                configure_system_services
                ;;
            i)
                log "Running pull_container_images"
                pull_container_images 
                ;;
            *)
                usage allowed_options
                abort "Unkown option provided"
                ;;
        esac
    done
    
    exit 0
}

# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work
configure_sshd() {
    log "starting"
    log "setting ssh password authentication"
    sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config

    systemctl reload sshd.service
    systemctl is-active --quiet sshd || abort "sshd failed to reload"
}

# configure_and_install_dnf_pkgs_repos
configure_and_install_dnf_pkgs_repos() {
    log "starting"

    # transaction attempt retry time in seconds
    local -ri retry_wait_time=60
    configure_rhui_repo retry_wait_time
    create_azure_rpm_repos retry_wait_time

    local -ar exclude_pkgs=(
        "-x WALinuxAgent"
        "-x WALinuxAgent-udev"
    )

    dnf_update_pkgs exclude_pkgs retry_wait_time

    local -ra rpm_keys=(
        https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8
        https://packages.microsoft.com/keys/microsoft.asc
    )

    rpm_import_keys rpm_keys retry_wait_time

    local -ra repo_rpm_pkgs=(
        https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm
    )

    local -ra install_pkgs=(
        clamav
        azsec-clamav
        azsec-monitor
        azure-cli
        azure-mdsd
        azure-security
        podman
        podman-docker
        openssl-perl
        # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505
        python3
    )

    dnf_install_pkgs repo_rpm_pkgs retry_wait_time
    dnf_install_pkgs install_pkgs retry_wait_time
}

# configure_rhui_repo
configure_rhui_repo() {
    log "starting"

    local -ra cmd=(
        dnf
        update
        -y
        --disablerepo='*'
        --enablerepo='rhui-microsoft-azure*'
    )

    log "running RHUI package updates"
    retry cmd "$1"
}

# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks
retry() {
    local -n cmd_retry="$1"
    local -n wait_time="$2"

    for attempt in {1..5}; do
        log "attempt #${attempt} - ${FUNCNAME[2]}"
        ${cmd_retry[@]} &

        wait $! && break
        if [[ ${attempt} -lt 5 ]]; then
            sleep "$wait_time"
        else
            abort "attempt #${attempt} - Failed to update packages"
        fi
    done
}

# dnf_update_pkgs
dnf_update_pkgs() {
    local -n excludes="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        ${excludes[@]}
        update
        --allowerasing
    )

    log "Updating all packages"
    retry cmd "$2"
}

# dnf_install_pkgs
dnf_install_pkgs() {
    local -n pkgs="$1"
    log "starting"

    local -ra cmd=(
        dnf
        -y
        install
        ${pkgs[@]}
    )

    log "Attempting to install packages: ${pkgs[*]}"
    retry cmd "$2"
}

# rpm_import_keys
rpm_import_keys() {
    local -n keys="$1"
    log "starting"


    # shellcheck disable=SC2068
    for key in ${keys[@]}; do
        if [ ${#keys[@]} -eq 0 ]; then
            break
        fi
            local -a cmd=(
                rpm
                --import
                -v
                "$key"
            )

            log "attempt #$attempt - importing rpm repository key $key"
            retry cmd "$2" && unset key
    done
}

# configure_disk_partitions
configure_disk_partitions() {
    log "starting"
    log "extending partition table"

    # Linux block devices are inconsistently named
    # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here
    physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')"
    growpart "$physical_disk" 2

    log "extending filesystems"
    log "extending root lvm"
    lvextend -l +20%FREE /dev/rootvg/rootlv
    log "growing root filesystem"
    xfs_growfs /

    log "extending var lvm"
    lvextend -l +100%FREE /dev/rootvg/varlv
    log "growing var filesystem"
    xfs_growfs /var
}

# configure_logrotate clobbers /etc/logrotate.conf
configure_logrotate() {
    log "starting"

    local -r logrotate_conf_filename='/etc/logrotate.conf'
    local -r logrotate_conf_file='# see "man logrotate" for details
# rotate log files weekly
weekly

# keep 2 weeks worth of backlogs
rotate 2

# create new (empty) log files after rotating old ones
create

# use date as a suffix of the rotated file
dateext

# uncomment this if you want your log files compressed
compress

# RPM packages drop log rotation information into this directory
include /etc/logrotate.d

# no packages own wtmp and btmp -- we will rotate them here
/var/log/wtmp {
    monthly
    create 0664 root utmp
        minsize 1M
    rotate 1
}

/var/log/btmp {
    missingok
    monthly
    create 0600 root utmp
    rotate 1
}'

    write_file logrotate_conf_filename logrotate_conf_file true
}

# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file
create_azure_rpm_repos() {
    log "starting"

    local -r azure_repo_filename='/etc/yum.repos.d/azure.repo'
    local -r azure_repo_file='[azure-cli]
name=azure-cli
baseurl=https://packages.microsoft.com/yumrepos/azure-cli
enabled=yes
gpgcheck=yes

[azurecore]
name=azurecore
baseurl=https://packages.microsoft.com/yumrepos/azurecore
enabled=yes
gpgcheck=no'

    write_file azure_repo_filename azure_repo_file true
}

# configure_selinux
configure_selinux() {
    log "starting"

    local -r relabel="${1:-false}"

    already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined"
    semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error"
    chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent

    if "$relabel"; then
        restorecon -RF /var/log/* || log "$already_defined_ignore_error"
    fi
}

# configure_firewalld_rules
configure_firewalld_rules() {
    log "starting"

    # https://access.redhat.com/security/cve/cve-2020-13401
    local -r prefix="/etc/sysctl.d"
    local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf"
    local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0"

    write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true

    local -r disable_core_filename="$prefix/01-disable-core.conf"
    local -r disable_core_file="kernel.core_pattern = |/bin/true
    "
    write_file disable_core_filename disable_core_file true

    sysctl --system

    local -ra enable_ports=(
        "443/tcp"
        "444/tcp"
        "445/tcp"
        "2222/tcp"
    )

    log "Enabling ports ${enable_ports[*]} on default firewalld zone"
    # shellcheck disable=SC2068
    for port in ${enable_ports[@]}; do
        log "Enabling port $port now"
        firewall-cmd "--add-port=$port"
    done

    firewall-cmd --runtime-to-permanent
}

# pull_container_images
pull_container_images() {
    log "starting"

    # The managed identity that the VM runs as only has a single roleassignment.
    # This role assignment is ACRPull which is not necessarily present in the
    # subscription we're deploying into.  If the identity does not have any
    # role assignments scoped on the subscription we're deploying into, it will
    # not show on az login -i, which is why the below line is commented.
    # az account set -s "$SUBSCRIPTIONID"
    az login -i --allow-no-subscriptions

    # Suppress emulation output for podman instead of docker for az acr compatability
    mkdir -p /etc/containers/
    mkdir -p /root/.docker
    touch /etc/containers/nodocker

	# This name is used in the case that az acr login searches for this in it's environment
    local -r REGISTRY_AUTH_FILE="/root/.docker/config.json"
    
    log "logging into prod acr"
    az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")"

    MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}"
    docker pull "$MDMIMAGE"
    docker pull "$RPIMAGE"
    docker pull "$FLUENTBITIMAGE"

    az logout
}

# configure_system_services creates, configures, and enables the following systemd services and timers
# services
#   fluentbit
#   mdm
#   mdsd
#   arp-rp
#   aro-dbtoken
#   aro-monitor
#   aro-portal
configure_system_services() {
    configure_service_fluentbit
    configure_service_mdm
    configure_timers_mdm_mdsd
    configure_service_aro_rp
    configure_service_aro_dbtoken
    configure_service_aro_monitor
    configure_service_aro_portal
    configure_service_mdsd
}

# enable_aro_services enables all services required for aro rp
enable_aro_services() {
    log "starting"

    local -ra aro_services=(
        "aro-dbtoken"
        "aro-monitor"
        "aro-portal"
        "aro-rp"
        "auoms"
        "azsecd"
        "azsecmond"
        "mdsd"
        "mdm"
        "chronyd"
        "fluentbit"
    )
    log "enabling aro services ${aro_services[*]}"
    # shellcheck disable=SC2068
    for service in ${aro_services[@]}; do
        log "Enabling $service now"
        systemctl enable "$service.service"
    done
}

# configure_service_fluentbit
configure_service_fluentbit() {
    log "starting"
    log "configuring fluentbit service"

    mkdir -p /etc/fluentbit/
    mkdir -p /var/lib/fluent

    local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf'
    local -r fluentbit_conf_file="[INPUT]
Name systemd
Tag journald
Systemd_Filter _COMM=aro
DB /var/lib/fluent/journaldb

[FILTER]
	Name modify
	Match journald
	Remove_wildcard _
	Remove TIMESTAMP

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND asyncqos asyncqos true

[FILTER]
	Name modify
	Match asyncqos
	Remove CLIENT_PRINCIPAL_NAME
	Remove FILE
	Remove COMPONENT

[FILTER]
	Name rewrite_tag
	Match journald
	Rule $LOGKIND ifxaudit ifxaudit false

[OUTPUT]
	Name forward
	Match *
	Port 29230"

    write_file fluentbit_conf_filename fluentbit_conf_file true

    local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit'
    local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE"

    write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true

    local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service'

    local -r fluentbit_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitIntervalSec=0

[Service]
RestartSec=1s
EnvironmentFile=/etc/sysconfig/fluentbit
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --security-opt label=disable \
  --entrypoint /opt/td-agent-bit/bin/td-agent-bit \
  --net=host \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -v /etc/fluentbit/fluentbit.conf:/etc/fluentbit/fluentbit.conf \
  -v /var/lib/fluent:/var/lib/fluent:z \
  -v /var/log/journal:/var/log/journal:ro \
  -v /etc/machine-id:/etc/machine-id:ro \
  $FLUENTBITIMAGE \
  -c /etc/fluentbit/fluentbit.conf

ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=5
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file fluentbit_conf_filename fluentbit_conf_file true
}

# configure_certs
configure_certs() {
    log "starting"

    mkdir /etc/aro-rp
    base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem
    if [[ -n "$ARMAPICABUNDLE" ]]; then
    base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem
    fi
    chown -R 1000:1000 /etc/aro-rp

    # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not
    # to honour SSL_CERT_FILE any more, heaven only knows why.
    mkdir -p /usr/lib/ssl/certs
    csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null
    c_rehash /usr/lib/ssl/certs

# we leave clientId blank as long as only 1 managed identity assigned to vmss
# if we have more than 1, we will need to populate with clientId used for off-node scanning
    local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config"
    local -r nodescan_agent_file="{
    \"Nice\": 19,
    \"Timeout\": 10800,
    \"ClientId\": \"\",
    \"TenantId\": $AZURESECPACKVSATENANTID,
    \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL,
    \"ProcessTimeout\": 300,
    \"CommandDelay\": 0
  }"

    write_file nodescan_agent_filename nodescan_agent_file true
}

# configure_service_mdm
configure_service_mdm() {
    log "starting"
    log "configuring mdm service"

    local -r sysconfig_mdm_filename="/etc/sysconfig/mdm"
    local -r sysconfig_mdm_file="MDMFRONTENDURL='$MDMFRONTENDURL'
MDMIMAGE='$MDMIMAGE'
MDMSOURCEENVIRONMENT='$LOCATION'
MDMSOURCEROLE=rp
MDMSOURCEROLEINSTANCE=\"$(hostname)\""

    write_file sysconfig_mdm_filename sysconfig_mdm_file true

    mkdir -p /var/etw
    local -r mdm_service_filename="/etc/systemd/system/mdm.service"
    local -r mdm_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/mdm
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --entrypoint /usr/sbin/MetricsExtension \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -m 2g \
  -v /etc/mdm.pem:/etc/mdm.pem \
  -v /var/etw:/var/etw:z \
  $MDMIMAGE \
  -CertFile /etc/mdm.pem \
  -FrontEndUrl $MDMFRONTENDURL \
  -Logger Console \
  -LogLevel Warning \
  -PrivateKeyFile /etc/mdm.pem \
  -SourceEnvironment $MDMSOURCEENVIRONMENT \
  -SourceRole $MDMSOURCEROLE \
  -SourceRoleInstance $MDMSOURCEROLEINSTANCE
ExecStop=/usr/bin/docker stop %N
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file mdm_service_filename mdm_service_file true
}

# configure_timers_mdm_mdsd
configure_timers_mdm_mdsd() {
    log "starting"

    for var in "mdsd" "mdm"; do
        local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service"
        local download_creds_service_file="[Unit]
Description=Periodic $var credentials refresh

[Service]
Type=oneshot
ExecStart=/usr/local/bin/download-credentials.sh $var"

        write_file download_creds_service_filename download_creds_service_file true

        local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer"
        local download_creds_timer_file="[Unit]
Description=Periodic $var credentials refresh
After=network-online.target
Wants=network-online.target

[Timer]
OnBootSec=0min
OnCalendar=0/12:00:00
AccuracySec=5s

[Install]
WantedBy=timers.target"

        write_file download_creds_timer_filename download_creds_timer_file true
    done

    local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh"
    local -r download_creds_script_file="#!/bin/bash
set -eu

COMPONENT=\$1
echo \"Download \$COMPONENT credentials\"

TEMP_DIR=\"\$(mktemp -d)\"
export AZURE_CONFIG_DIR=\"\$(mktemp -d)\"

echo \"Logging into Azure...\"
RETRIES=3
while [[ \$RETRIES -gt 0 ]]; do
    if az login -i --allow-no-subscriptions
    then
        echo \"az login successful\"
        break
    else
        echo \"az login failed. Retrying...\"
        let RETRIES-=1
        sleep 5
    fi
done

trap \"cleanup\" EXIT

cleanup() {
  az logout
  [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR
  [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR
}

if [[ \$COMPONENT = \"mdm\" ]]; then
  CURRENT_CERT_FILE=\"/etc/mdm.pem\"
elif [[ \$COMPONENT\ = \"mdsd\" ]]; then
  CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\"
else
  echo Invalid usage && exit 1
fi

SECRET_NAME=\"rp-\${COMPONENT}\"
NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\"
for attempt in {1..5}; do
  az keyvault \
    secret \
    download \
    --file \"\$NEW_CERT_FILE\" \
    --id \"https://$KEYVAULTPREFIX-svc.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \
    && break
  if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi
done

if [ -f \$NEW_CERT_FILE ]; then
  if [[ \$COMPONENT = \"mdsd\" ]]; then
    chown syslog:syslog \$NEW_CERT_FILE
  else
    sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE
  fi

  new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\"
  if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then
    echo updating certificate for \$COMPONENT
    chmod 0600 \$NEW_CERT_FILE
    mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE
  fi
else
  echo Failed to refresh certificate for \$COMPONENT && exit 1
fi"

    write_file download_creds_script_filename download_creds_script_file true

    chmod u+x /usr/local/bin/download-credentials.sh

    systemctl enable download-mdsd-credentials.timer
    systemctl enable download-mdm-credentials.timer

    /usr/local/bin/download-credentials.sh mdsd
    /usr/local/bin/download-credentials.sh mdm

    local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')"
    local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service"
    local -r watch_mdm_creds_service_file="[Unit]
Description=Watch for changes in mdm.pem and restarts the mdm service

[Service]
Type=oneshot
ExecStart=/usr/bin/systemctl restart mdm.service

[Install]
WantedBy=multi-user.target"

    write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file true

    local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path'
    local -r watch_mdm_creds_path_file='[Path]
PathModified=/etc/mdm.pem

[Install]
WantedBy=multi-user.target'

    write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file true

    local -r watch_mdm_creds='watch-mdm-credentials.path'
    systemctl enable "$watch_mdm_creds" || abort "failed to enable $watch_mdm_creds"
    systemctl start "$watch_mdm_creds" || abort "failed to start $watch_mdm_creds"
}

# configure_service_aro_rp
configure_service_aro_rp() {
    log "starting"

    local -r aro_rp_conf_filename='/etc/sysconfig/aro-rp'
    local -r aro_rp_conf_file="ACR_RESOURCE_ID='$ACRRESOURCEID'
ADMIN_API_CLIENT_CERT_COMMON_NAME='$ADMINAPICLIENTCERTCOMMONNAME'
ARM_API_CLIENT_CERT_COMMON_NAME='$ARMAPICLIENTCERTCOMMONNAME'
AZURE_ARM_CLIENT_ID='$ARMCLIENTID'
AZURE_FP_CLIENT_ID='$FPCLIENTID'
AZURE_FP_SERVICE_PRINCIPAL_ID='$FPSERVICEPRINCIPALID'
BILLING_E2E_STORAGE_ACCOUNT_ID='$BILLINGE2ESTORAGEACCOUNTID'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=RP
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=RP
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
RP_FEATURES='$RPFEATURES'
RPIMAGE='$RPIMAGE'
ARO_INSTALL_VIA_HIVE='$CLUSTERSINSTALLVIAHIVE'
ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC='$CLUSTERDEFAULTINSTALLERPULLSPEC'
ARO_ADOPT_BY_HIVE='$CLUSTERSADOPTBYHIVE'
USE_CHECKACCESS='$USECHECKACCESS'"

    write_file aro_rp_conf_filename aro_rp_conf_file true

    local -r aro_rp_service_filename='/etc/systemd/system/aro-rp.service'
    local -r aro_rp_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-rp
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e ACR_RESOURCE_ID \
  -e ADMIN_API_CLIENT_CERT_COMMON_NAME \
  -e ARM_API_CLIENT_CERT_COMMON_NAME \
  -e AZURE_ARM_CLIENT_ID \
  -e AZURE_FP_CLIENT_ID \
  -e BILLING_E2E_STORAGE_ACCOUNT_ID \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e CLUSTER_MDSD_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e DOMAIN_NAME \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e MDSD_ENVIRONMENT \
  -e RP_FEATURES \
  -e ARO_INSTALL_VIA_HIVE \
  -e ARO_HIVE_DEFAULT_INSTALLER_PULLSPEC \
  -e ARO_ADOPT_BY_HIVE \
  -e USE_CHECKACCESS \
  -m 2g \
  -p 443:8443 \
  -v /etc/aro-rp:/etc/aro-rp \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  rp
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_rp_service_filename aro_rp_conf_file true
}

# configure_service_aro_dbtoken
configure_service_aro_dbtoken() {
    log "starting"

    local -r aro_dbtoken_service_conf_filename='/etc/sysconfig/aro-dbtoken'
    local -r aro_dbtoken_service_conf_file="DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
AZURE_DBTOKEN_CLIENT_ID='$DBTOKENCLIENTID'
AZURE_GATEWAY_SERVICE_PRINCIPAL_ID='$GATEWAYSERVICEPRINCIPALID'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=DBToken
RPIMAGE='$RPIMAGE'"

    write_file aro_dbtoken_service_conf_filename aro_dbtoken_service_conf_file true

    local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service'
    local -r aro_dbtoken_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-dbtoken
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_GATEWAY_SERVICE_PRINCIPAL_ID \
  -e DATABASE_ACCOUNT_NAME \
  -e AZURE_DBTOKEN_CLIENT_ID \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2g \
  -p 445:8445 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  dbtoken
ExecStop=/usr/bin/docker stop -t 3600 %N
TimeoutStopSec=3600
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_dbtoken_service_filename aro_dbtoken_service_file true
}

# configure_service_aro_monitor
configure_service_aro_monitor() {
    log "starting"
    log "configuring aro-monitor service"

    # DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE
    # are not used, but can't easily be refactored out. Should be revisited in the future.
    local -r aro_monitor_service_conf_filename='/etc/sysconfig/aro-monitor'
    local -r aro_monitor_service_conf_file="AZURE_FP_CLIENT_ID='$FPCLIENTID'
DOMAIN_NAME='$LOCATION.$CLUSTERPARENTDOMAINNAME'
CLUSTER_MDSD_ACCOUNT='$CLUSTERMDSDACCOUNT'
CLUSTER_MDSD_CONFIG_VERSION='$CLUSTERMDSDCONFIGVERSION'
GATEWAY_DOMAINS='$GATEWAYDOMAINS'
GATEWAY_RESOURCEGROUP='$GATEWAYRESOURCEGROUPNAME'
MDSD_ENVIRONMENT='$MDSDENVIRONMENT'
CLUSTER_MDSD_NAMESPACE='$CLUSTERMDSDNAMESPACE'
CLUSTER_MDM_ACCOUNT='$CLUSTERMDMACCOUNT'
CLUSTER_MDM_NAMESPACE=BBM
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=BBM
RPIMAGE='$RPIMAGE'"

    write_file aro_monitor_service_conf_filename aro_monitor_service_conf_file true

    local -r aro_monitor_service_filename='/etc/systemd/system/aro-monitor.service'
    local -r aro_monitor_service_file="[Unit]
After=network-online.target
Wants=network-online.target

[Service]
EnvironmentFile=/etc/sysconfig/aro-monitor
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_FP_CLIENT_ID \
  -e DOMAIN_NAME \
  -e CLUSTER_MDSD_ACCOUNT \
  -e CLUSTER_MDSD_CONFIG_VERSION \
  -e GATEWAY_DOMAINS \
  -e GATEWAY_RESOURCEGROUP \
  -e MDSD_ENVIRONMENT \
  -e CLUSTER_MDSD_NAMESPACE \
  -e CLUSTER_MDM_ACCOUNT \
  -e CLUSTER_MDM_NAMESPACE \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -m 2.5g \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  monitor
Restart=always
RestartSec=1
StartLimitInterval=0

[Install]
WantedBy=multi-user.target"

    write_file aro_monitor_service_filename aro_monitor_service_file true
}

# configure_service_aro_portal
configure_service_aro_portal() {
    log "starting"

    local -r aro_portal_service_conf_filename='/etc/sysconfig/aro-portal'
    local -r aro_portal_service_conf_file="AZURE_PORTAL_ACCESS_GROUP_IDS='$PORTALACCESSGROUPIDS'
AZURE_PORTAL_CLIENT_ID='$PORTALCLIENTID'
AZURE_PORTAL_ELEVATED_GROUP_IDS='$PORTALELEVATEDGROUPIDS'
DATABASE_ACCOUNT_NAME='$DATABASEACCOUNTNAME'
KEYVAULT_PREFIX='$KEYVAULTPREFIX'
MDM_ACCOUNT='$RPMDMACCOUNT'
MDM_NAMESPACE=Portal
PORTAL_HOSTNAME='$LOCATION.admin.$RPPARENTDOMAINNAME'
RPIMAGE='$RPIMAGE'"

    write_file aro_portal_service_conf_filename aro_portal_service_conf_file true

    local -r aro_portal_service_filename='/etc/systemd/system/aro-portal.service'
    local -r aro_portal_service_file="[Unit]
After=network-online.target
Wants=network-online.target
StartLimitInterval=0

[Service]
EnvironmentFile=/etc/sysconfig/aro-portal
ExecStartPre=-/usr/bin/docker rm -f %N
ExecStart=/usr/bin/docker run \
  --hostname %H \
  --name %N \
  --rm \
  --cap-drop net_raw \
  -e AZURE_PORTAL_ACCESS_GROUP_IDS \
  -e AZURE_PORTAL_CLIENT_ID \
  -e AZURE_PORTAL_ELEVATED_GROUP_IDS \
  -e DATABASE_ACCOUNT_NAME \
  -e KEYVAULT_PREFIX \
  -e MDM_ACCOUNT \
  -e MDM_NAMESPACE \
  -e PORTAL_HOSTNAME \
  -m 2g \
  -p 444:8444 \
  -p 2222:2222 \
  -v /run/systemd/journal:/run/systemd/journal \
  -v /var/etw:/var/etw:z \
  $RPIMAGE \
  portal
Restart=always
RestartSec=1

[Install]
WantedBy=multi-user.target"

    write_file aro_portal_service_conf_filename aro_portal_service_conf_file true
}

# configure_service_mdsd
configure_service_mdsd() {
    log "starting"

    local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d"
    mkdir "$mdsd_service_dir"

    local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf"
    local -r mdsd_override_conf_file="[Unit]
After=network-online.target"

    write_file mdsd_override_conf_filename mdsd_override_conf_file true

    local -r default_mdsd_filename="/etc/default/mdsd"
    local -r default_mdsd_file="MDSD_ROLE_PREFIX=/var/run/mdsd/default
MDSD_OPTIONS=\"-A -d -r \$MDSD_ROLE_PREFIX\"

export MONITORING_GCS_ENVIRONMENT='$MDSDENVIRONMENT'
export MONITORING_GCS_ACCOUNT='$RPMDSDACCOUNT'
export MONITORING_GCS_REGION='$LOCATION'
export MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault
export MONITORING_GCS_AUTH_ID='$MDSDCERTIFICATESAN'
export MONITORING_GCS_NAMESPACE='$RPMDSDNAMESPACE'
export MONITORING_CONFIG_VERSION='$RPMDSDCONFIGVERSION'
export MONITORING_USE_GENEVA_CONFIG_SERVICE=true

export MONITORING_TENANT='$LOCATION'
export MONITORING_ROLE=rp
export MONITORING_ROLE_INSTANCE=\"$(hostname)\"

export MDSD_MSGPACK_SORT_COLUMNS=1\""

    write_file default_mdsd_filename default_mdsd_file true

}

# run_azsecd_config_scan
run_azsecd_config_scan() {
    log "starting"

    local -ar configs=(
        "baseline"
        "clamav"
        "software"
    )

    log "Scanning configuration files ${configs[*]}"
    # shellcheck disable=SC2068
    for scan in ${configs[@]}; do
        log "Scanning config file $scan now"
        /usr/local/bin/azsecd config -s "$scan" -d P1D
    done
}

# write_file
# Args
# 1) filename - string
# 2) file_contents - string
# 3) clobber - boolean; optional - defaults to false
write_file() {
    local -n filename="$1"
    local -n file_contents="$2"
    local -r clobber="${3:-false}"

    if $clobber; then
        log "Overwriting file $filename"
        echo "$file_contents" > "$filename"
    else
        log "Appending to $filename"
        echo "$file_contents" >> "$filename"
    fi
}

# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots
reboot_vm() {
    log "starting"

    configure_selinux "true"
    (sleep 30 && log "rebooting vm now"; reboot) &
}

# log is a wrapper for echo that includes the function name
log() {
    local -r msg="${1:-"log message is empty"}"
    local -r stack_level="${2:-1}"
    echo "${FUNCNAME[${stack_level}]}: ${msg}"
}

# abort is a wrapper for log that exits with an error code
abort() {
    local -ri origin_stacklevel=2
    log "${1}" "$origin_stacklevel"
    log "Exiting"
    exit 1
}

export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}"

main "$@"
')))]" } } } diff --git a/pkg/deploy/generator/scripts/devProxyVMSS.sh b/pkg/deploy/generator/scripts/devProxyVMSS.sh index bdbb8fe35b3..2b405881bce 100644 --- a/pkg/deploy/generator/scripts/devProxyVMSS.sh +++ b/pkg/deploy/generator/scripts/devProxyVMSS.sh @@ -1,53 +1,331 @@ -#Adding retry logic to yum commands in order to avoid stalling out on resource locks -echo "running RHUI fix" -for attempt in {1..5}; do - yum update -y --disablerepo='*' --enablerepo='rhui-microsoft-azure*' && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done - -echo "running yum update" -for attempt in {1..5}; do - yum -y -x WALinuxAgent -x WALinuxAgent-udev update --allowerasing && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done - -echo "installing podman-docker" -for attempt in {1..5}; do - yum -y install podman-docker && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done - -firewall-cmd --add-port=443/tcp --permanent - -mkdir /root/.docker -cat >/root/.docker/config.json </etc/proxy/proxy.crt -base64 -d <<<"$PROXYKEY" >/etc/proxy/proxy.key -base64 -d <<<"$PROXYCLIENTCERT" >/etc/proxy/proxy-client.crt -chown -R 1000:1000 /etc/proxy -chmod 0600 /etc/proxy/proxy.key + local -ra aro_services=( + proxy + ) + log "enabling aro services ${aro_services[*]}" + # shellcheck disable=SC2068 + for service in ${aro_services[@]}; do + log "Enabling $service now" + systemctl enable "$service.service" + done +} -cat >/etc/sysconfig/proxy </etc/systemd/system/proxy.service <<'EOF' -[Unit] + base64 -d <<<"$PROXYCERT" >/etc/proxy/proxy.crt + base64 -d <<<"$PROXYKEY" >/etc/proxy/proxy.key + base64 -d <<<"$PROXYCLIENTCERT" >/etc/proxy/proxy-client.crt + chown -R 1000:1000 /etc/proxy + chmod 0600 /etc/proxy/proxy.key +} + +configure_service_proxy() { + local -r sysconfig_proxy_filename='/etc/sysconfig/proxy' + local -r sysconfig_proxy_file="PROXY_IMAGE='$PROXYIMAGE'" + + write_file sysconfig_proxy_filename sysconfig_proxy_file true + + local -r proxy_service_filename='/etc/systemd/system/proxy.service' + local -r proxy_service_file="[Unit] After=network-online.target Wants=network-online.target @@ -61,34 +339,66 @@ RestartSec=1 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" -systemctl enable proxy.service + local -r cron_weekly_pull_image_filename='/etc/cron.weekly/pull-image' + local -r cron_weekly_pull_image_file="#!/bin/bash +docker pull $PROXYIMAGE +systemctl restart proxy.service" + + write_file cron_weekly_pull_image_filename cron_weekly_pull_image_file true + chmod +x "$cron_weekly_pull_image_filename" -cat >/etc/cron.weekly/pull-image <<'EOF' -#!/bin/bash + local -r cron_daily_restart_proxy_filename='/etc/cron.daily/restart-proxy' + local -r cron_daily_restart_proxy_file="#!/bin/bash +systemctl restart proxy.service" + + write_file cron_daily_restart_proxy_filename cron_daily_restart_proxy_file + chmod +x "$cron_daily_restart_proxy_filename" +} -docker pull $PROXYIMAGE -systemctl restart proxy.service -EOF -chmod +x /etc/cron.weekly/pull-image +# write_file +# Args +# 1) filename - string +# 2) file_contents - string +# 3) clobber - boolean; optional - defaults to false +write_file() { + local -n filename="$1" + local -n file_contents="$2" + local -r clobber="${3:-false}" -cat >/etc/cron.weekly/yumupdate <<'EOF' -#!/bin/bash + if $clobber; then + log "Overwriting file $filename" + echo "$file_contents" > "$filename" + else + log "Appending to $filename" + echo "$file_contents" >> "$filename" + fi +} -yum update -y -EOF -chmod +x /etc/cron.weekly/yumupdate +# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots +reboot_vm() { + log "starting" -cat >/etc/cron.daily/restart-proxy <<'EOF' -#!/bin/bash + configure_selinux "true" + (sleep 30 && log "rebooting vm now"; reboot) & +} + +# log is a wrapper for echo that includes the function name +log() { + local -r msg="${1:-"log message is empty"}" + local -r stack_level="${2:-1}" + echo "${FUNCNAME[${stack_level}]}: ${msg}" +} + +# abort is a wrapper for log that exits with an error code +abort() { + local -ri origin_stacklevel=2 + log "${1}" "$origin_stacklevel" + log "Exiting" + exit 1 +} -systemctl restart proxy.service -EOF -chmod +x /etc/cron.daily/restart-proxy +export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}" -( - sleep 30 - reboot -) & +main "$@" diff --git a/pkg/deploy/generator/scripts/gatewayVMSS.sh b/pkg/deploy/generator/scripts/gatewayVMSS.sh index 4034eed3675..64b4232309f 100644 --- a/pkg/deploy/generator/scripts/gatewayVMSS.sh +++ b/pkg/deploy/generator/scripts/gatewayVMSS.sh @@ -1,52 +1,280 @@ #!/bin/bash -echo "setting ssh password authentication" -# We need to manually set PasswordAuthentication to true in order for the VMSS Access JIT to work -sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config -systemctl reload sshd.service +set -o errexit \ + -o nounset -#Adding retry logic to yum commands in order to avoid stalling out on resource locks -echo "running RHUI fix" -for attempt in {1..5}; do - yum update -y --disablerepo='*' --enablerepo='rhui-microsoft-azure*' && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +if [ "${DEBUG:-false}" == true ]; then + set -x +fi -echo "running yum update" -for attempt in {1..5}; do - yum -y -x WALinuxAgent -x WALinuxAgent-udev update --allowerasing && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +main() { + local -r gateway_logdir='/var/log/aro-gateway' + parse_run_options "$@" gateway_logdir -echo "extending partition table" -# Linux block devices are inconsistently named -# it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here -physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" -growpart "$physical_disk" 2 -echo "extending filesystems" -lvextend -l +20%FREE /dev/rootvg/rootlv -xfs_growfs / + configure_sshd + configure_and_install_dnf_pkgs_repos + configure_disk_partitions + configure_logrotate gateway_logdir + configure_selinux -lvextend -l +100%FREE /dev/rootvg/varlv -xfs_growfs /var + mkdir -p /var/log/journal + mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store -rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 -rpm --import https://packages.microsoft.com/keys/microsoft.asc + configure_firewalld_rules + pull_container_images + configure_system_services gateway_logdir + reboot_vm +} -for attempt in {1..5}; do - yum -y install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +usage() { + local -n options="$1" + log "$(basename "$0") [$options] + -d Configure Disk Partitions + -p Configure rpm repositories, import required rpm keys, update & install packages with dnf + -l Configure logrotate.conf + -s Make selinux modifications required for ARO RP + -r Configure sshd - Allow password authenticaiton + -f Configure firewalld default zone rules + -u Configure systemd unit files for ARO RP + -i Pull container images + + Note: steps will be executed in the order that flags are provided + " +} + +# parse_run_options takes all arguements passed to main and parses them +# allowing individual step(s) to be ran, rather than all steps +# +# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline +parse_run_options() { + # shellcheck disable=SC2206 + local -a options=(${1:-}) + if [ "${#options[@]}" -eq 0 ]; then + log "Running all steps" + return 0 + fi + + local OPTIND + local -r allowed_options="dplsrfui" + while getopts ${allowed_options} options; do + case "${options}" in + d) + log "Running step configure_disk_partitions" + configure_disk_partitions + ;; + p) + log "Running step configure_and_install_dnf_pkgs_repos" + configure_and_install_dnf_pkgs_repos + ;; + l) + log "Running configure_logrotate" + configure_logrotate "$2" + ;; + s) + log "Running configure_selinux" + configure_selinux + ;; + r) + log "Running configure_sshd" + configure_sshd + ;; + f) + log "Running configure_firewalld_rules" + configure_firewalld_rules + ;; + u) + log "Running pull_container_images & configure_system_services" + configure_system_services "$2" + ;; + i) + log "Running pull_container_images" + pull_container_images + ;; + *) + usage allowed_options + abort "Unkown option provided" + ;; + esac + done + + exit 0 +} + +# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work +configure_sshd() { + log "starting" + log "setting ssh password authentication" + sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config + + systemctl reload sshd.service + systemctl is-active --quiet sshd || abort "sshd failed to reload" +} -echo "configuring logrotate" +# configure_and_install_dnf_pkgs_repos +configure_and_install_dnf_pkgs_repos() { + log "starting" + + # transaction attempt retry time in seconds + local -ri retry_wait_time=60 + configure_rhui_repo retry_wait_time + create_azure_rpm_repos retry_wait_time + + local -ar exclude_pkgs=( + "-x WALinuxAgent" + "-x WALinuxAgent-udev" + ) + + dnf_update_pkgs exclude_pkgs retry_wait_time + + local -ra rpm_keys=( + https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 + https://packages.microsoft.com/keys/microsoft.asc + ) + + rpm_import_keys rpm_keys retry_wait_time + + local -ra repo_rpm_pkgs=( + https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm + ) + + local -ra install_pkgs=( + clamav + azsec-clamav + azsec-monitor + azure-cli + azure-mdsd + azure-security + podman + podman-docker + openssl-perl + # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 + python3 + ) + + dnf_install_pkgs repo_rpm_pkgs retry_wait_time + dnf_install_pkgs install_pkgs retry_wait_time +} + +# configure_rhui_repo +configure_rhui_repo() { + log "starting" + + local -ra cmd=( + dnf + update + -y + --disablerepo='*' + --enablerepo='rhui-microsoft-azure*' + ) + + log "running RHUI package updates" + retry cmd "$1" +} + +# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks +retry() { + local -n cmd_retry="$1" + local -n wait_time="$2" + + for attempt in {1..5}; do + log "attempt #${attempt} - ${FUNCNAME[2]}" + ${cmd_retry[@]} & + + wait $! && break + if [[ ${attempt} -lt 5 ]]; then + sleep "$wait_time" + else + abort "attempt #${attempt} - Failed to update packages" + fi + done +} + +# dnf_update_pkgs +dnf_update_pkgs() { + local -n excludes="$1" + log "starting" + + local -ra cmd=( + dnf + -y + ${excludes[@]} + update + --allowerasing + ) + + log "Updating all packages" + retry cmd "$2" +} + +# dnf_install_pkgs +dnf_install_pkgs() { + local -n pkgs="$1" + log "starting" + + local -ra cmd=( + dnf + -y + install + ${pkgs[@]} + ) + + log "Attempting to install packages: ${pkgs[*]}" + retry cmd "$2" +} + +# rpm_import_keys +rpm_import_keys() { + local -n keys="$1" + log "starting" + + + # shellcheck disable=SC2068 + for key in ${keys[@]}; do + if [ ${#keys[@]} -eq 0 ]; then + break + fi + local -a cmd=( + rpm + --import + -v + "$key" + ) + + log "attempt #$attempt - importing rpm repository key $key" + retry cmd "$2" && unset key + done +} -# gateway_logdir is a readonly variable that specifies the host path mount point for the gateway container log file -# for the purpose of rotating the gateway logs -declare -r gateway_logdir='/var/log/aro-gateway' +# configure_disk_partitions +configure_disk_partitions() { + log "starting" + log "extending partition table" + + # Linux block devices are inconsistently named + # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here + physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" + growpart "$physical_disk" 2 + + log "extending filesystems" + log "extending root lvm" + lvextend -l +20%FREE /dev/rootvg/rootlv + log "growing root filesystem" + xfs_growfs / + + log "extending var lvm" + lvextend -l +100%FREE /dev/rootvg/varlv + log "growing var filesystem" + xfs_growfs /var +} -cat >/etc/logrotate.conf </etc/yum.repos.d/azure.repo <<'EOF' -[azure-cli] +# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file +create_azure_rpm_repos() { + log "starting" + + local -r azure_repo_filename='/etc/yum.repos.d/azure.repo' + local -r azure_repo_file='[azure-cli] name=azure-cli baseurl=https://packages.microsoft.com/yumrepos/azure-cli enabled=yes @@ -105,68 +338,144 @@ gpgcheck=yes name=azurecore baseurl=https://packages.microsoft.com/yumrepos/azurecore enabled=yes -gpgcheck=no -EOF +gpgcheck=no' + + write_file azure_repo_filename azure_repo_file true +} -semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" -mkdir -p /var/log/journal +# configure_selinux +configure_selinux() { + log "starting" -for attempt in {1..5}; do - yum -y install clamav azsec-clamav azsec-monitor azure-cli azure-mdsd azure-security podman-docker openssl-perl python3 && break - # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done + local -r relabel="${1:-false}" + + already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined" + semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error" + chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent + + if "$relabel"; then + restorecon -RF /var/log/* || log "$already_defined_ignore_error" + fi +} + +# configure_firewalld_rules +configure_firewalld_rules() { + log "starting" + + # https://access.redhat.com/security/cve/cve-2020-13401 + local -r prefix="/etc/sysctl.d" + local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf" + local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0" + + write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true + + local -r disable_core_filename="$prefix/01-disable-core.conf" + local -r disable_core_file="kernel.core_pattern = |/bin/true + " + write_file disable_core_filename disable_core_file true + + sysctl --system -echo "applying firewall rules" -# https://access.redhat.com/security/cve/cve-2020-13401 -cat >/etc/sysctl.d/02-disable-accept-ra.conf <<'EOF' -net.ipv6.conf.all.accept_ra=0 -EOF - -cat >/etc/sysctl.d/01-disable-core.conf <<'EOF' -kernel.core_pattern = |/bin/true -EOF -sysctl --system - -firewall-cmd --add-port=80/tcp --permanent -firewall-cmd --add-port=8081/tcp --permanent -firewall-cmd --add-port=443/tcp --permanent - -echo "logging into prod acr" -export AZURE_CLOUD_NAME=$AZURECLOUDNAME -az login -i --allow-no-subscriptions - -# The managed identity that the VM runs as only has a single roleassignment. -# This role assignment is ACRPull which is not necessarily present in the -# subscription we're deploying into. If the identity does not have any -# role assignments scoped on the subscription we're deploying into, it will -# not show on az login -i, which is why the below line is commented. -# az account set -s "$SUBSCRIPTIONID" - -# Suppress emulation output for podman instead of docker for az acr compatability -mkdir -p /etc/containers/ -touch /etc/containers/nodocker - -mkdir -p /root/.docker -REGISTRY_AUTH_FILE=/root/.docker/config.json az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" - -MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" -docker pull "$MDMIMAGE" -docker pull "$RPIMAGE" -docker pull "$FLUENTBITIMAGE" - -az logout - -echo "configuring fluentbit service" -mkdir -p /etc/fluentbit/ -mkdir -p /var/lib/fluent - -cat >/etc/fluentbit/fluentbit.conf <<'EOF' -[INPUT] - Name systemd - Tag journald - Systemd_Filter _COMM=aro - DB /var/lib/fluent/journaldb + local -ra enable_ports=( + "80/tcp" + "8081/tcp" + "443/tcp" + ) + + log "Enabling ports ${enable_ports[*]} on default firewalld zone" + # shellcheck disable=SC2068 + for port in ${enable_ports[@]}; do + log "Enabling port $port now" + firewall-cmd "--add-port=$port" + done + + firewall-cmd --runtime-to-permanent +} + +# pull_container_images +pull_container_images() { + log "starting" + + # The managed identity that the VM runs as only has a single roleassignment. + # This role assignment is ACRPull which is not necessarily present in the + # subscription we're deploying into. If the identity does not have any + # role assignments scoped on the subscription we're deploying into, it will + # not show on az login -i, which is why the below line is commented. + # az account set -s "$SUBSCRIPTIONID" + az login -i --allow-no-subscriptions + + # Suppress emulation output for podman instead of docker for az acr compatability + mkdir -p /etc/containers/ + mkdir -p /root/.docker + touch /etc/containers/nodocker + + # This name is used in the case that az acr login searches for this in it's environment + local -r REGISTRY_AUTH_FILE="/root/.docker/config.json" + + log "logging into prod acr" + az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" + + MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" + docker pull "$MDMIMAGE" + docker pull "$RPIMAGE" + docker pull "$FLUENTBITIMAGE" + + az logout +} + +# configure_system_services creates, configures, and enables the following systemd services and timers +# services +# fluentbit +# mdm +# mdsd +# arp-rp +# aro-dbtoken +# aro-monitor +# aro-portal +configure_system_services() { + configure_service_fluentbit + configure_service_mdm + configure_timers_mdm_mdsd + configure_service_aro_gateway "$1" + configure_service_mdsd +} + +# enable_aro_services enables all services required for aro rp +enable_aro_services() { + log "starting" + + local -ra aro_services=( + aro-gateway + auoms + azsecd + azsecmond + mdsd + mdm + chronyd + fluentbit + ) + log "enabling gateway services ${aro_services[*]}" + # shellcheck disable=SC2068 + for service in ${aro_services[@]}; do + log "Enabling $service now" + systemctl enable "$service.service" + done +} + +# configure_service_fluentbit +configure_service_fluentbit() { + log "starting" + log "configuring fluentbit service" + + mkdir -p /etc/fluentbit/ + mkdir -p /var/lib/fluent + + local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf' + local -r fluentbit_conf_file="[INPUT] +Name systemd +Tag journald +Systemd_Filter _COMM=aro +DB /var/lib/fluent/journaldb [FILTER] Name modify @@ -177,13 +486,18 @@ cat >/etc/fluentbit/fluentbit.conf <<'EOF' [OUTPUT] Name forward Match * - Port 29230 -EOF + Port 29230" + + write_file fluentbit_conf_filename fluentbit_conf_file true + + local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit' + local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE" + + write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true -echo "FLUENTBITIMAGE=$FLUENTBITIMAGE" >/etc/sysconfig/fluentbit + local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service' -cat >/etc/systemd/system/fluentbit.service <<'EOF' -[Unit] + local -r fluentbit_service_file="[Unit] After=network-online.target Wants=network-online.target StartLimitIntervalSec=0 @@ -213,21 +527,61 @@ RestartSec=5 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" + + write_file fluentbit_conf_filename fluentbit_conf_file true +} + +# configure_certs +configure_certs() { + log "starting" + + mkdir /etc/aro-rp + base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem + if [[ -n "$ARMAPICABUNDLE" ]]; then + base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem + fi + chown -R 1000:1000 /etc/aro-rp + + # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not + # to honour SSL_CERT_FILE any more, heaven only knows why. + mkdir -p /usr/lib/ssl/certs + csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null + c_rehash /usr/lib/ssl/certs + +# we leave clientId blank as long as only 1 managed identity assigned to vmss +# if we have more than 1, we will need to populate with clientId used for off-node scanning + local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config" + local -r nodescan_agent_file="{ + \"Nice\": 19, + \"Timeout\": 10800, + \"ClientId\": \"\", + \"TenantId\": $AZURESECPACKVSATENANTID, + \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL, + \"ProcessTimeout\": 300, + \"CommandDelay\": 0 + }" + + write_file nodescan_agent_filename nodescan_agent_file true +} + +# configure_service_mdm +configure_service_mdm() { + log "starting" + log "configuring mdm service" -echo "configuring mdm service" -cat >/etc/sysconfig/mdm </etc/systemd/system/mdm.service <<'EOF' -[Unit] + write_file sysconfig_mdm_filename sysconfig_mdm_file true + + mkdir -p /var/etw + local -r mdm_service_filename="/etc/systemd/system/mdm.service" + local -r mdm_service_file="[Unit] After=network-online.target Wants=network-online.target @@ -258,80 +612,28 @@ RestartSec=1 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF - -echo "configuring aro-gateway service" -cat >/etc/sysconfig/aro-gateway </etc/systemd/system/aro-gateway.service </etc/systemd/system/download-$var-credentials.service </etc/systemd/system/download-$var-credentials.timer </usr/local/bin/download-credentials.sh </etc/systemd/system/watch-mdm-credentials.service </etc/systemd/system/watch-mdm-credentials.path </etc/systemd/system/mdsd.service.d/override.conf <<'EOF' -[Unit] + local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service' + local -r aro_dbtoken_service_file="[Unit] After=network-online.target -EOF +Wants=network-online.target + +[Service] +EnvironmentFile=/etc/sysconfig/aro-gateway +ExecStartPre=-/usr/bin/docker rm -f %N +ExecStartPre=/usr/bin/mkdir -p ${gateway_logdir} +ExecStart=/usr/bin/docker run \ + --hostname %H \ + --name %N \ + --rm \ + --cap-drop net_raw \ + -e ACR_RESOURCE_ID \ + -e DATABASE_ACCOUNT_NAME \ + -e AZURE_DBTOKEN_CLIENT_ID \ + -e DBTOKEN_URL \ + -e GATEWAY_DOMAINS \ + -e GATEWAY_FEATURES \ + -e MDM_ACCOUNT \ + -e MDM_NAMESPACE \ + -m 2g \ + -p 80:8080 \ + -p 8081:8081 \ + -p 443:8443 \ + -v /run/systemd/journal:/run/systemd/journal \ + -v /var/etw:/var/etw:z \ + -v ${gateway_logdir}:/ctr.log:z \ + \$RPIMAGE \ + gateway +ExecStop=/usr/bin/docker stop -t 3600 %N +TimeoutStopSec=3600 +Restart=always +RestartSec=1 +StartLimitInterval=0 + +[Install] +WantedBy=multi-user.target" + + write_file aro_dbtoken_service_filename aro_dbtoken_service_file true +} + +# configure_service_mdsd +configure_service_mdsd() { + log "starting" + + local -r mdsd_service_dir="/etc/systemd/system/mdsd.service.d" + mkdir "$mdsd_service_dir" + + local -r mdsd_override_conf_filename="$mdsd_service_dir/override.conf" + local -r mdsd_override_conf_file="[Unit] +After=network-online.target" -cat >/etc/default/mdsd </dev/null -c_rehash /usr/lib/ssl/certs + write_file default_mdsd_filename default_mdsd_file true -# we leave clientId blank as long as only 1 managed identity assigned to vmss -# if we have more than 1, we will need to populate with clientId used for off-node scanning -cat >/etc/default/vsa-nodescan-agent.config < "$filename" + else + log "Appending to $filename" + echo "$file_contents" >> "$filename" + fi +} + +# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots +reboot_vm() { + log "starting" + + configure_selinux "true" + (sleep 30 && log "rebooting vm now"; reboot) & +} + +# log is a wrapper for echo that includes the function name +log() { + local -r msg="${1:-"log message is empty"}" + local -r stack_level="${2:-1}" + echo "${FUNCNAME[${stack_level}]}: ${msg}" +} + +# abort is a wrapper for log that exits with an error code +abort() { + local -ri origin_stacklevel=2 + log "${1}" "$origin_stacklevel" + log "Exiting" + exit 1 +} + +export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}" -echo "rebooting" -restorecon -RF /var/log/* -(sleep 30; reboot) & +main "$@" diff --git a/pkg/deploy/generator/scripts/rpVMSS.sh b/pkg/deploy/generator/scripts/rpVMSS.sh index 290b534c1c9..3c00da1185c 100644 --- a/pkg/deploy/generator/scripts/rpVMSS.sh +++ b/pkg/deploy/generator/scripts/rpVMSS.sh @@ -1,48 +1,278 @@ #!/bin/bash -echo "setting ssh password authentication" -# We need to manually set PasswordAuthentication to true in order for the VMSS Access JIT to work -sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config -systemctl reload sshd.service +set -o errexit \ + -o nounset -#Adding retry logic to yum commands in order to avoid stalling out on resource locks -echo "running RHUI fix" -for attempt in {1..5}; do - yum update -y --disablerepo='*' --enablerepo='rhui-microsoft-azure*' && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +if [ "${DEBUG:-false}" == true ]; then + set -x +fi -echo "running yum update" -for attempt in {1..5}; do - yum -y -x WALinuxAgent -x WALinuxAgent-udev update --allowerasing && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +main() { + parse_run_options "$@" -echo "extending partition table" -# Linux block devices are inconsistently named -# it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here -physicalDisk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" -growpart "$physicalDisk" 2 -echo "extending filesystems" -lvextend -l +20%FREE /dev/rootvg/rootlv -xfs_growfs / + configure_sshd + configure_and_install_dnf_pkgs_repos + configure_disk_partitions + configure_logrotate + configure_selinux -lvextend -l +100%FREE /dev/rootvg/varlv -xfs_growfs /var + mkdir -p /var/log/journal + mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store -echo "importing rpm repositories" -rpm --import https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 -rpm --import https://packages.microsoft.com/keys/microsoft.asc + configure_firewalld_rules + pull_container_images + configure_system_services + reboot_vm +} -for attempt in {1..5}; do - yum -y install https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm && break - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +usage() { + local -n options="$1" + log "$(basename "$0") [$options] + -d Configure Disk Partitions + -p Configure rpm repositories, import required rpm keys, update & install packages with dnf + -l Configure logrotate.conf + -s Make selinux modifications required for ARO RP + -r Configure sshd - Allow password authenticaiton + -f Configure firewalld default zone rules + -u Configure systemd unit files for ARO RP + -i Pull container images + + Note: steps will be executed in the order that flags are provided + " +} -echo "configuring logrotate" -cat >/etc/logrotate.conf <<'EOF' -# see "man logrotate" for details +# parse_run_options takes all arguements passed to main and parses them +# allowing individual step(s) to be ran, rather than all steps +# +# This is useful for local testing, or possibly modifying the bootstrap execution via environment variables in the deployment pipeline +parse_run_options() { + # shellcheck disable=SC2206 + local -a options=(${1:-}) + if [ "${#options[@]}" -eq 0 ]; then + log "Running all steps" + return 0 + fi + + local OPTIND + local -r allowed_options="dplsrfui" + while getopts ${allowed_options} options; do + case "${options}" in + d) + log "Running step configure_disk_partitions" + configure_disk_partitions + ;; + p) + log "Running step configure_and_install_dnf_pkgs_repos" + configure_and_install_dnf_pkgs_repos + ;; + l) + log "Running configure_logrotate" + configure_logrotate + ;; + s) + log "Running configure_selinux" + configure_selinux + ;; + r) + log "Running configure_sshd" + configure_sshd + ;; + f) + log "Running configure_firewalld_rules" + configure_firewalld_rules + ;; + u) + log "Running pull_container_images & configure_system_services" + configure_system_services + ;; + i) + log "Running pull_container_images" + pull_container_images + ;; + *) + usage allowed_options + abort "Unkown option provided" + ;; + esac + done + + exit 0 +} + +# We need to configure PasswordAuthentication to yes in order for the VMSS Access JIT to work +configure_sshd() { + log "starting" + log "setting ssh password authentication" + sed -i 's/PasswordAuthentication no/PasswordAuthentication yes/g' /etc/ssh/sshd_config + + systemctl reload sshd.service + systemctl is-active --quiet sshd || abort "sshd failed to reload" +} + +# configure_and_install_dnf_pkgs_repos +configure_and_install_dnf_pkgs_repos() { + log "starting" + + # transaction attempt retry time in seconds + local -ri retry_wait_time=60 + configure_rhui_repo retry_wait_time + create_azure_rpm_repos retry_wait_time + + local -ar exclude_pkgs=( + "-x WALinuxAgent" + "-x WALinuxAgent-udev" + ) + + dnf_update_pkgs exclude_pkgs retry_wait_time + + local -ra rpm_keys=( + https://dl.fedoraproject.org/pub/epel/RPM-GPG-KEY-EPEL-8 + https://packages.microsoft.com/keys/microsoft.asc + ) + + rpm_import_keys rpm_keys retry_wait_time + + local -ra repo_rpm_pkgs=( + https://dl.fedoraproject.org/pub/epel/epel-release-latest-8.noarch.rpm + ) + + local -ra install_pkgs=( + clamav + azsec-clamav + azsec-monitor + azure-cli + azure-mdsd + azure-security + podman + podman-docker + openssl-perl + # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 + python3 + ) + + dnf_install_pkgs repo_rpm_pkgs retry_wait_time + dnf_install_pkgs install_pkgs retry_wait_time +} + +# configure_rhui_repo +configure_rhui_repo() { + log "starting" + + local -ra cmd=( + dnf + update + -y + --disablerepo='*' + --enablerepo='rhui-microsoft-azure*' + ) + + log "running RHUI package updates" + retry cmd "$1" +} + +# retry Adding retry logic to yum commands in order to avoid stalling out on resource locks +retry() { + local -n cmd_retry="$1" + local -n wait_time="$2" + + for attempt in {1..5}; do + log "attempt #${attempt} - ${FUNCNAME[2]}" + ${cmd_retry[@]} & + + wait $! && break + if [[ ${attempt} -lt 5 ]]; then + sleep "$wait_time" + else + abort "attempt #${attempt} - Failed to update packages" + fi + done +} + +# dnf_update_pkgs +dnf_update_pkgs() { + local -n excludes="$1" + log "starting" + + local -ra cmd=( + dnf + -y + ${excludes[@]} + update + --allowerasing + ) + + log "Updating all packages" + retry cmd "$2" +} + +# dnf_install_pkgs +dnf_install_pkgs() { + local -n pkgs="$1" + log "starting" + + local -ra cmd=( + dnf + -y + install + ${pkgs[@]} + ) + + log "Attempting to install packages: ${pkgs[*]}" + retry cmd "$2" +} + +# rpm_import_keys +rpm_import_keys() { + local -n keys="$1" + log "starting" + + + # shellcheck disable=SC2068 + for key in ${keys[@]}; do + if [ ${#keys[@]} -eq 0 ]; then + break + fi + local -a cmd=( + rpm + --import + -v + "$key" + ) + + log "attempt #$attempt - importing rpm repository key $key" + retry cmd "$2" && unset key + done +} + +# configure_disk_partitions +configure_disk_partitions() { + log "starting" + log "extending partition table" + + # Linux block devices are inconsistently named + # it's difficult to tie the lvm pv to the physical disk using /dev/disk files, which is why lvs is used here + physical_disk="$(lvs -o devices -a | head -n2 | tail -n1 | cut -d ' ' -f 3 | cut -d \( -f 1 | tr -d '[:digit:]')" + growpart "$physical_disk" 2 + + log "extending filesystems" + log "extending root lvm" + lvextend -l +20%FREE /dev/rootvg/rootlv + log "growing root filesystem" + xfs_growfs / + + log "extending var lvm" + lvextend -l +100%FREE /dev/rootvg/varlv + log "growing var filesystem" + xfs_growfs /var +} + +# configure_logrotate clobbers /etc/logrotate.conf +configure_logrotate() { + log "starting" + + local -r logrotate_conf_filename='/etc/logrotate.conf' + local -r logrotate_conf_file='# see "man logrotate" for details # rotate log files weekly weekly @@ -61,7 +291,7 @@ compress # RPM packages drop log rotation information into this directory include /etc/logrotate.d -# no packages own wtmp and btmp -- we'll rotate them here +# no packages own wtmp and btmp -- we will rotate them here /var/log/wtmp { monthly create 0664 root utmp @@ -74,12 +304,17 @@ include /etc/logrotate.d monthly create 0600 root utmp rotate 1 +}' + + write_file logrotate_conf_filename logrotate_conf_file true } -EOF -echo "configuring yum repository and running yum update" -cat >/etc/yum.repos.d/azure.repo <<'EOF' -[azure-cli] +# create_azure_rpm_repos creates /etc/yum.repos.d/azure.repo repository file +create_azure_rpm_repos() { + log "starting" + + local -r azure_repo_filename='/etc/yum.repos.d/azure.repo' + local -r azure_repo_file='[azure-cli] name=azure-cli baseurl=https://packages.microsoft.com/yumrepos/azure-cli enabled=yes @@ -89,63 +324,151 @@ gpgcheck=yes name=azurecore baseurl=https://packages.microsoft.com/yumrepos/azurecore enabled=yes -gpgcheck=no -EOF +gpgcheck=no' -semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" -mkdir -p /var/log/journal + write_file azure_repo_filename azure_repo_file true +} -for attempt in {1..5}; do -yum -y install clamav azsec-clamav azsec-monitor azure-cli azure-mdsd azure-security podman podman-docker openssl-perl python3 && break - # hack - we are installing python3 on hosts due to an issue with Azure Linux Extensions https://github.com/Azure/azure-linux-extensions/pull/1505 - if [[ ${attempt} -lt 5 ]]; then sleep 10; else exit 1; fi -done +# configure_selinux +configure_selinux() { + log "starting" + + local -r relabel="${1:-false}" -# https://access.redhat.com/security/cve/cve-2020-13401 -echo "applying firewall rules" -cat >/etc/sysctl.d/02-disable-accept-ra.conf <<'EOF' -net.ipv6.conf.all.accept_ra=0 -EOF + already_defined_ignore_error="File context for /var/log/journal(/.*)? already defined" + semanage fcontext -a -t var_log_t "/var/log/journal(/.*)?" || log "$already_defined_ignore_error" + chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent -cat >/etc/sysctl.d/01-disable-core.conf <<'EOF' -kernel.core_pattern = |/bin/true -EOF -sysctl --system + if "$relabel"; then + restorecon -RF /var/log/* || log "$already_defined_ignore_error" + fi +} + +# configure_firewalld_rules +configure_firewalld_rules() { + log "starting" + + # https://access.redhat.com/security/cve/cve-2020-13401 + local -r prefix="/etc/sysctl.d" + local -r disable_accept_ra_conf_filename="$prefix/02-disable-accept-ra.conf" + local -r disable_accept_ra_conf_file="net.ipv6.conf.all.accept_ra=0" -firewall-cmd --add-port=443/tcp --permanent -firewall-cmd --add-port=444/tcp --permanent -firewall-cmd --add-port=445/tcp --permanent -firewall-cmd --add-port=2222/tcp --permanent + write_file disable_accept_ra_conf_filename disable_accept_ra_conf_file true -export AZURE_CLOUD_NAME=$AZURECLOUDNAME + local -r disable_core_filename="$prefix/01-disable-core.conf" + local -r disable_core_file="kernel.core_pattern = |/bin/true + " + write_file disable_core_filename disable_core_file true -echo "logging into prod acr" -az login -i --allow-no-subscriptions + sysctl --system + + local -ra enable_ports=( + "443/tcp" + "444/tcp" + "445/tcp" + "2222/tcp" + ) + + log "Enabling ports ${enable_ports[*]} on default firewalld zone" + # shellcheck disable=SC2068 + for port in ${enable_ports[@]}; do + log "Enabling port $port now" + firewall-cmd "--add-port=$port" + done + + firewall-cmd --runtime-to-permanent +} -# Suppress emulation output for podman instead of docker for az acr compatability -mkdir -p /etc/containers/ -touch /etc/containers/nodocker +# pull_container_images +pull_container_images() { + log "starting" + + # The managed identity that the VM runs as only has a single roleassignment. + # This role assignment is ACRPull which is not necessarily present in the + # subscription we're deploying into. If the identity does not have any + # role assignments scoped on the subscription we're deploying into, it will + # not show on az login -i, which is why the below line is commented. + # az account set -s "$SUBSCRIPTIONID" + az login -i --allow-no-subscriptions + + # Suppress emulation output for podman instead of docker for az acr compatability + mkdir -p /etc/containers/ + mkdir -p /root/.docker + touch /etc/containers/nodocker + + # This name is used in the case that az acr login searches for this in it's environment + local -r REGISTRY_AUTH_FILE="/root/.docker/config.json" + + log "logging into prod acr" + az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" + + MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" + docker pull "$MDMIMAGE" + docker pull "$RPIMAGE" + docker pull "$FLUENTBITIMAGE" + + az logout +} -mkdir -p /root/.docker -REGISTRY_AUTH_FILE=/root/.docker/config.json az acr login --name "$(sed -e 's|.*/||' <<<"$ACRRESOURCEID")" +# configure_system_services creates, configures, and enables the following systemd services and timers +# services +# fluentbit +# mdm +# mdsd +# arp-rp +# aro-dbtoken +# aro-monitor +# aro-portal +configure_system_services() { + configure_service_fluentbit + configure_service_mdm + configure_timers_mdm_mdsd + configure_service_aro_rp + configure_service_aro_dbtoken + configure_service_aro_monitor + configure_service_aro_portal + configure_service_mdsd +} -MDMIMAGE="${RPIMAGE%%/*}/${MDMIMAGE##*/}" -docker pull "$MDMIMAGE" -docker pull "$RPIMAGE" -docker pull "$FLUENTBITIMAGE" +# enable_aro_services enables all services required for aro rp +enable_aro_services() { + log "starting" + + local -ra aro_services=( + "aro-dbtoken" + "aro-monitor" + "aro-portal" + "aro-rp" + "auoms" + "azsecd" + "azsecmond" + "mdsd" + "mdm" + "chronyd" + "fluentbit" + ) + log "enabling aro services ${aro_services[*]}" + # shellcheck disable=SC2068 + for service in ${aro_services[@]}; do + log "Enabling $service now" + systemctl enable "$service.service" + done +} -az logout +# configure_service_fluentbit +configure_service_fluentbit() { + log "starting" + log "configuring fluentbit service" -echo "configuring fluentbit service" -mkdir -p /etc/fluentbit/ -mkdir -p /var/lib/fluent + mkdir -p /etc/fluentbit/ + mkdir -p /var/lib/fluent -cat >/etc/fluentbit/fluentbit.conf <<'EOF' -[INPUT] - Name systemd - Tag journald - Systemd_Filter _COMM=aro - DB /var/lib/fluent/journaldb + local -r fluentbit_conf_filename='/etc/fluentbit/fluentbit.conf' + local -r fluentbit_conf_file="[INPUT] +Name systemd +Tag journald +Systemd_Filter _COMM=aro +DB /var/lib/fluent/journaldb [FILTER] Name modify @@ -173,13 +496,18 @@ cat >/etc/fluentbit/fluentbit.conf <<'EOF' [OUTPUT] Name forward Match * - Port 29230 -EOF + Port 29230" + + write_file fluentbit_conf_filename fluentbit_conf_file true -echo "FLUENTBITIMAGE=$FLUENTBITIMAGE" >/etc/sysconfig/fluentbit + local -r sysconfig_fluentbit_filename='/etc/sysconfig/fluentbit' + local -r sysconfig_fluentbit_file="FLUENTBITIMAGE=$FLUENTBITIMAGE" -cat >/etc/systemd/system/fluentbit.service <<'EOF' -[Unit] + write_file sysconfig_fluentbit_filename sysconfig_fluentbit_file true + + local -r fluentbit_service_filename='/etc/systemd/system/fluentbit.service' + + local -r fluentbit_service_file="[Unit] After=network-online.target Wants=network-online.target StartLimitIntervalSec=0 @@ -209,28 +537,61 @@ RestartSec=5 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" -mkdir /etc/aro-rp -base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem -if [[ -n "$ARMAPICABUNDLE" ]]; then - base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem -fi -chown -R 1000:1000 /etc/aro-rp + write_file fluentbit_conf_filename fluentbit_conf_file true +} + +# configure_certs +configure_certs() { + log "starting" + + mkdir /etc/aro-rp + base64 -d <<<"$ADMINAPICABUNDLE" >/etc/aro-rp/admin-ca-bundle.pem + if [[ -n "$ARMAPICABUNDLE" ]]; then + base64 -d <<<"$ARMAPICABUNDLE" >/etc/aro-rp/arm-ca-bundle.pem + fi + chown -R 1000:1000 /etc/aro-rp + + # setting MONITORING_GCS_AUTH_ID_TYPE=AuthKeyVault seems to have caused mdsd not + # to honour SSL_CERT_FILE any more, heaven only knows why. + mkdir -p /usr/lib/ssl/certs + csplit -f /usr/lib/ssl/certs/cert- -b %03d.pem /etc/pki/tls/certs/ca-bundle.crt /^$/1 "{*}" >/dev/null + c_rehash /usr/lib/ssl/certs + +# we leave clientId blank as long as only 1 managed identity assigned to vmss +# if we have more than 1, we will need to populate with clientId used for off-node scanning + local -r nodescan_agent_filename="/etc/default/vsa-nodescan-agent.config" + local -r nodescan_agent_file="{ + \"Nice\": 19, + \"Timeout\": 10800, + \"ClientId\": \"\", + \"TenantId\": $AZURESECPACKVSATENANTID, + \"QualysStoreBaseUrl\": $AZURESECPACKQUALYSURL, + \"ProcessTimeout\": 300, + \"CommandDelay\": 0 + }" + + write_file nodescan_agent_filename nodescan_agent_file true +} -echo "configuring mdm service" -cat >/etc/sysconfig/mdm </etc/systemd/system/mdm.service <<'EOF' -[Unit] + mkdir -p /var/etw + local -r mdm_service_filename="/etc/systemd/system/mdm.service" + local -r mdm_service_file="[Unit] After=network-online.target Wants=network-online.target @@ -261,12 +622,157 @@ RestartSec=1 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" + + write_file mdm_service_filename mdm_service_file true +} + +# configure_timers_mdm_mdsd +configure_timers_mdm_mdsd() { + log "starting" + + for var in "mdsd" "mdm"; do + local download_creds_service_filename="/etc/systemd/system/download-$var-credentials.service" + local download_creds_service_file="[Unit] +Description=Periodic $var credentials refresh + +[Service] +Type=oneshot +ExecStart=/usr/local/bin/download-credentials.sh $var" + + write_file download_creds_service_filename download_creds_service_file true + + local download_creds_timer_filename="/etc/systemd/system/download-$var-credentials.timer" + local download_creds_timer_file="[Unit] +Description=Periodic $var credentials refresh +After=network-online.target +Wants=network-online.target + +[Timer] +OnBootSec=0min +OnCalendar=0/12:00:00 +AccuracySec=5s + +[Install] +WantedBy=timers.target" + + write_file download_creds_timer_filename download_creds_timer_file true + done + + local -r download_creds_script_filename="/usr/local/bin/download-credentials.sh" + local -r download_creds_script_file="#!/bin/bash +set -eu + +COMPONENT=\$1 +echo \"Download \$COMPONENT credentials\" + +TEMP_DIR=\"\$(mktemp -d)\" +export AZURE_CONFIG_DIR=\"\$(mktemp -d)\" + +echo \"Logging into Azure...\" +RETRIES=3 +while [[ \$RETRIES -gt 0 ]]; do + if az login -i --allow-no-subscriptions + then + echo \"az login successful\" + break + else + echo \"az login failed. Retrying...\" + let RETRIES-=1 + sleep 5 + fi +done + +trap \"cleanup\" EXIT + +cleanup() { + az logout + [[ \$TEMP_DIR =~ /tmp/.+ ]] && rm -rf \$TEMP_DIR + [[ \$AZURE_CONFIG_DIR =~ /tmp/.+ ]] && rm -rf \$AZURE_CONFIG_DIR +} + +if [[ \$COMPONENT = \"mdm\" ]]; then + CURRENT_CERT_FILE=\"/etc/mdm.pem\" +elif [[ \$COMPONENT\ = \"mdsd\" ]]; then + CURRENT_CERT_FILE=\"/var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem\" +else + echo Invalid usage && exit 1 +fi + +SECRET_NAME=\"rp-\${COMPONENT}\" +NEW_CERT_FILE=\"\$TEMP_DIR/\$COMPONENT.pem\" +for attempt in {1..5}; do + az keyvault \ + secret \ + download \ + --file \"\$NEW_CERT_FILE\" \ + --id \"https://$KEYVAULTPREFIX-svc.$KEYVAULTDNSSUFFIX/secrets/\$SECRET_NAME\" \ + && break + if [[ \$attempt -lt 5 ]]; then sleep 10; else exit 1; fi +done + +if [ -f \$NEW_CERT_FILE ]; then + if [[ \$COMPONENT = \"mdsd\" ]]; then + chown syslog:syslog \$NEW_CERT_FILE + else + sed -i -ne '1,/END CERTIFICATE/ p' \$NEW_CERT_FILE + fi + + new_cert_sn=\"\$(openssl x509 -in \"\$NEW_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\" + current_cert_sn=\"\$(openssl x509 -in \"\$CURRENT_CERT_FILE\" -noout -serial | awk -F= '{print \$2}')\" + if [[ ! -z \$new_cert_sn ]] && [[ \$new_cert_sn != \"\$current_cert_sn\" ]]; then + echo updating certificate for \$COMPONENT + chmod 0600 \$NEW_CERT_FILE + mv \$NEW_CERT_FILE \$CURRENT_CERT_FILE + fi +else + echo Failed to refresh certificate for \$COMPONENT && exit 1 +fi" + + write_file download_creds_script_filename download_creds_script_file true + + chmod u+x /usr/local/bin/download-credentials.sh + + systemctl enable download-mdsd-credentials.timer + systemctl enable download-mdm-credentials.timer + + /usr/local/bin/download-credentials.sh mdsd + /usr/local/bin/download-credentials.sh mdm + + local -r MDSDCERTIFICATESAN="$(openssl x509 -in /var/lib/waagent/Microsoft.Azure.KeyVault.Store/mdsd.pem -noout -subject | sed -e 's/.*CN = //')" + local -r watch_mdm_creds_service_filename="/etc/systemd/system/watch-mdm-credentials.service" + local -r watch_mdm_creds_service_file="[Unit] +Description=Watch for changes in mdm.pem and restarts the mdm service + +[Service] +Type=oneshot +ExecStart=/usr/bin/systemctl restart mdm.service + +[Install] +WantedBy=multi-user.target" + + write_file watch_mdm_creds_service_filename watch_mdm_creds_service_file true + + local -r watch_mdm_creds_path_filename='/etc/systemd/system/watch-mdm-credentials.path' + local -r watch_mdm_creds_path_file='[Path] +PathModified=/etc/mdm.pem + +[Install] +WantedBy=multi-user.target' + + write_file watch_mdm_creds_path_filename watch_mdm_creds_path_file true -echo "configuring aro-rp service" -cat >/etc/sysconfig/aro-rp </etc/systemd/system/aro-rp.service <<'EOF' -[Unit] + local -r aro_rp_service_filename='/etc/systemd/system/aro-rp.service' + local -r aro_rp_service_file="[Unit] After=network-online.target Wants=network-online.target @@ -345,22 +852,28 @@ RestartSec=1 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" -echo "configuring aro-dbtoken service" -cat >/etc/sysconfig/aro-dbtoken </etc/systemd/system/aro-dbtoken.service <<'EOF' -[Unit] + local -r aro_dbtoken_service_filename='/etc/systemd/system/aro-dbtoken.service' + local -r aro_dbtoken_service_file="[Unit] After=network-online.target Wants=network-online.target @@ -391,14 +904,20 @@ RestartSec=1 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" -# DOMAIN_NAME, CLUSTER_MDSD_ACCOUNT, CLUSTER_MDSD_CONFIG_VERSION, GATEWAY_DOMAINS, GATEWAY_RESOURCEGROUP, MDSD_ENVIRONMENT CLUSTER_MDSD_NAMESPACE -# are not used, but can't easily be refactored out. Should be revisited in the future. -echo "configuring aro-monitor service" -cat >/etc/sysconfig/aro-monitor </etc/systemd/system/aro-monitor.service <<'EOF' -[Unit] + local -r aro_monitor_service_filename='/etc/systemd/system/aro-monitor.service' + local -r aro_monitor_service_file="[Unit] After=network-online.target Wants=network-online.target @@ -452,12 +972,17 @@ RestartSec=1 StartLimitInterval=0 [Install] -WantedBy=multi-user.target -EOF +WantedBy=multi-user.target" -echo "configuring aro-portal service" -cat >/etc/sysconfig/aro-portal </etc/systemd/system/aro-portal.service <<'EOF' -[Unit] + write_file aro_portal_service_conf_filename aro_portal_service_conf_file true + + local -r aro_portal_service_filename='/etc/systemd/system/aro-portal.service' + local -r aro_portal_service_file="[Unit] After=network-online.target Wants=network-online.target StartLimitInterval=0 @@ -501,147 +1027,27 @@ Restart=always RestartSec=1 [Install] -WantedBy=multi-user.target -EOF - -echo "configuring mdsd and mdm services" -chcon -R system_u:object_r:var_log_t:s0 /var/opt/microsoft/linuxmonagent - -mkdir -p /var/lib/waagent/Microsoft.Azure.KeyVault.Store - -for var in "mdsd" "mdm"; do -cat >/etc/systemd/system/download-$var-credentials.service </etc/systemd/system/download-$var-credentials.timer </usr/local/bin/download-credentials.sh </etc/systemd/system/watch-mdm-credentials.service </etc/systemd/system/watch-mdm-credentials.path </etc/systemd/system/mdsd.service.d/override.conf <<'EOF' -[Unit] -After=network-online.target -EOF - -cat >/etc/default/mdsd </dev/null -c_rehash /usr/lib/ssl/certs + write_file default_mdsd_filename default_mdsd_file true -# we leave clientId blank as long as only 1 managed identity assigned to vmss -# if we have more than 1, we will need to populate with clientId used for off-node scanning -cat >/etc/default/vsa-nodescan-agent.config < "$filename" + else + log "Appending to $filename" + echo "$file_contents" >> "$filename" + fi +} + +# reboot_vm restores all selinux file contexts, waits 30 seconds then reboots +reboot_vm() { + log "starting" + + configure_selinux "true" + (sleep 30 && log "rebooting vm now"; reboot) & +} + +# log is a wrapper for echo that includes the function name +log() { + local -r msg="${1:-"log message is empty"}" + local -r stack_level="${2:-1}" + echo "${FUNCNAME[${stack_level}]}: ${msg}" +} + +# abort is a wrapper for log that exits with an error code +abort() { + local -ri origin_stacklevel=2 + log "${1}" "$origin_stacklevel" + log "Exiting" + exit 1 +} + +export AZURE_CLOUD_NAME="${AZURECLOUDNAME:?"Failed to carry over variables"}" -echo "rebooting" -restorecon -RF /var/log/* -(sleep 30; reboot) & +main "$@"