@@ -1,4 +1,7 @@
 # Scale down cephfs clients to prevent mds corruption issues
+#
+# Copyright 2021 Hewlett Packard Enterprise Development LP
+#
 
 cephfs_replica_counts_file="/etc/cray/ceph/cephfs_replica_counts"
 
@@ -7,10 +10,11 @@ function scale_down_cephfs_clients () {
   backup_name="$now-snapshot"
 
   echo "Taking a snapshot of nexus pvc ($backup_name)"
-  kubectl -n nexus exec -it $(kubectl get po -n nexus -l 'app=nexus' -o json | jq -r '.items[].metadata.name') -c nexus -- /bin/sh -c "mkdir /nexus-data/.snap/$backup_name"
+  output=$(kubectl -n nexus exec -it $(kubectl get po -n nexus -l 'app=nexus' -o json | jq -r '.items[].metadata.name') -c nexus -- /bin/sh -c "mkdir /nexus-data/.snap/$backup_name" 2>&1)
+  if [[ "$?" -ne 0 ]]; then
+    echo "Didn't find nexus pod to take snapshot from -- continuing..."
+  fi
 
-  echo "Sleeping 10 seconds after taking nexus pvc snapshot"
-  sleep 10
 
   rm -f $cephfs_replica_counts_file
   cnt=0
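
An aside on the mkdir in the hunk above: on a CephFS-backed volume, creating a directory under the special .snap directory takes a snapshot of the filesystem at that moment, which is why a plain mkdir is enough to back up the nexus PVC. As a minimal, illustrative sketch (not part of this change), the snapshot could later be listed or removed from the same pod; the pod lookup mirrors the command above, and $backup_name is the snapshot name chosen there:

# Illustrative sketch only; cleaning up the snapshot is not part of this commit.
nexus_pod=$(kubectl get po -n nexus -l 'app=nexus' -o json | jq -r '.items[].metadata.name')
# List existing CephFS snapshots of the nexus PVC.
kubectl -n nexus exec -it "$nexus_pod" -c nexus -- /bin/sh -c "ls /nexus-data/.snap"
# Removing a directory entry under .snap deletes that snapshot.
kubectl -n nexus exec -it "$nexus_pod" -c nexus -- /bin/sh -c "rmdir /nexus-data/.snap/$backup_name"
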
@@ -26,8 +30,20 @@ function scale_down_cephfs_clients () {
     kubectl get deployment -n $ns $deployment -o yaml | grep -q "claimName: $pvc_name"
     if [[ "$?" -eq 0 ]]; then
       num_replicas=$(kubectl -n $ns get deployment $deployment -o json | jq -r '.spec.replicas')
+      if [[ "$num_replicas" -eq 0 ]]; then
+        #
+        # We may have already scaled this deployment down or are re-running
+        # the upgrade script. Let's be careful not to write zeros in the
+        # replica count file.
+        #
+        if [ "$deployment" == "cray-ipxe" ]; then
+          num_replicas=3
+        else
+          num_replicas=1
+        fi
+      fi
       echo "${ns}_${deployment} $num_replicas" >> $cephfs_replica_counts_file
-      echo "Scaling $deployment deployment in namespace $ns from $num_replicas to zero"
+      echo "Ensuring $deployment deployment in namespace $ns is scaled from $num_replicas to zero"
       kubectl scale deployment -n $ns $deployment --replicas=0
     fi
   done
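
The comment added in the last hunk explains why zero must never be written to the replica count file: each line records "<namespace>_<deployment> <replicas>", presumably so a later step of the upgrade can scale everything back up, and a recorded zero would leave that deployment scaled down for good. As a minimal sketch of how such a file could be consumed, where the function name, the namespace in the example line, and the error handling are assumptions rather than code from this commit:

# Hypothetical sketch only: the real scale-up logic lives elsewhere in the
# upgrade scripts and may differ from this.
function scale_up_cephfs_clients () {
  cephfs_replica_counts_file="/etc/cray/ceph/cephfs_replica_counts"

  if [[ ! -f "$cephfs_replica_counts_file" ]]; then
    echo "No replica count file found at $cephfs_replica_counts_file -- nothing to scale up"
    return 0
  fi

  # Each line has the form "<namespace>_<deployment> <replicas>", for example
  # "services_cray-ipxe 3", matching what scale_down_cephfs_clients() wrote.
  while read -r name replicas; do
    # Namespaces and deployment names cannot contain underscores, so splitting
    # on the first underscore recovers both halves safely.
    ns="${name%%_*}"
    deployment="${name#*_}"
    echo "Scaling $deployment deployment in namespace $ns back to $replicas replicas"
    kubectl scale deployment -n "$ns" "$deployment" --replicas="$replicas"
  done < "$cephfs_replica_counts_file"
}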