master-helper.sh 8.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212
  1. #!/usr/bin/env bash
  2. # Copyright 2016 The Kubernetes Authors.
  3. #
  4. # Licensed under the Apache License, Version 2.0 (the "License");
  5. # you may not use this file except in compliance with the License.
  6. # You may obtain a copy of the License at
  7. #
  8. # http://www.apache.org/licenses/LICENSE-2.0
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. # A library of helper functions and constant for GCI distro
  16. source "${KUBE_ROOT}/cluster/gce/gci/helper.sh"
  17. # create-master-instance creates the master instance. If called with
  18. # an argument, the argument is used as the name to a reserved IP
  19. # address for the master. (In the case of upgrade/repair, we re-use
  20. # the same IP.)
  21. #
  22. # It requires a whole slew of assumed variables, partially due to to
  23. # the call to write-master-env. Listing them would be rather
  24. # futile. Instead, we list the required calls to ensure any additional
  25. #
  26. # variables are set:
  27. # ensure-temp-dir
  28. # detect-project
  29. # get-bearer-token
  30. function create-master-instance {
  31. local address=""
  32. [[ -n ${1:-} ]] && address="${1}"
  33. local internal_address=""
  34. [[ -n ${2:-} ]] && internal_address="${2}"
  35. write-master-env
  36. ensure-gci-metadata-files
  37. create-master-instance-internal "${MASTER_NAME}" "${address}" "${internal_address}"
  38. }
  39. function replicate-master-instance() {
  40. local existing_master_zone="${1}"
  41. local existing_master_name="${2}"
  42. local existing_master_replicas="${3}"
  43. local kube_env="$(get-metadata "${existing_master_zone}" "${existing_master_name}" kube-env)"
  44. # Substitute INITIAL_ETCD_CLUSTER to enable etcd clustering.
  45. kube_env="$(echo "${kube_env}" | grep -v "INITIAL_ETCD_CLUSTER")"
  46. kube_env="$(echo -e "${kube_env}\nINITIAL_ETCD_CLUSTER: '${existing_master_replicas},${REPLICA_NAME}'")"
  47. # Substitute INITIAL_ETCD_CLUSTER_STATE
  48. kube_env="$(echo "${kube_env}" | grep -v "INITIAL_ETCD_CLUSTER_STATE")"
  49. kube_env="$(echo -e "${kube_env}\nINITIAL_ETCD_CLUSTER_STATE: 'existing'")"
  50. ETCD_CA_KEY="$(echo "${kube_env}" | grep "ETCD_CA_KEY" | sed "s/^.*: '//" | sed "s/'$//")"
  51. ETCD_CA_CERT="$(echo "${kube_env}" | grep "ETCD_CA_CERT" | sed "s/^.*: '//" | sed "s/'$//")"
  52. create-etcd-certs "${REPLICA_NAME}" "${ETCD_CA_CERT}" "${ETCD_CA_KEY}"
  53. kube_env="$(echo "${kube_env}" | grep -v "ETCD_PEER_KEY")"
  54. kube_env="$(echo -e "${kube_env}\nETCD_PEER_KEY: '${ETCD_PEER_KEY_BASE64}'")"
  55. kube_env="$(echo "${kube_env}" | grep -v "ETCD_PEER_CERT")"
  56. kube_env="$(echo -e "${kube_env}\nETCD_PEER_CERT: '${ETCD_PEER_CERT_BASE64}'")"
  57. local master_certs="$(get-metadata "${existing_master_zone}" "${existing_master_name}" kube-master-certs)"
  58. ETCD_APISERVER_CA_KEY="$(echo "${master_certs}" | grep "ETCD_APISERVER_CA_KEY" | sed "s/^.*: '//" | sed "s/'$//")"
  59. ETCD_APISERVER_CA_CERT="$(echo "${master_certs}" | grep "ETCD_APISERVER_CA_CERT" | sed "s/^.*: '//" | sed "s/'$//")"
  60. create-etcd-apiserver-certs "etcd-${REPLICA_NAME}" "${REPLICA_NAME}" "${ETCD_APISERVER_CA_CERT}" "${ETCD_APISERVER_CA_KEY}"
  61. master_certs="$(echo "${master_certs}" | grep -v "ETCD_APISERVER_SERVER_KEY")"
  62. master_certs="$(echo -e "${master_certs}\nETCD_APISERVER_SERVER_KEY: '${ETCD_APISERVER_SERVER_KEY_BASE64}'")"
  63. master_certs="$(echo "${master_certs}" | grep -v "ETCD_APISERVER_SERVER_CERT")"
  64. master_certs="$(echo -e "${master_certs}\nETCD_APISERVER_SERVER_CERT: '${ETCD_APISERVER_SERVER_CERT_BASE64}'")"
  65. master_certs="$(echo "${master_certs}" | grep -v "ETCD_APISERVER_CLIENT_KEY")"
  66. master_certs="$(echo -e "${master_certs}\nETCD_APISERVER_CLIENT_KEY: '${ETCD_APISERVER_CLIENT_KEY_BASE64}'")"
  67. master_certs="$(echo "${master_certs}" | grep -v "ETCD_APISERVER_CLIENT_CERT")"
  68. master_certs="$(echo -e "${master_certs}\nETCD_APISERVER_CLIENT_CERT: '${ETCD_APISERVER_CLIENT_CERT_BASE64}'")"
  69. echo "${kube_env}" > ${KUBE_TEMP}/master-kube-env.yaml
  70. echo "${master_certs}" > ${KUBE_TEMP}/kube-master-certs.yaml
  71. get-metadata "${existing_master_zone}" "${existing_master_name}" cluster-name > "${KUBE_TEMP}/cluster-name.txt"
  72. get-metadata "${existing_master_zone}" "${existing_master_name}" gci-update-strategy > "${KUBE_TEMP}/gci-update.txt"
  73. get-metadata "${existing_master_zone}" "${existing_master_name}" gci-ensure-gke-docker > "${KUBE_TEMP}/gci-ensure-gke-docker.txt"
  74. get-metadata "${existing_master_zone}" "${existing_master_name}" gci-docker-version > "${KUBE_TEMP}/gci-docker-version.txt"
  75. get-metadata "${existing_master_zone}" "${existing_master_name}" cluster-location > "${KUBE_TEMP}/cluster-location.txt"
  76. create-master-instance-internal "${REPLICA_NAME}"
  77. }
  78. # run-gcloud-command runs a given command over ssh with retries.
  79. function run-gcloud-command() {
  80. local master_name="${1}"
  81. local zone="${2}"
  82. local command="${3}"
  83. local retries=5
  84. local sleep_sec=10
  85. local result=""
  86. for attempt in $(seq 1 ${retries}); do
  87. if result=$(gcloud compute ssh "${master_name}" --project "${PROJECT}" --zone "${zone}" --command "${command}" -- -oConnectTimeout=60 2>&1); then
  88. echo "Successfully executed '${command}' on ${master_name}"
  89. return 0
  90. fi
  91. sleep "${sleep_sec}"
  92. done
  93. echo "Failed to execute '${command}' on ${master_name} despite ${retries} attempts" >&2
  94. echo "Last attempt failed with: ${result}" >&2
  95. return 1
  96. }
  97. function create-master-instance-internal() {
  98. local gcloud="gcloud"
  99. local retries=5
  100. local sleep_sec=10
  101. if [[ "${MASTER_SIZE##*-}" -ge 64 ]]; then # remove everything up to last dash (inclusive)
  102. # Workaround for #55777
  103. retries=30
  104. sleep_sec=60
  105. fi
  106. local -r master_name="${1}"
  107. local -r address="${2:-}"
  108. local -r internal_address="${3:-}"
  109. local preemptible_master=""
  110. if [[ "${PREEMPTIBLE_MASTER:-}" == "true" ]]; then
  111. preemptible_master="--preemptible --maintenance-policy TERMINATE"
  112. fi
  113. local enable_ip_aliases
  114. if [[ "${NODE_IPAM_MODE:-}" == "CloudAllocator" ]]; then
  115. enable_ip_aliases=true
  116. else
  117. enable_ip_aliases=false
  118. fi
  119. local network=$(make-gcloud-network-argument \
  120. "${NETWORK_PROJECT}" "${REGION}" "${NETWORK}" "${SUBNETWORK:-}" \
  121. "${address:-}" "${enable_ip_aliases:-}" "${IP_ALIAS_SIZE:-}")
  122. local metadata="kube-env=${KUBE_TEMP}/master-kube-env.yaml"
  123. metadata="${metadata},kubelet-config=${KUBE_TEMP}/master-kubelet-config.yaml"
  124. metadata="${metadata},user-data=${KUBE_ROOT}/cluster/gce/gci/master.yaml"
  125. metadata="${metadata},configure-sh=${KUBE_ROOT}/cluster/gce/gci/configure.sh"
  126. metadata="${metadata},cluster-location=${KUBE_TEMP}/cluster-location.txt"
  127. metadata="${metadata},cluster-name=${KUBE_TEMP}/cluster-name.txt"
  128. metadata="${metadata},gci-update-strategy=${KUBE_TEMP}/gci-update.txt"
  129. metadata="${metadata},gci-ensure-gke-docker=${KUBE_TEMP}/gci-ensure-gke-docker.txt"
  130. metadata="${metadata},gci-docker-version=${KUBE_TEMP}/gci-docker-version.txt"
  131. metadata="${metadata},kube-master-certs=${KUBE_TEMP}/kube-master-certs.yaml"
  132. metadata="${metadata},cluster-location=${KUBE_TEMP}/cluster-location.txt"
  133. metadata="${metadata},${MASTER_EXTRA_METADATA}"
  134. local disk="name=${master_name}-pd"
  135. disk="${disk},device-name=master-pd"
  136. disk="${disk},mode=rw"
  137. disk="${disk},boot=no"
  138. disk="${disk},auto-delete=no"
  139. for attempt in $(seq 1 ${retries}); do
  140. if result=$(${gcloud} compute instances create "${master_name}" \
  141. --project "${PROJECT}" \
  142. --zone "${ZONE}" \
  143. --machine-type "${MASTER_SIZE}" \
  144. --image-project="${MASTER_IMAGE_PROJECT}" \
  145. --image "${MASTER_IMAGE}" \
  146. --tags "${MASTER_TAG}" \
  147. --scopes "storage-ro,compute-rw,monitoring,logging-write" \
  148. --metadata-from-file "${metadata}" \
  149. --disk "${disk}" \
  150. --boot-disk-size "${MASTER_ROOT_DISK_SIZE}" \
  151. ${MASTER_MIN_CPU_ARCHITECTURE:+"--min-cpu-platform=${MASTER_MIN_CPU_ARCHITECTURE}"} \
  152. ${preemptible_master} \
  153. ${network} 2>&1); then
  154. echo "${result}" >&2
  155. if [[ -n "${internal_address:-}" ]]; then
  156. attach-internal-master-ip "${master_name}" "${ZONE}" "${internal_address}"
  157. fi
  158. return 0
  159. else
  160. echo "${result}" >&2
  161. if [[ ! "${result}" =~ "try again later" ]]; then
  162. echo "Failed to create master instance due to non-retryable error" >&2
  163. return 1
  164. fi
  165. sleep $sleep_sec
  166. fi
  167. done
  168. echo "Failed to create master instance despite ${retries} attempts" >&2
  169. return 1
  170. }
  171. function get-metadata() {
  172. local zone="${1}"
  173. local name="${2}"
  174. local key="${3}"
  175. gcloud compute ssh "${name}" \
  176. --project "${PROJECT}" \
  177. --zone "${zone}" \
  178. --command "curl \"http://metadata.google.internal/computeMetadata/v1/instance/attributes/${key}\" -H \"Metadata-Flavor: Google\"" 2>/dev/null
  179. }