829 lines
		
	
	
		
			23 KiB
		
	
	
	
		
			Bash
		
	
	
		
			Executable File
		
	
	
	
	
			
		
		
	
	
			829 lines
		
	
	
		
			23 KiB
		
	
	
	
		
			Bash
		
	
	
		
			Executable File
		
	
	
	
	
| #!/usr/bin/env bash
 | |
| set -e
 | |
| 
 | |
| here=$(dirname "$0")
 | |
| # shellcheck source=net/common.sh
 | |
| source "$here"/common.sh
 | |
| 
 | |
| cloudProvider=$(basename "$0" .sh)
 | |
| bootDiskType=""
 | |
| case $cloudProvider in
 | |
| gce)
 | |
|   # shellcheck source=net/scripts/gce-provider.sh
 | |
|   source "$here"/scripts/gce-provider.sh
 | |
| 
 | |
|   cpuBootstrapLeaderMachineType="--custom-cpu 12 --custom-memory 32GB --min-cpu-platform Intel%20Skylake"
 | |
|   gpuBootstrapLeaderMachineType="$cpuBootstrapLeaderMachineType --accelerator count=1,type=nvidia-tesla-p100"
 | |
|   bootstrapLeaderMachineType=$cpuBootstrapLeaderMachineType
 | |
|   fullNodeMachineType=$cpuBootstrapLeaderMachineType
 | |
|   clientMachineType="--custom-cpu 16 --custom-memory 20GB"
 | |
|   blockstreamerMachineType="--machine-type n1-standard-8"
 | |
|   replicatorMachineType="--custom-cpu 4 --custom-memory 16GB"
 | |
|   ;;
 | |
| ec2)
 | |
|   # shellcheck source=net/scripts/ec2-provider.sh
 | |
|   source "$here"/scripts/ec2-provider.sh
 | |
| 
 | |
|   cpuBootstrapLeaderMachineType=c5.2xlarge
 | |
| 
 | |
|   # NOTE: At this time only the p3dn.24xlarge EC2 instance type has GPU and
 | |
|   #       AVX-512 support.  The default, p2.xlarge, does not support
 | |
|   #       AVX-512
 | |
|   gpuBootstrapLeaderMachineType=p2.xlarge
 | |
|   bootstrapLeaderMachineType=$cpuBootstrapLeaderMachineType
 | |
|   fullNodeMachineType=$cpuBootstrapLeaderMachineType
 | |
|   clientMachineType=c5.2xlarge
 | |
|   blockstreamerMachineType=c5.2xlarge
 | |
|   replicatorMachineType=c5.xlarge
 | |
|   ;;
 | |
| azure)
 | |
|   # shellcheck source=net/scripts/azure-provider.sh
 | |
|   source "$here"/scripts/azure-provider.sh
 | |
| 
 | |
|   # TODO: Dial in machine types for Azure
 | |
|   cpuBootstrapLeaderMachineType=Standard_D16s_v3
 | |
|   gpuBootstrapLeaderMachineType=Standard_NC12
 | |
|   bootstrapLeaderMachineType=$cpuBootstrapLeaderMachineType
 | |
|   fullNodeMachineType=$cpuBootstrapLeaderMachineType
 | |
|   clientMachineType=Standard_D16s_v3
 | |
|   blockstreamerMachineType=Standard_D16s_v3
 | |
|   replicatorMachineType=Standard_D4s_v3
 | |
|   ;;
 | |
| colo)
 | |
|   # shellcheck source=net/scripts/colo-provider.sh
 | |
|   source "$here"/scripts/colo-provider.sh
 | |
| 
 | |
|   cpuBootstrapLeaderMachineType=0
 | |
|   gpuBootstrapLeaderMachineType=1
 | |
|   bootstrapLeaderMachineType=$cpuBootstrapLeaderMachineType
 | |
|   fullNodeMachineType=$cpuBootstrapLeaderMachineType
 | |
|   clientMachineType=0
 | |
|   blockstreamerMachineType=0
 | |
|   replicatorMachineType=0
 | |
|   ;;
 | |
| *)
 | |
|   echo "Error: Unknown cloud provider: $cloudProvider"
 | |
|   ;;
 | |
| esac
 | |
| 
 | |
| 
 | |
| prefix=testnet-dev-${USER//[^A-Za-z0-9]/}
 | |
| additionalFullNodeCount=2
 | |
| clientNodeCount=1
 | |
| replicatorNodeCount=0
 | |
| blockstreamer=false
 | |
| fullNodeBootDiskSizeInGb=500
 | |
| clientBootDiskSizeInGb=75
 | |
| replicatorBootDiskSizeInGb=500
 | |
| fullNodeAdditionalDiskSizeInGb=
 | |
| externalNodes=false
 | |
| failOnValidatorBootupFailure=true
 | |
| 
 | |
| publicNetwork=false
 | |
| letsEncryptDomainName=
 | |
| enableGpu=false
 | |
| customAddress=
 | |
| zones=()
 | |
| 
 | |
| containsZone() {
 | |
|   local e match="$1"
 | |
|   shift
 | |
|   for e; do [[ "$e" == "$match" ]] && return 0; done
 | |
|   return 1
 | |
| }
 | |
| 
 | |
| usage() {
 | |
|   exitcode=0
 | |
|   if [[ -n "$1" ]]; then
 | |
|     exitcode=1
 | |
|     echo "Error: $*"
 | |
|   fi
 | |
|   cat <<EOF
 | |
| usage: $0 [create|config|delete] [common options] [command-specific options]
 | |
| 
 | |
| Manage testnet instances
 | |
| 
 | |
|  create - create a new testnet (implies 'config')
 | |
|  config - configure the testnet and write a config file describing it
 | |
|  delete - delete the testnet
 | |
|  info   - display information about the currently configured testnet
 | |
|  status - display status information of all resources
 | |
| 
 | |
|  common options:
 | |
|    -p [prefix]      - Optional common prefix for instance names to avoid
 | |
|                       collisions (default: $prefix)
 | |
|    -z [zone]        - Zone(s) for the nodes (default: $(cloud_DefaultZone))
 | |
|                       If specified multiple times, the fullnodes will be evenly
 | |
|                       distributed over all specified zones and
 | |
|                       client/blockstreamer nodes will be created in the first
 | |
|                       zone
 | |
|    -x               - append to the existing configuration instead of creating a
 | |
|                       new configuration
 | |
|    --allow-boot-failures
 | |
|                     - Discard from config validator nodes that didn't bootup
 | |
|                       successfully
 | |
| 
 | |
|  create-specific options:
 | |
|    -n [number]      - Number of additional fullnodes (default: $additionalFullNodeCount)
 | |
|    -c [number]      - Number of client nodes (default: $clientNodeCount)
 | |
|    -r [number]      - Number of replicator nodes (default: $replicatorNodeCount)
 | |
|    -u               - Include a Blockstreamer (default: $blockstreamer)
 | |
|    -P               - Use public network IP addresses (default: $publicNetwork)
 | |
|    -g               - Enable GPU (default: $enableGpu)
 | |
|    -G               - Enable GPU, and set count/type of GPUs to use
 | |
|                       (e.g $gpuBootstrapLeaderMachineType)
 | |
|    -a [address]     - Address to be be assigned to the Blockstreamer if present,
 | |
|                       otherwise the bootstrap fullnode.
 | |
|                       * For GCE, [address] is the "name" of the desired External
 | |
|                         IP Address.
 | |
|                       * For EC2, [address] is the "allocation ID" of the desired
 | |
|                         Elastic IP.
 | |
|    -d [disk-type]   - Specify a boot disk type (default None) Use pd-ssd to get ssd on GCE.
 | |
|    --letsencrypt [dns name] - Attempt to generate a TLS certificate using this
 | |
|                               DNS name (useful only when the -a and -P options
 | |
|                               are also provided)
 | |
|    --fullnode-additional-disk-size-gb [number]
 | |
|                     - Add an additional [number] GB SSD to all fullnodes to store the config directory.
 | |
|                       If not set, config will be written to the boot disk by default.
 | |
|                       Only supported on GCE.
 | |
|  config-specific options:
 | |
|    -P               - Use public network IP addresses (default: $publicNetwork)
 | |
| 
 | |
|  delete-specific options:
 | |
|    none
 | |
| 
 | |
|  info-specific options:
 | |
|    none
 | |
| 
 | |
| EOF
 | |
|   exit $exitcode
 | |
| }
 | |
| 
 | |
| command=$1
 | |
| [[ -n $command ]] || usage
 | |
| shift
 | |
| [[ $command = create || $command = config || $command = info || $command = delete || $command = status ]] ||
 | |
|   usage "Invalid command: $command"
 | |
| 
 | |
| shortArgs=()
 | |
| while [[ -n $1 ]]; do
 | |
|   if [[ ${1:0:2} = -- ]]; then
 | |
|     if [[ $1 = --letsencrypt ]]; then
 | |
|       letsEncryptDomainName="$2"
 | |
|       shift 2
 | |
|     elif [[ $1 = --fullnode-additional-disk-size-gb ]]; then
 | |
|       fullNodeAdditionalDiskSizeInGb="$2"
 | |
|       shift 2
 | |
|     elif [[ $1 == --machine-type* || $1 == --custom-cpu* ]]; then # Bypass quoted long args for GPUs
 | |
|       shortArgs+=("$1")
 | |
|       shift
 | |
|     elif [[ $1 == --allow-boot-failures ]]; then
 | |
|       failOnValidatorBootupFailure=false
 | |
|       shift
 | |
|     else
 | |
|       usage "Unknown long option: $1"
 | |
|     fi
 | |
|   else
 | |
|     shortArgs+=("$1")
 | |
|     shift
 | |
|   fi
 | |
| done
 | |
| 
 | |
| while getopts "h?p:Pn:c:r:z:gG:a:d:uxf" opt "${shortArgs[@]}"; do
 | |
|   case $opt in
 | |
|   h | \?)
 | |
|     usage
 | |
|     ;;
 | |
|   p)
 | |
|     [[ ${OPTARG//[^A-Za-z0-9-]/} == "$OPTARG" ]] || usage "Invalid prefix: \"$OPTARG\", alphanumeric only"
 | |
|     prefix=$OPTARG
 | |
|     ;;
 | |
|   P)
 | |
|     publicNetwork=true
 | |
|     ;;
 | |
|   n)
 | |
|     additionalFullNodeCount=$OPTARG
 | |
|     ;;
 | |
|   c)
 | |
|     clientNodeCount=$OPTARG
 | |
|     ;;
 | |
|   r)
 | |
|     replicatorNodeCount=$OPTARG
 | |
|     ;;
 | |
|   z)
 | |
|     containsZone "$OPTARG" "${zones[@]}" || zones+=("$OPTARG")
 | |
|     ;;
 | |
|   g)
 | |
|     enableGpu=true
 | |
|     bootstrapLeaderMachineType=$gpuBootstrapLeaderMachineType
 | |
|     fullNodeMachineType=$bootstrapLeaderMachineType
 | |
|     blockstreamerMachineType=$bootstrapLeaderMachineType
 | |
|     ;;
 | |
|   G)
 | |
|     enableGpu=true
 | |
|     bootstrapLeaderMachineType="$OPTARG"
 | |
|     fullNodeMachineType=$bootstrapLeaderMachineType
 | |
|     blockstreamerMachineType=$bootstrapLeaderMachineType
 | |
|     ;;
 | |
|   a)
 | |
|     customAddress=$OPTARG
 | |
|     ;;
 | |
|   d)
 | |
|     bootDiskType=$OPTARG
 | |
|     ;;
 | |
|   u)
 | |
|     blockstreamer=true
 | |
|     ;;
 | |
|   x)
 | |
|     externalNodes=true
 | |
|     ;;
 | |
|   *)
 | |
|     usage "unhandled option: $opt"
 | |
|     ;;
 | |
|   esac
 | |
| done
 | |
| 
 | |
| [[ ${#zones[@]} -gt 0 ]] || zones+=("$(cloud_DefaultZone)")
 | |
| 
 | |
| [[ -z $1 ]] || usage "Unexpected argument: $1"
 | |
| if [[ $cloudProvider = ec2 ]]; then
 | |
|   # EC2 keys can't be retrieved from running instances like GCE keys can so save
 | |
|   # EC2 keys in the user's home directory so |./ec2.sh config| can at least be
 | |
|   # used on the same host that ran |./ec2.sh create| .
 | |
|   sshPrivateKey="$HOME/.ssh/solana-net-id_$prefix"
 | |
| else
 | |
|   sshPrivateKey="$netConfigDir/id_$prefix"
 | |
| fi
 | |
| 
 | |
| case $cloudProvider in
 | |
| gce)
 | |
|   ;;
 | |
| ec2|azure|colo)
 | |
|   if [[ -n $fullNodeAdditionalDiskSizeInGb ]] ; then
 | |
|     usage "Error: --fullnode-additional-disk-size-gb currently only supported with cloud provider: gce"
 | |
|   fi
 | |
|   ;;
 | |
| *)
 | |
|   echo "Error: Unknown cloud provider: $cloudProvider"
 | |
|   ;;
 | |
| esac
 | |
| 
 | |
| # cloud_ForEachInstance [cmd] [extra args to cmd]
 | |
| #
 | |
| # Execute a command for each element in the `instances` array
 | |
| #
 | |
| #   cmd   - The command to execute on each instance
 | |
| #           The command will receive arguments followed by any
 | |
| #           additional arguments supplied to cloud_ForEachInstance:
 | |
| #               name     - name of the instance
 | |
| #               publicIp - The public IP address of this instance
 | |
| #               privateIp - The private IP address of this instance
 | |
| #               zone     - Zone of this instance
 | |
| #               count    - Monotonically increasing count for each
 | |
| #                          invocation of cmd, starting at 1
 | |
| #               ...      - Extra args to cmd..
 | |
| #
 | |
| #
 | |
| cloud_ForEachInstance() {
 | |
|   declare cmd="$1"
 | |
|   shift
 | |
|   [[ -n $cmd ]] || { echo cloud_ForEachInstance: cmd not specified; exit 1; }
 | |
| 
 | |
|   declare count=1
 | |
|   for info in "${instances[@]}"; do
 | |
|     declare name publicIp privateIp
 | |
|     IFS=: read -r name publicIp privateIp zone < <(echo "$info")
 | |
| 
 | |
|     eval "$cmd" "$name" "$publicIp" "$privateIp" "$zone" "$count" "$@"
 | |
|     count=$((count + 1))
 | |
|   done
 | |
| }
 | |
| 
 | |
| # Given a cloud provider zone, return an approximate lat,long location for the
 | |
| # data center.  Normal geoip lookups for cloud provider IP addresses are
 | |
| # sometimes widely inaccurate.
 | |
| zoneLocation() {
 | |
|   declare zone="$1"
 | |
|   case "$zone" in
 | |
|   us-west1*)
 | |
|     echo "[45.5946, -121.1787]"
 | |
|     ;;
 | |
|   us-central1*)
 | |
|     echo "[41.2619, -95.8608]"
 | |
|     ;;
 | |
|   us-east1*)
 | |
|     echo "[33.1960, -80.0131]"
 | |
|     ;;
 | |
|   asia-east2*)
 | |
|     echo "[22.3193, 114.1694]"
 | |
|     ;;
 | |
|   asia-northeast1*)
 | |
|     echo "[35.6762, 139.6503]"
 | |
|     ;;
 | |
|   asia-northeast2*)
 | |
|     echo "[34.6937, 135.5023]"
 | |
|     ;;
 | |
|   asia-south1*)
 | |
|     echo "[19.0760, 72.8777]"
 | |
|     ;;
 | |
|   asia-southeast1*)
 | |
|     echo "[1.3404, 103.7090]"
 | |
|     ;;
 | |
|   australia-southeast1*)
 | |
|     echo "[-33.8688, 151.2093]"
 | |
|     ;;
 | |
|   europe-north1*)
 | |
|     echo "[60.5693, 27.1878]"
 | |
|     ;;
 | |
|   europe-west2*)
 | |
|     echo "[51.5074, -0.1278]"
 | |
|     ;;
 | |
|   europe-west3*)
 | |
|     echo "[50.1109, 8.6821]"
 | |
|     ;;
 | |
|   europe-west4*)
 | |
|     echo "[53.4386, 6.8355]"
 | |
|     ;;
 | |
|   europe-west6*)
 | |
|     echo "[47.3769, 8.5417]"
 | |
|     ;;
 | |
|   northamerica-northeast1*)
 | |
|     echo "[45.5017, -73.5673]"
 | |
|     ;;
 | |
|   southamerica-east1*)
 | |
|     echo "[-23.5505, -46.6333]"
 | |
|     ;;
 | |
|   *)
 | |
|     ;;
 | |
|   esac
 | |
| }
 | |
| 
 | |
| prepareInstancesAndWriteConfigFile() {
 | |
|   $metricsWriteDatapoint "testnet-deploy net-config-begin=1"
 | |
| 
 | |
|   if $externalNodes; then
 | |
|     echo "Appending to existing config file"
 | |
|     echo "externalNodeSshKey=$sshPrivateKey" >> "$configFile"
 | |
|   else
 | |
|     rm -f "$geoipConfigFile"
 | |
|     cat >> "$configFile" <<EOF
 | |
| # autogenerated at $(date)
 | |
| netBasename=$prefix
 | |
| publicNetwork=$publicNetwork
 | |
| sshPrivateKey=$sshPrivateKey
 | |
| letsEncryptDomainName=$letsEncryptDomainName
 | |
| EOF
 | |
|   fi
 | |
|   touch "$geoipConfigFile"
 | |
| 
 | |
|   buildSshOptions
 | |
| 
 | |
|   fetchPrivateKey() {
 | |
|     declare nodeName
 | |
|     declare nodeIp
 | |
|     declare nodeZone
 | |
|     IFS=: read -r nodeName nodeIp _ nodeZone < <(echo "${instances[0]}")
 | |
| 
 | |
|     # Make sure the machine is alive or pingable
 | |
|     timeout_sec=90
 | |
|     cloud_WaitForInstanceReady "$nodeName" "$nodeIp" "$nodeZone" "$timeout_sec"
 | |
| 
 | |
|     if [[ ! -r $sshPrivateKey ]]; then
 | |
|       echo "Fetching $sshPrivateKey from $nodeName"
 | |
| 
 | |
|       # Try to scp in a couple times, sshd may not yet be up even though the
 | |
|       # machine can be pinged...
 | |
|       (
 | |
|         set -o pipefail
 | |
|         for i in $(seq 1 60); do
 | |
|           set -x
 | |
|           cloud_FetchFile "$nodeName" "$nodeIp" /solana-scratch/id_ecdsa "$sshPrivateKey" "$nodeZone" &&
 | |
|             cloud_FetchFile "$nodeName" "$nodeIp" /solana-scratch/id_ecdsa.pub "$sshPrivateKey.pub" "$nodeZone" &&
 | |
|               break
 | |
|           set +x
 | |
| 
 | |
|           sleep 1
 | |
|           echo "Retry $i..."
 | |
|         done
 | |
|       )
 | |
| 
 | |
|       chmod 400 "$sshPrivateKey"
 | |
|       ls -l "$sshPrivateKey"
 | |
|     fi
 | |
|   }
 | |
| 
 | |
|   recordInstanceIp() {
 | |
|     declare name="$1"
 | |
|     declare publicIp="$2"
 | |
|     declare privateIp="$3"
 | |
|     declare zone="$4"
 | |
|     #declare index="$5"
 | |
| 
 | |
|     declare failOnFailure="$6"
 | |
|     declare arrayName="$7"
 | |
| 
 | |
|     if [ "$publicIp" = "TERMINATED" ] || [ "$privateIp" = "TERMINATED" ]; then
 | |
|       if $failOnFailure; then
 | |
|         exit 1
 | |
|       else
 | |
|         return 0
 | |
|       fi
 | |
|     fi
 | |
| 
 | |
|     ok=true
 | |
|     echo "Waiting for $name to finish booting..."
 | |
|     (
 | |
|       set +e
 | |
|       fetchPrivateKey || exit 1
 | |
|       for i in $(seq 1 60); do
 | |
|         (
 | |
|           set -x
 | |
|           timeout --preserve-status --foreground 20s ssh "${sshOptions[@]}" "$publicIp" "ls -l /solana-scratch/.instance-startup-complete"
 | |
|         )
 | |
|         ret=$?
 | |
|         if [[ $ret -eq 0 ]]; then
 | |
|           echo "$name has booted."
 | |
|           exit 0
 | |
|         fi
 | |
|         sleep 5
 | |
|         echo "Retry $i..."
 | |
|       done
 | |
|       echo "$name failed to boot."
 | |
|       exit 1
 | |
|     ) || ok=false
 | |
| 
 | |
|     if ! $ok; then
 | |
|       if $failOnFailure; then
 | |
|         exit 1
 | |
|       fi
 | |
|     else
 | |
|       {
 | |
|         echo "$arrayName+=($publicIp)  # $name"
 | |
|         echo "${arrayName}Private+=($privateIp)  # $name"
 | |
|         echo "${arrayName}Zone+=($zone)  # $name"
 | |
|       } >> "$configFile"
 | |
| 
 | |
|       declare latlng=
 | |
|       latlng=$(zoneLocation "$zone")
 | |
|       if [[ -n $latlng ]]; then
 | |
|         echo "$publicIp: $latlng" >> "$geoipConfigFile"
 | |
|       fi
 | |
|     fi
 | |
|   }
 | |
| 
 | |
|   if $externalNodes; then
 | |
|     echo "Bootstrap leader is already configured"
 | |
|   else
 | |
|     echo "Looking for bootstrap leader instance..."
 | |
|     cloud_FindInstance "$prefix-bootstrap-leader"
 | |
|     [[ ${#instances[@]} -eq 1 ]] || {
 | |
|       echo "Unable to find bootstrap leader"
 | |
|       exit 1
 | |
|     }
 | |
| 
 | |
|     echo "fullnodeIpList=()" >> "$configFile"
 | |
|     echo "fullnodeIpListPrivate=()" >> "$configFile"
 | |
|     cloud_ForEachInstance recordInstanceIp true fullnodeIpList
 | |
|   fi
 | |
| 
 | |
|   if [[ $additionalFullNodeCount -gt 0 ]]; then
 | |
|     numZones=${#zones[@]}
 | |
|     if [[ $additionalFullNodeCount -gt $numZones ]]; then
 | |
|       numNodesPerZone=$((additionalFullNodeCount / numZones))
 | |
|       numLeftOverNodes=$((additionalFullNodeCount % numZones))
 | |
|     else
 | |
|       numNodesPerZone=1
 | |
|       numLeftOverNodes=0
 | |
|     fi
 | |
| 
 | |
|     for ((i=((numZones - 1)); i >= 0; i--)); do
 | |
|       zone=${zones[i]}
 | |
|       if [[ $i -eq 0 ]]; then
 | |
|         numNodesPerZone=$((numNodesPerZone + numLeftOverNodes))
 | |
|       fi
 | |
|       echo "Looking for additional fullnode instances in $zone ..."
 | |
|       cloud_FindInstances "$prefix-$zone-fullnode"
 | |
|       declare numInstances=${#instances[@]}
 | |
|       if [[ $numInstances -eq $numNodesPerZone || ( ! $failOnValidatorBootupFailure && $numInstances -gt 0 ) ]]; then
 | |
|         cloud_ForEachInstance recordInstanceIp "$failOnValidatorBootupFailure" fullnodeIpList
 | |
|       else
 | |
|         echo "Unable to find additional fullnodes"
 | |
|         if $failOnValidatorBootupFailure; then
 | |
|           exit 1
 | |
|         fi
 | |
|       fi
 | |
|     done
 | |
|   fi
 | |
| 
 | |
|   if ! $externalNodes; then
 | |
|     echo "clientIpList=()" >> "$configFile"
 | |
|     echo "clientIpListPrivate=()" >> "$configFile"
 | |
|   fi
 | |
|   echo "Looking for client bencher instances..."
 | |
|   cloud_FindInstances "$prefix-client"
 | |
|   [[ ${#instances[@]} -eq 0 ]] || {
 | |
|     cloud_ForEachInstance recordInstanceIp true clientIpList
 | |
|   }
 | |
| 
 | |
|   if ! $externalNodes; then
 | |
|     echo "blockstreamerIpList=()" >> "$configFile"
 | |
|     echo "blockstreamerIpListPrivate=()" >> "$configFile"
 | |
|   fi
 | |
|   echo "Looking for blockstreamer instances..."
 | |
|   cloud_FindInstances "$prefix-blockstreamer"
 | |
|   [[ ${#instances[@]} -eq 0 ]] || {
 | |
|     cloud_ForEachInstance recordInstanceIp true blockstreamerIpList
 | |
|   }
 | |
| 
 | |
|   if ! $externalNodes; then
 | |
|     echo "replicatorIpList=()" >> "$configFile"
 | |
|     echo "replicatorIpListPrivate=()" >> "$configFile"
 | |
|   fi
 | |
|   echo "Looking for replicator instances..."
 | |
|   cloud_FindInstances "$prefix-replicator"
 | |
|   [[ ${#instances[@]} -eq 0 ]] || {
 | |
|     cloud_ForEachInstance recordInstanceIp true replicatorIpList
 | |
|   }
 | |
| 
 | |
|   echo "Wrote $configFile"
 | |
|   $metricsWriteDatapoint "testnet-deploy net-config-complete=1"
 | |
| }
 | |
| 
 | |
| delete() {
 | |
|   $metricsWriteDatapoint "testnet-deploy net-delete-begin=1"
 | |
| 
 | |
|   # Filter for all nodes
 | |
|   filter="$prefix-"
 | |
| 
 | |
|   echo "Searching for instances: $filter"
 | |
|   cloud_FindInstances "$filter"
 | |
| 
 | |
|   if [[ ${#instances[@]} -eq 0 ]]; then
 | |
|     echo "No instances found matching '$filter'"
 | |
|   else
 | |
|     cloud_DeleteInstances true &
 | |
|   fi
 | |
| 
 | |
|   wait
 | |
| 
 | |
|   if $externalNodes; then
 | |
|     echo "Let's not delete the current configuration file"
 | |
|   else
 | |
|     rm -f "$configFile"
 | |
|   fi
 | |
| 
 | |
|   $metricsWriteDatapoint "testnet-deploy net-delete-complete=1"
 | |
| }
 | |
| 
 | |
| create_error_cleanup() {
 | |
|   declare RC=$?
 | |
|   if [[ "$RC" -ne 0 ]]; then
 | |
|     delete
 | |
|   fi
 | |
|   exit $RC
 | |
| }
 | |
| 
 | |
| case $command in
 | |
| delete)
 | |
|   delete
 | |
|   ;;
 | |
| 
 | |
| create)
 | |
|   [[ -n $additionalFullNodeCount ]] || usage "Need number of nodes"
 | |
| 
 | |
|   delete
 | |
| 
 | |
|   $metricsWriteDatapoint "testnet-deploy net-create-begin=1"
 | |
| 
 | |
|   if $failOnValidatorBootupFailure; then
 | |
|     trap create_error_cleanup EXIT
 | |
|   fi
 | |
| 
 | |
|   rm -rf "$sshPrivateKey"{,.pub}
 | |
| 
 | |
|   # Note: using rsa because |aws ec2 import-key-pair| seems to fail for ecdsa
 | |
|   ssh-keygen -t rsa -N '' -f "$sshPrivateKey"
 | |
| 
 | |
|   printNetworkInfo() {
 | |
|     cat <<EOF
 | |
| ==[ Network composition ]===============================================================
 | |
|   Bootstrap leader = $bootstrapLeaderMachineType (GPU=$enableGpu)
 | |
|   Additional fullnodes = $additionalFullNodeCount x $fullNodeMachineType
 | |
|   Client(s) = $clientNodeCount x $clientMachineType
 | |
|   Replicators(s) = $replicatorNodeCount x $replicatorMachineType
 | |
|   Blockstreamer = $blockstreamer
 | |
| ========================================================================================
 | |
| 
 | |
| EOF
 | |
|   }
 | |
|   printNetworkInfo
 | |
| 
 | |
|   creationDate=$(date)
 | |
|   creationInfo() {
 | |
|     cat <<EOF
 | |
| 
 | |
|   Instance running since: $creationDate
 | |
| 
 | |
| ========================================================================================
 | |
| EOF
 | |
|   }
 | |
| 
 | |
|   declare startupScript="$netConfigDir"/instance-startup-script.sh
 | |
|   cat > "$startupScript" <<EOF
 | |
| #!/usr/bin/env bash
 | |
| # autogenerated at $(date)
 | |
| set -ex
 | |
| 
 | |
| if [[ -f /solana-scratch/.instance-startup-complete ]]; then
 | |
|   $(
 | |
|     cd "$here"/scripts/
 | |
|     if "$enableGpu"; then
 | |
|       cat enable-nvidia-persistence-mode.sh
 | |
|     fi
 | |
|   )
 | |
| 
 | |
|   # Skip most setup on instance reboot
 | |
|   exit 0
 | |
| fi
 | |
| 
 | |
| cat > /etc/motd <<EOM
 | |
| !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
 | |
| 
 | |
|   This instance has not been fully configured.
 | |
| 
 | |
|   See startup script log messages in /var/log/syslog for status:
 | |
|     $ sudo cat /var/log/syslog | egrep \\(startup-script\\|cloud-init\)
 | |
| 
 | |
|   To block until setup is complete, run:
 | |
|     $ until [[ -f /solana-scratch/.instance-startup-complete ]]; do sleep 1; done
 | |
| 
 | |
| !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
 | |
| $(creationInfo)
 | |
| EOM
 | |
| 
 | |
| # Place the generated private key at /solana-scratch/id_ecdsa so it's retrievable by anybody
 | |
| # who is able to log into this machine
 | |
| mkdir -m 0777 /solana-scratch
 | |
| cat > /solana-scratch/id_ecdsa <<EOK
 | |
| $(cat "$sshPrivateKey")
 | |
| EOK
 | |
| cat > /solana-scratch/id_ecdsa.pub <<EOK
 | |
| $(cat "$sshPrivateKey.pub")
 | |
| EOK
 | |
| chmod 444 /solana-scratch/id_ecdsa
 | |
| 
 | |
| USER=\$(id -un)
 | |
| export DEBIAN_FRONTEND=noninteractive
 | |
| $(
 | |
|   cd "$here"/scripts/
 | |
|   cat \
 | |
|     disable-background-upgrades.sh \
 | |
|     create-solana-user.sh \
 | |
|     solana-user-authorized_keys.sh \
 | |
|     add-testnet-solana-user-authorized_keys.sh \
 | |
|     install-certbot.sh \
 | |
|     install-earlyoom.sh \
 | |
|     install-libssl-compatability.sh \
 | |
|     install-nodejs.sh \
 | |
|     install-redis.sh \
 | |
|     install-rsync.sh \
 | |
|     localtime.sh \
 | |
|     network-config.sh \
 | |
|     remove-docker-interface.sh \
 | |
| 
 | |
|   if "$enableGpu"; then
 | |
|     cat enable-nvidia-persistence-mode.sh
 | |
|   fi
 | |
| 
 | |
|   if [[ -n $fullNodeAdditionalDiskSizeInGb ]]; then
 | |
|     cat mount-additional-disk.sh
 | |
|   fi
 | |
| )
 | |
| 
 | |
| cat > /etc/motd <<EOM
 | |
| $(printNetworkInfo)
 | |
| $(creationInfo)
 | |
| EOM
 | |
| 
 | |
| touch /solana-scratch/.instance-startup-complete
 | |
| 
 | |
| EOF
 | |
| 
 | |
|   if $blockstreamer; then
 | |
|     blockstreamerAddress=$customAddress
 | |
|   else
 | |
|     bootstrapLeaderAddress=$customAddress
 | |
|   fi
 | |
| 
 | |
|   for zone in "${zones[@]}"; do
 | |
|     cloud_Initialize "$prefix" "$zone"
 | |
|   done
 | |
| 
 | |
|   if $externalNodes; then
 | |
|     echo "Bootstrap leader is already configured"
 | |
|   else
 | |
|     cloud_CreateInstances "$prefix" "$prefix-bootstrap-leader" 1 \
 | |
|       "$enableGpu" "$bootstrapLeaderMachineType" "${zones[0]}" "$fullNodeBootDiskSizeInGb" \
 | |
|       "$startupScript" "$bootstrapLeaderAddress" "$bootDiskType" "$fullNodeAdditionalDiskSizeInGb" \
 | |
|       "$sshPrivateKey"
 | |
|   fi
 | |
| 
 | |
|   if [[ $additionalFullNodeCount -gt 0 ]]; then
 | |
|     num_zones=${#zones[@]}
 | |
|     if [[ $additionalFullNodeCount -gt $num_zones ]]; then
 | |
|       numNodesPerZone=$((additionalFullNodeCount / num_zones))
 | |
|       numLeftOverNodes=$((additionalFullNodeCount % num_zones))
 | |
|     else
 | |
|       numNodesPerZone=1
 | |
|       numLeftOverNodes=0
 | |
|     fi
 | |
| 
 | |
|     for ((i=((num_zones - 1)); i >= 0; i--)); do
 | |
|       zone=${zones[i]}
 | |
|       if [[ $i -eq 0 ]]; then
 | |
|         numNodesPerZone=$((numNodesPerZone + numLeftOverNodes))
 | |
|       fi
 | |
|       cloud_CreateInstances "$prefix" "$prefix-$zone-fullnode" "$numNodesPerZone" \
 | |
|         "$enableGpu" "$fullNodeMachineType" "$zone" "$fullNodeBootDiskSizeInGb" \
 | |
|         "$startupScript" "" "$bootDiskType" "$fullNodeAdditionalDiskSizeInGb" \
 | |
|         "$sshPrivateKey" &
 | |
|     done
 | |
| 
 | |
|     wait
 | |
|   fi
 | |
| 
 | |
|   if [[ $clientNodeCount -gt 0 ]]; then
 | |
|     cloud_CreateInstances "$prefix" "$prefix-client" "$clientNodeCount" \
 | |
|       "$enableGpu" "$clientMachineType" "${zones[0]}" "$clientBootDiskSizeInGb" \
 | |
|       "$startupScript" "" "$bootDiskType" "" "$sshPrivateKey"
 | |
|   fi
 | |
| 
 | |
|   if $blockstreamer; then
 | |
|     cloud_CreateInstances "$prefix" "$prefix-blockstreamer" "1" \
 | |
|       "$enableGpu" "$blockstreamerMachineType" "${zones[0]}" "$fullNodeBootDiskSizeInGb" \
 | |
|       "$startupScript" "$blockstreamerAddress" "$bootDiskType" "" "$sshPrivateKey"
 | |
|   fi
 | |
| 
 | |
|   if [[ $replicatorNodeCount -gt 0 ]]; then
 | |
|     cloud_CreateInstances "$prefix" "$prefix-replicator" "$replicatorNodeCount" \
 | |
|       false "$replicatorMachineType" "${zones[0]}" "$replicatorBootDiskSizeInGb" \
 | |
|       "$startupScript" "" "" "" "$sshPrivateKey"
 | |
|   fi
 | |
| 
 | |
|   $metricsWriteDatapoint "testnet-deploy net-create-complete=1"
 | |
| 
 | |
|   prepareInstancesAndWriteConfigFile
 | |
|   ;;
 | |
| 
 | |
| config)
 | |
|   prepareInstancesAndWriteConfigFile
 | |
|   ;;
 | |
| info)
 | |
|   loadConfigFile
 | |
|   printNode() {
 | |
|     declare nodeType=$1
 | |
|     declare ip=$2
 | |
|     declare ipPrivate=$3
 | |
|     declare zone=$4
 | |
|     printf "  %-16s | %-15s | %-15s | %s\n" "$nodeType" "$ip" "$ipPrivate" "$zone"
 | |
|   }
 | |
| 
 | |
|   printNode "Node Type" "Public IP" "Private IP" "Zone"
 | |
|   echo "-------------------+-----------------+-----------------+--------------"
 | |
|   nodeType=bootstrap-leader
 | |
|   for i in $(seq 0 $(( ${#fullnodeIpList[@]} - 1)) ); do
 | |
|     ipAddress=${fullnodeIpList[$i]}
 | |
|     ipAddressPrivate=${fullnodeIpListPrivate[$i]}
 | |
|     zone=${fullnodeIpListZone[$i]}
 | |
|     printNode $nodeType "$ipAddress" "$ipAddressPrivate" "$zone"
 | |
|     nodeType=fullnode
 | |
|   done
 | |
| 
 | |
|   for i in $(seq 0 $(( ${#clientIpList[@]} - 1)) ); do
 | |
|     ipAddress=${clientIpList[$i]}
 | |
|     ipAddressPrivate=${clientIpListPrivate[$i]}
 | |
|     zone=${clientIpListZone[$i]}
 | |
|     printNode client "$ipAddress" "$ipAddressPrivate" "$zone"
 | |
|   done
 | |
| 
 | |
|   for i in $(seq 0 $(( ${#blockstreamerIpList[@]} - 1)) ); do
 | |
|     ipAddress=${blockstreamerIpList[$i]}
 | |
|     ipAddressPrivate=${blockstreamerIpListPrivate[$i]}
 | |
|     zone=${blockstreamerIpListZone[$i]}
 | |
|     printNode blockstreamer "$ipAddress" "$ipAddressPrivate" "$zone"
 | |
|   done
 | |
| 
 | |
|   for i in $(seq 0 $(( ${#replicatorIpList[@]} - 1)) ); do
 | |
|     ipAddress=${replicatorIpList[$i]}
 | |
|     ipAddressPrivate=${replicatorIpListPrivate[$i]}
 | |
|     zone=${replicatorIpListZone[$i]}
 | |
|     printNode replicator "$ipAddress" "$ipAddressPrivate" "$zone"
 | |
|   done
 | |
|   ;;
 | |
| status)
 | |
|   cloud_StatusAll
 | |
|   ;;
 | |
| *)
 | |
|   usage "Unknown command: $command"
 | |
| esac
 |