Switch to instances with AVX-512 if possible for better interop with dev machines (#4328)
automerge
This commit is contained in:
@ -49,7 +49,7 @@ Deploys a CD testnet
|
|||||||
-c [number] - Number of client bencher nodes (default: $clientNodeCount)
|
-c [number] - Number of client bencher nodes (default: $clientNodeCount)
|
||||||
-u - Include a Blockstreamer (default: $blockstreamer)
|
-u - Include a Blockstreamer (default: $blockstreamer)
|
||||||
-P - Use public network IP addresses (default: $publicNetwork)
|
-P - Use public network IP addresses (default: $publicNetwork)
|
||||||
-G - Enable GPU, and set count/type of GPUs to use (e.g n1-standard-16 --accelerator count=4,type=nvidia-tesla-k80)
|
-G - Enable GPU, and set count/type of GPUs to use (e.g n1-standard-16 --accelerator count=2,type=nvidia-tesla-v100)
|
||||||
-g - Enable GPU (default: $enableGpu)
|
-g - Enable GPU (default: $enableGpu)
|
||||||
-a [address] - Set the bootstrap fullnode's external IP address to this GCE address
|
-a [address] - Set the bootstrap fullnode's external IP address to this GCE address
|
||||||
-d [disk-type] - Specify a boot disk type (default None) Use pd-ssd to get ssd on GCE.
|
-d [disk-type] - Specify a boot disk type (default None) Use pd-ssd to get ssd on GCE.
|
||||||
|
18
net/gce.sh
18
net/gce.sh
@ -12,8 +12,8 @@ gce)
|
|||||||
# shellcheck source=net/scripts/gce-provider.sh
|
# shellcheck source=net/scripts/gce-provider.sh
|
||||||
source "$here"/scripts/gce-provider.sh
|
source "$here"/scripts/gce-provider.sh
|
||||||
|
|
||||||
cpuBootstrapLeaderMachineType="--machine-type n1-standard-16"
|
cpuBootstrapLeaderMachineType="--machine-type n1-standard-16 --min-cpu-platform Intel%20Skylake"
|
||||||
gpuBootstrapLeaderMachineType="$cpuBootstrapLeaderMachineType --accelerator count=4,type=nvidia-tesla-k80"
|
gpuBootstrapLeaderMachineType="$cpuBootstrapLeaderMachineType --accelerator count=1,type=nvidia-tesla-p100"
|
||||||
bootstrapLeaderMachineType=$cpuBootstrapLeaderMachineType
|
bootstrapLeaderMachineType=$cpuBootstrapLeaderMachineType
|
||||||
fullNodeMachineType=$cpuBootstrapLeaderMachineType
|
fullNodeMachineType=$cpuBootstrapLeaderMachineType
|
||||||
clientMachineType="--custom-cpu 16 --custom-memory 20GB"
|
clientMachineType="--custom-cpu 16 --custom-memory 20GB"
|
||||||
@ -23,12 +23,16 @@ ec2)
|
|||||||
# shellcheck source=net/scripts/ec2-provider.sh
|
# shellcheck source=net/scripts/ec2-provider.sh
|
||||||
source "$here"/scripts/ec2-provider.sh
|
source "$here"/scripts/ec2-provider.sh
|
||||||
|
|
||||||
cpuBootstrapLeaderMachineType=m4.2xlarge
|
cpuBootstrapLeaderMachineType=c5.2xlarge
|
||||||
|
|
||||||
|
# NOTE: At this time, p3dn.24xlarge is the only EC2 instance type with both GPU
|
||||||
|
# and AVX-512 support. The default GPU type, p2.xlarge, does not support
|
||||||
|
# AVX-512.
|
||||||
gpuBootstrapLeaderMachineType=p2.xlarge
|
gpuBootstrapLeaderMachineType=p2.xlarge
|
||||||
bootstrapLeaderMachineType=$cpuBootstrapLeaderMachineType
|
bootstrapLeaderMachineType=$cpuBootstrapLeaderMachineType
|
||||||
fullNodeMachineType=$cpuBootstrapLeaderMachineType
|
fullNodeMachineType=$cpuBootstrapLeaderMachineType
|
||||||
clientMachineType=m4.2xlarge
|
clientMachineType=c5.2xlarge
|
||||||
blockstreamerMachineType=m4.2xlarge
|
blockstreamerMachineType=c5.2xlarge
|
||||||
;;
|
;;
|
||||||
azure)
|
azure)
|
||||||
# shellcheck source=net/scripts/azure-provider.sh
|
# shellcheck source=net/scripts/azure-provider.sh
|
||||||
@ -338,7 +342,7 @@ EOF
|
|||||||
# machine can be pinged...
|
# machine can be pinged...
|
||||||
(
|
(
|
||||||
set -o pipefail
|
set -o pipefail
|
||||||
for i in $(seq 1 30); do
|
for i in $(seq 1 60); do
|
||||||
set -x
|
set -x
|
||||||
cloud_FetchFile "$nodeName" "$nodeIp" /solana-id_ecdsa "$sshPrivateKey" "$nodeZone" &&
|
cloud_FetchFile "$nodeName" "$nodeIp" /solana-id_ecdsa "$sshPrivateKey" "$nodeZone" &&
|
||||||
cloud_FetchFile "$nodeName" "$nodeIp" /solana-id_ecdsa.pub "$sshPrivateKey.pub" "$nodeZone" &&
|
cloud_FetchFile "$nodeName" "$nodeIp" /solana-id_ecdsa.pub "$sshPrivateKey.pub" "$nodeZone" &&
|
||||||
@ -379,7 +383,7 @@ EOF
|
|||||||
(
|
(
|
||||||
set +e
|
set +e
|
||||||
fetchPrivateKey || exit 1
|
fetchPrivateKey || exit 1
|
||||||
for i in $(seq 1 30); do
|
for i in $(seq 1 60); do
|
||||||
(
|
(
|
||||||
set -x
|
set -x
|
||||||
timeout --preserve-status --foreground 20s ssh "${sshOptions[@]}" "$publicIp" "ls -l /.instance-startup-complete"
|
timeout --preserve-status --foreground 20s ssh "${sshOptions[@]}" "$publicIp" "ls -l /.instance-startup-complete"
|
||||||
|
@ -163,7 +163,11 @@ cloud_CreateInstances() {
|
|||||||
args+=(--image $imageName)
|
args+=(--image $imageName)
|
||||||
|
|
||||||
# shellcheck disable=SC2206 # Do not want to quote $machineType as it may contain extra args
|
# shellcheck disable=SC2206 # Do not want to quote $machineType as it may contain extra args
|
||||||
args+=($machineType)
|
for word in $machineType; do
|
||||||
|
# Special handling for the "--min-cpu-platform" argument, whose value may
|
||||||
|
# contain a space (escaped as '%20' so it survives word splitting)...
|
||||||
|
args+=("${word//%20/ }")
|
||||||
|
done
|
||||||
if [[ -n $optionalBootDiskSize ]]; then
|
if [[ -n $optionalBootDiskSize ]]; then
|
||||||
args+=(
|
args+=(
|
||||||
--boot-disk-size "${optionalBootDiskSize}GB"
|
--boot-disk-size "${optionalBootDiskSize}GB"
|
||||||
|
Reference in New Issue
Block a user