Skip to content

Commit

Permalink
Merge branch 'main' into ppawl-remove-kubectl-from-makefile
Browse files Browse the repository at this point in the history
  • Loading branch information
pawloch00 authored Jan 15, 2025
2 parents 49059fa + b9e78d3 commit a12ad5b
Showing 1 changed file with 7 additions and 7 deletions.
14 changes: 7 additions & 7 deletions xpk-large-scale-guide.sh
Original file line number Diff line number Diff line change
Expand Up @@ -148,14 +148,14 @@ echo python3 xpk.py cluster create \
--num-slices="${NUMSLICES}" \
--host-maintenance-interval=PERIODIC \
--custom-cluster-arguments="${CLUSTER_ARGUMENTS}" \
--custom-tpu-nodepool-arguments="${TPU_NODEPOOL_ARGUMENTS}"
--custom-nodepool-arguments="${TPU_NODEPOOL_ARGUMENTS}"

# example output ...
# python3 xpk.py cluster create --cluster NAME \
# --tpu-type=v5litepod-256 --num-slices=4 \
# --host-maintenance-interval=PERIODIC \
# --custom-cluster-arguments=" --network=NETWORK --subnetwork=SUBNET --scopes=storage-full,gke-default --enable-ip-alias --enable-private-nodes --master-ipv4-cidr 172.16.0.32/28 --cluster-ipv4-cidr=10.224.0.0/12 --no-enable-master-authorized-networks" \
# --custom-tpu-nodepool-arguments=" --scopes=storage-full,gke-default --enable-gvnic --max-pods-per-node 15 --disk-size=50"
# --custom-nodepool-arguments=" --scopes=storage-full,gke-default --enable-gvnic --max-pods-per-node 15 --disk-size=50"


##### 2D #####################
Expand All @@ -168,7 +168,7 @@ python3 xpk.py cluster create \
--num-slices="${NUMSLICES}" \
--host-maintenance-interval=PERIODIC \
--custom-cluster-arguments="${CLUSTER_ARGUMENTS}" \
--custom-tpu-nodepool-arguments="${TPU_NODEPOOL_ARGUMENTS}"
--custom-nodepool-arguments="${TPU_NODEPOOL_ARGUMENTS}"

# This process takes around 4 minutes with 4 slices of v5e-256.

Expand Down Expand Up @@ -263,7 +263,7 @@ python3 xpk.py cluster create \
--num-slices="${NUMSLICES}" \
--host-maintenance-interval=PERIODIC \
--custom-cluster-arguments="${CLUSTER_ARGUMENTS}" \
--custom-tpu-nodepool-arguments="${TPU_NODEPOOL_ARGUMENTS}"
--custom-nodepool-arguments="${TPU_NODEPOOL_ARGUMENTS}"

##### STEP 4 ###################################################
##### PASS Cluster name and Project ID to Google POCs ##########
Expand Down Expand Up @@ -330,14 +330,14 @@ echo python3 xpk.py cluster create \
--num-slices="${NUMSLICES}" \
--host-maintenance-interval=PERIODIC \
--custom-cluster-arguments="${CLUSTER_ARGUMENTS}" \
--custom-tpu-nodepool-arguments="${TPU_NODEPOOL_ARGUMENTS}"
--custom-nodepool-arguments="${TPU_NODEPOOL_ARGUMENTS}"

# example output ...
# python3 xpk.py cluster create --cluster NAME \
# --tpu-type=v5litepod-256 --num-slices=64 \
# --host-maintenance-interval=PERIODIC \
# --custom-cluster-arguments=" --network=NETWORK --subnetwork=SUBNET --scopes=storage-full,gke-default --enable-ip-alias --enable-private-nodes --master-ipv4-cidr 172.16.0.32/28 --cluster-ipv4-cidr=10.224.0.0/12 --no-enable-master-authorized-networks" \
# --custom-tpu-nodepool-arguments=" --scopes=storage-full,gke-default --enable-gvnic --max-pods-per-node 15 --disk-size=50"
# --custom-nodepool-arguments=" --scopes=storage-full,gke-default --enable-gvnic --max-pods-per-node 15 --disk-size=50"

##### 5C #####################
# Scale up to NUMSLICES (64 in the provided case) v5e-256 slices.
Expand All @@ -348,7 +348,7 @@ python3 xpk.py cluster create \
--num-slices="${NUMSLICES}" \
--host-maintenance-interval=PERIODIC \
--custom-cluster-arguments="${CLUSTER_ARGUMENTS}" \
--custom-tpu-nodepool-arguments="${TPU_NODEPOOL_ARGUMENTS}"
--custom-nodepool-arguments="${TPU_NODEPOOL_ARGUMENTS}"

###############################
##### 5C - POTENTIAL ERRORS ###
Expand Down

0 comments on commit a12ad5b

Please sign in to comment.