abstreet/cloud/start_batch_import.sh

#!/bin/bash
# This script packages up the importer as it exists in the current git repo,
# creates a bunch of GCE VMs, and runs the importer there on all cities, using
# static sharding.
#
# This process is only runnable by Dustin, due to current GCE/EC2 permissions.
#
# Run from the repo's root dir: cloud/start_batch_import.sh

# Abort as soon as any command fails, and echo each command as it runs so the
# progress of the batch launch is visible.
set -e
set -x

# The single required argument is a tag for this run; it is forwarded verbatim
# to worker_script.sh on every VM.
EXPERIMENT_TAG=$1
if [[ -z "$EXPERIMENT_TAG" ]]; then
	# Diagnostics belong on stderr so they are not mistaken for normal output.
	echo "Missing args. Usage: $0 EXPERIMENT_TAG" >&2
	exit 1
fi

# Settings for the batch run. They are marked readonly so that an accidental
# reassignment later in the script fails loudly instead of silently changing
# what gets provisioned.

# How many VMs to create; each one is handed its index and this total.
readonly NUM_WORKERS=10
# GCE zone in which the VMs are created and later addressed by scp/ssh.
readonly ZONE=us-east1-b
# See other options: https://cloud.google.com/compute/docs/machine-types
# Particularly... e2-standard-2, n2-standard-2, c2-standard-4
readonly MACHINE_TYPE=e2-standard-2
# All of data/ is currently around 30GB
readonly DISK_SIZE=40GB
# Compressing and checksumming gigantic files needs more IOPS
readonly DISK_TYPE=pd-ssd
# Haha, using a project from college, my last traffic sim...
readonly PROJECT=aorta-routes

# Builds the release binaries locally and assembles worker_payload.zip, the
# archive that is later copied to every VM.
#
# Must be run from the repo's root dir, since all paths are relative.
# Arguments: none
# Outputs:   creates worker_payload/ and worker_payload.zip in the current dir
# Returns:   relies on the script-level `set -e` to abort on the first failing
#            step.
function build_payload {
	local payload_dir=worker_payload
	local release_dir=target/release
	local bin

	# It's a faster workflow to copy the local binaries into the VMs, rather than
	# build them there. But it does require us to build the importer without the
	# GDAL bindings, since the dynamic linking won't transfer over to the VM due to
	# the GDAL version being different.
	#
	# GDAL bindings are only used when initially building popdat.bin for Seattle;
	# there's almost never a need to regenerate this, and it can be done locally
	# when required.
	cargo build --release --bin importer --bin updater

	# Build our payload for the VMs
	# This mkdir deliberately fails if the directory is already there; it probably
	# means the last run broke somehow
	mkdir "$payload_dir"
	mkdir -p "$payload_dir/$release_dir"
	for bin in importer updater; do
		cp "$release_dir/$bin" "$payload_dir/$release_dir/"
	done
	mkdir "$payload_dir/data"
	cp data/MANIFEST.json "$payload_dir/data"
	mkdir "$payload_dir/importer"
	cp -Rv importer/config "$payload_dir/importer"
	cp cloud/worker_script.sh "$payload_dir/"
	# Copy in AWS credentials! Obviously don't go making worker_payload/ public or
	# letting anybody into the VMs.
	#
	# Alternatively, I could just scp the files from the VMs back to my local
	# computer. But more than likely, GCE's upstream speed to S3 (even
	# cross-region) is better than Comcast. :)
	cp -Rv ~/.aws "$payload_dir/"

	# zip updates an existing archive in place rather than replacing it, so a
	# leftover worker_payload.zip from an earlier run would keep entries that are
	# no longer in worker_payload/. Start from a clean archive every time.
	rm -f "${payload_dir}.zip"
	zip -r "$payload_dir" "$payload_dir"
}

# Creates every worker VM with a single bulk request, then pauses briefly
# before returning.
#
# Globals (read): PROJECT, ZONE, NUM_WORKERS, MACHINE_TYPE, DISK_SIZE, DISK_TYPE
# Arguments: none
# Returns:   relies on the script-level `set -e` to abort if gcloud fails.
function create_vms {
	# Keep the flags in an array so that each expansion stays exactly one word,
	# even if a setting ever contains whitespace or glob characters.
	local -a bulk_args=(
		--name-pattern='worker-#'
		--zone="$ZONE"
		--count="$NUM_WORKERS"
		--machine-type="$MACHINE_TYPE"
		--boot-disk-size="$DISK_SIZE"
		--boot-disk-type="$DISK_TYPE"
		--image-family=ubuntu-2004-lts
		--image-project=ubuntu-os-cloud
		--scopes=compute-rw
	)

	# Create all of the VMs at once
	gcloud compute --project="$PROJECT" instances bulk create "${bulk_args[@]}"

	# There's a funny history behind the whole "how do I wait for my VM to be
	# SSHable?" question... so just wait a fixed 30 seconds. A bare number of
	# seconds is used because the "s" suffix is not part of POSIX sleep.
	sleep 30
}

# Copies worker_payload.zip to each VM and launches worker_script.sh there.
#
# Globals (read): PROJECT, ZONE, NUM_WORKERS, EXPERIMENT_TAG
# Arguments: none
# Returns:   relies on the script-level `set -e` to abort on the first failing
#            scp/ssh.
#
# NOTE(review): this addresses the VMs as worker-0 .. worker-(NUM_WORKERS-1);
# confirm that matches the numbering produced by the bulk-create name pattern.
function start_workers {
	# Keep the loop counter and scratch values out of the global namespace.
	local i quoted_tag remote_cmd

	# The tag is spliced into a command line that the remote shell re-parses, so
	# escape it once here. Tags made of ordinary characters come out unchanged.
	printf -v quoted_tag '%q' "$EXPERIMENT_TAG"

	for ((i = 0; i < NUM_WORKERS; i++)); do
		gcloud compute scp \
			--project="$PROJECT" \
			--zone="$ZONE" \
			worker_payload.zip \
			"worker-${i}:~/worker_payload.zip"

		# Install unzip, unpack the payload, then start the worker script with the
		# tag, this worker's index and the total worker count. The trailing "&"
		# backgrounds it remotely, with stdout and stderr sent to a file named
		# "logs".
		remote_cmd="sudo apt-get -qq install -y unzip; unzip -q worker_payload.zip; ./worker_payload/worker_script.sh ${quoted_tag} ${i} ${NUM_WORKERS} 1> logs 2>&1 &"
		gcloud compute ssh \
			--project="$PROJECT" \
			--zone="$ZONE" \
			"worker-${i}" \
			--command="$remote_cmd"
	done
}

# Run the three stages in order: package the binaries and config, create the
# VMs, then push the payload and start a worker on each VM. With `set -e` in
# effect, a failure in any stage aborts the script before the next one starts.
# Each stage is a plain call, so one can be commented out to skip it.
build_payload
create_vms
start_workers

# To follow along with a worker:
# > gcloud compute ssh worker-5 --command='tail -f logs'
#
# To see which workers are still running (or have failed):
# > gcloud compute instances list
Create a Docker image to run the map importer in the almighty cloud. #326 2021-05-07 00:55:51 +03:00			`#!/bin/bash`
			`# This script packages up the importer as it exists in the current git repo,`
Give up on Docker and AWS Batch to bulk import cities. Switch to static sharding with GCE instead. #326 2021-05-18 19:50:28 +03:00			`# creates a bunch of GCE VMs, and runs the importer there on all cities, using`
			`# static sharding.`
Create a Docker image to run the map importer in the almighty cloud. #326 2021-05-07 00:55:51 +03:00			`#`
Give up on Docker and AWS Batch to bulk import cities. Switch to static sharding with GCE instead. #326 2021-05-18 19:50:28 +03:00			`# This process is only runnable by Dustin, due to current GCE/EC2 permissions.`
Create a Docker image to run the map importer in the almighty cloud. #326 2021-05-07 00:55:51 +03:00			`#`
Give up on Docker and AWS Batch to bulk import cities. Switch to static sharding with GCE instead. #326 2021-05-18 19:50:28 +03:00			`# Run from the repo's root dir: cloud/start_batch_import.sh`
Create a Docker image to run the map importer in the almighty cloud. #326 2021-05-07 00:55:51 +03:00
			`set -e`
			`set -x`

			`EXPERIMENT_TAG=$1`
			`if [ "$EXPERIMENT_TAG" == "" ]; then`
			`echo Missing args;`
			`exit 1;`
			`fi`

Working on the GCP importer workflow... #326 - Amp up number of workers (about 100 cities, so 10/worker now) - Use an SSD, since especially the setup and upload steps are extremely IO bound - Split the script into pieces that can be easily disabled to iterate faster - Use the bulk API to create instances - Make the overall start_batch_import.sh a bit quieter - Make successful VMs self-destruct so it's easier to track which're done - Setup Docker on the VMs, so elevation data works 2021-05-18 22:28:41 +03:00			`NUM_WORKERS=10`
Give up on Docker and AWS Batch to bulk import cities. Switch to static sharding with GCE instead. #326 2021-05-18 19:50:28 +03:00			`ZONE=us-east1-b`
			`# See other options: https://cloud.google.com/compute/docs/machine-types`
			`# Particularly... e2-standard-2, n2-standard-2, c2-standard-4`
			`MACHINE_TYPE=e2-standard-2`
			`# All of data/ is currently around 30GB`
			`DISK_SIZE=40GB`
Working on the GCP importer workflow... #326 - Amp up number of workers (about 100 cities, so 10/worker now) - Use an SSD, since especially the setup and upload steps are extremely IO bound - Split the script into pieces that can be easily disabled to iterate faster - Use the bulk API to create instances - Make the overall start_batch_import.sh a bit quieter - Make successful VMs self-destruct so it's easier to track which're done - Setup Docker on the VMs, so elevation data works 2021-05-18 22:28:41 +03:00			`# Compressing and checksumming gigantic files needs more IOPS`
			`DISK_TYPE=pd-ssd`
Give up on Docker and AWS Batch to bulk import cities. Switch to static sharding with GCE instead. #326 2021-05-18 19:50:28 +03:00			`# Haha, using a project from college, my last traffic sim...`
			`PROJECT=aorta-routes`

Working on the GCP importer workflow... #326 - Amp up number of workers (about 100 cities, so 10/worker now) - Use an SSD, since especially the setup and upload steps are extremely IO bound - Split the script into pieces that can be easily disabled to iterate faster - Use the bulk API to create instances - Make the overall start_batch_import.sh a bit quieter - Make successful VMs self-destruct so it's easier to track which're done - Setup Docker on the VMs, so elevation data works 2021-05-18 22:28:41 +03:00			`function build_payload {`
			`# It's a faster workflow to copy the local binaries into the VMs, rather than`
			`# build them there. But it does require us to build the importer without the`
			`# GDAL bindings, since the dynamic linking won't transfer over to the VM due to`
			`# the GDAL version being different.`
			`#`
			`# GDAL bindings are only used when initially building popdat.bin for Seattle;`
			`# there's almost never a need to regenerate this, and it can be done locally`
			`# when required.`
			`cargo build --release --bin importer --bin updater`
Create a Docker image to run the map importer in the almighty cloud. #326 2021-05-07 00:55:51 +03:00
Working on the GCP importer workflow... #326 - Amp up number of workers (about 100 cities, so 10/worker now) - Use an SSD, since especially the setup and upload steps are extremely IO bound - Split the script into pieces that can be easily disabled to iterate faster - Use the bulk API to create instances - Make the overall start_batch_import.sh a bit quieter - Make successful VMs self-destruct so it's easier to track which're done - Setup Docker on the VMs, so elevation data works 2021-05-18 22:28:41 +03:00			`# Build our payload for the VMs`
			`# This mkdir deliberately fails if the directory is already there; it probably`
			`# means the last run broke somehow`
			`mkdir worker_payload`
			`mkdir -p worker_payload/target/release`
			`cp target/release/importer worker_payload/target/release/`
			`cp target/release/updater worker_payload/target/release/`
			`mkdir worker_payload/data`
			`cp data/MANIFEST.json worker_payload/data`
			`mkdir worker_payload/importer`
			`cp -Rv importer/config worker_payload/importer`
			`cp cloud/worker_script.sh worker_payload/`
			`# Copy in AWS credentials! Obviously don't go making worker_payload/ public or`
			`# letting anybody into the VMs.`
			`#`
			`# Alternatively, I could just scp the files from the VMs back to my local`
			`# computer. But more than likely, GCE's upstream speed to S3 (even`
			`# cross-region) is better than Comcast. :)`
			`cp -Rv ~/.aws worker_payload/`
			`zip -r worker_payload worker_payload`
			`}`
Create a Docker image to run the map importer in the almighty cloud. #326 2021-05-07 00:55:51 +03:00
Working on the GCP importer workflow... #326 - Amp up number of workers (about 100 cities, so 10/worker now) - Use an SSD, since especially the setup and upload steps are extremely IO bound - Split the script into pieces that can be easily disabled to iterate faster - Use the bulk API to create instances - Make the overall start_batch_import.sh a bit quieter - Make successful VMs self-destruct so it's easier to track which're done - Setup Docker on the VMs, so elevation data works 2021-05-18 22:28:41 +03:00			`function create_vms {`
			`# Create all of the VMs at once`
Give up on Docker and AWS Batch to bulk import cities. Switch to static sharding with GCE instead. #326 2021-05-18 19:50:28 +03:00			`gcloud compute \`
			`--project=$PROJECT \`
Working on the GCP importer workflow... #326 - Amp up number of workers (about 100 cities, so 10/worker now) - Use an SSD, since especially the setup and upload steps are extremely IO bound - Split the script into pieces that can be easily disabled to iterate faster - Use the bulk API to create instances - Make the overall start_batch_import.sh a bit quieter - Make successful VMs self-destruct so it's easier to track which're done - Setup Docker on the VMs, so elevation data works 2021-05-18 22:28:41 +03:00			`instances bulk create \`
			`--name-pattern='worker-#' \`
Give up on Docker and AWS Batch to bulk import cities. Switch to static sharding with GCE instead. #326 2021-05-18 19:50:28 +03:00			`--zone=$ZONE \`
Working on the GCP importer workflow... #326 - Amp up number of workers (about 100 cities, so 10/worker now) - Use an SSD, since especially the setup and upload steps are extremely IO bound - Split the script into pieces that can be easily disabled to iterate faster - Use the bulk API to create instances - Make the overall start_batch_import.sh a bit quieter - Make successful VMs self-destruct so it's easier to track which're done - Setup Docker on the VMs, so elevation data works 2021-05-18 22:28:41 +03:00			`--count=$NUM_WORKERS \`
Give up on Docker and AWS Batch to bulk import cities. Switch to static sharding with GCE instead. #326 2021-05-18 19:50:28 +03:00			`--machine-type=$MACHINE_TYPE \`
			`--boot-disk-size=$DISK_SIZE \`
Working on the GCP importer workflow... #326 - Amp up number of workers (about 100 cities, so 10/worker now) - Use an SSD, since especially the setup and upload steps are extremely IO bound - Split the script into pieces that can be easily disabled to iterate faster - Use the bulk API to create instances - Make the overall start_batch_import.sh a bit quieter - Make successful VMs self-destruct so it's easier to track which're done - Setup Docker on the VMs, so elevation data works 2021-05-18 22:28:41 +03:00			`--boot-disk-type=$DISK_TYPE \`
Give up on Docker and AWS Batch to bulk import cities. Switch to static sharding with GCE instead. #326 2021-05-18 19:50:28 +03:00			`--image-family=ubuntu-2004-lts \`
Working on the GCP importer workflow... #326 - Amp up number of workers (about 100 cities, so 10/worker now) - Use an SSD, since especially the setup and upload steps are extremely IO bound - Split the script into pieces that can be easily disabled to iterate faster - Use the bulk API to create instances - Make the overall start_batch_import.sh a bit quieter - Make successful VMs self-destruct so it's easier to track which're done - Setup Docker on the VMs, so elevation data works 2021-05-18 22:28:41 +03:00			`--image-project=ubuntu-os-cloud \`
			`--scopes=compute-rw`

			`# There's a funny history behind the whole "how do I wait for my VM to be`
			`# SSHable?" question...`
			`sleep 30s`
			`}`

			`function start_workers {`
			`for ((i = 0; i < $NUM_WORKERS; i++)); do`
			`gcloud compute scp \`
			`--project=$PROJECT \`
			`--zone=$ZONE \`
			`worker_payload.zip \`
			`worker-$i:~/worker_payload.zip`
			`gcloud compute ssh \`
			`--project=$PROJECT \`
			`--zone=$ZONE \`
			`worker-$i \`
			`--command="sudo apt-get -qq install -y unzip; unzip -q worker_payload.zip; ./worker_payload/worker_script.sh $EXPERIMENT_TAG $i $NUM_WORKERS 1> logs 2>&1 &"`
			`done`
			`}`

			`build_payload`
			`create_vms`
			`start_workers`

			`# To follow along with a worker:`
			`# > gcloud compute ssh worker-5 --command='tail -f logs'`
			`#`
			`# To see which workers are still running (or have failed):`
			`# > gcloud compute instances list`