Adds fly launcher

This commit is contained in:
erp12 2021-10-14 22:07:57 -04:00
parent 003426318b
commit 2d066d8089

117
scripts/fly_launcher.py Normal file
View File

@ -0,0 +1,117 @@
"""Launcher for Propeller GP runs on the Hampshire College Fly cluster.
Setup
=====
1. Get access to an account on the Fly cluster.
2. SSH into the Fly cluster.
3. Clone `propeller` (probably your personal fork) in your user directory.
4. Make sure that you have Python 3.6 or later on your path.
5. Run `/share/apps/bin/lein --version` to do a 1-time setup of Leiningen.
How To Run
==========
1. Check out the version of Propeller you would like to run. For example, check out your
feature branch.
2. Run this script with Python 3: `python3 scripts/fly_launcher.py [PARAMS]`.
Parameters
==========
-h, --help show this help message and exit
-n NUM_RUNS, --num-runs NUM_RUNS The number of runs of the problem to start.
-o OUT, --out OUT The path to put the log files of the run captured from stdout.
-p PROBLEM, --problem PROBLEM The namespaces of the problem file in the propeller repository.
-d PROPELLER, --propeller PROPELLER The path to propeller.
-i ID, --id ID The identifier for the overall flight of propeller runs.
-t TAG, --tag TAG An optional tag to add to the runs.
or run `python3 scripts/fly_launcher.py -h` for help.
Example
=======
python3 fly_launcher.py \
--num-runs 10 \
--out "~/runs/propeller/my-experiment/" \
--problem "propeller.problems.simple-regression" \
--propeller "~/propeller" \
--id my-gp-experiment
"""
# @todo Add support for n runs of a set of problems?
import argparse
import os
import shlex
import subprocess
def alf_cmd(opts: argparse.Namespace, run_id: int) -> str:
    """Build the Alfred ``RemoteCmd`` entry for a single Propeller run.

    The generated shell command changes into the propeller checkout, creates
    the output directory if needed, and runs the problem namespace through
    Leiningen with stdout redirected to ``run<run_id>.txt`` inside
    ``opts.out``.

    Every user-supplied value is passed through ``shlex.quote`` so that a
    path or namespace containing spaces or shell metacharacters reaches
    ``/bin/sh`` as a single word. ``shlex.quote`` leaves values made up only
    of shell-safe characters unchanged, so ordinary paths render exactly as
    before.

    Args:
        opts: Parsed options; ``out``, ``propeller`` and ``problem`` are read.
        run_id: Index of the run, used to name the log file.

    Returns:
        The ``RemoteCmd {/bin/sh -c {...}}`` string for this run.
    """
    log_file = os.path.join(opts.out, f"run{run_id}.txt")
    cmds = [
        "echo Starting run",
        "export PATH=$PATH:/usr/java/latest/bin",
        f"cd {shlex.quote(opts.propeller)}",
        f"mkdir -p {shlex.quote(opts.out)}",
        "/share/apps/bin/lein with-profiles production trampoline run"
        f" -m {shlex.quote(opts.problem)} > {shlex.quote(log_file)}",
        "echo Finished Run",
    ]
    script = "; ".join(cmds)
    # Doubled braces are literal: the result is RemoteCmd {/bin/sh -c {<script>}}.
    return f"RemoteCmd {{/bin/sh -c {{{script}}}}}"
def alf_task(opts: argparse.Namespace, run_id: int) -> str:
    """Render the Alfred ``Task`` entry for one run.

    The task title combines the run index, the problem namespace and the
    flight id. The task's only command is the ``RemoteCmd`` produced by
    ``alf_cmd``, followed by ``-service {tom}`` and the tag from ``opts.tag``.

    Args:
        opts: Parsed options; ``problem``, ``id`` and ``tag`` are read here.
        run_id: Index of the run within the job.

    Returns:
        The task text, terminated by a newline.
    """
    label = "Run {} - {} - {}".format(run_id, opts.problem, opts.id)
    command = alf_cmd(opts, run_id)
    pieces = [
        f"Task -title {{{label}}} -cmds {{",
        f"{command} -service {{tom}} -tags {{{opts.tag}}}",
        "}",
        "",  # yields the trailing newline after the closing brace
    ]
    return "\n".join(pieces)
def alf_job(opts: argparse.Namespace) -> str:
    """Render the complete Alfred job script for a flight of runs.

    One task is generated per run index in ``range(opts.num_runs)`` and the
    tasks are nested as subtasks of a single job titled with ``opts.id``.

    Args:
        opts: Parsed options; ``num_runs`` and ``id`` are read here and the
            whole namespace is forwarded to ``alf_task``.

    Returns:
        The job file contents, starting with the ``##AlfredToDo 3.0`` header.
    """
    subtasks = "\n ".join(alf_task(opts, idx) for idx in range(opts.num_runs))
    header = f"##AlfredToDo 3.0\nJob -title {{{opts.id}}} -subtasks {{\n"
    footer = "\n}\n"
    return header + subtasks + footer
def cli_opts() -> argparse.ArgumentParser:
    """Create the command-line parser for the launcher.

    All options except ``--tag`` are required. Declaring them as such makes
    argparse print a usage error and exit when one is missing, instead of
    leaving the attribute as ``None`` for later code to trip over.

    Returns:
        A parser exposing ``num_runs``, ``out``, ``problem``, ``propeller``,
        ``id`` and ``tag`` (default ``""``).
    """
    parser = argparse.ArgumentParser()
    parser.add_argument(
        "-n", "--num-runs", type=int, required=True,
        help="The number of runs of the problem to start.",
    )
    parser.add_argument(
        "-o", "--out", required=True,
        help="The path to put the log files of the run captured from stdout.",
    )
    parser.add_argument(
        "-p", "--problem", required=True,
        help="The namespaces of the problem file in the propeller repository.",
    )
    parser.add_argument(
        "-d", "--propeller", required=True,
        help="The path to propeller.",
    )
    parser.add_argument(
        "-i", "--id", required=True,
        help="The identifier for the overall flight of propeller runs.",
    )
    parser.add_argument(
        "-t", "--tag", default="",
        help="An optional tag to add to the runs.",
    )
    return parser
# Shell snippet run before spooling; it sources /etc/sysconfig/pixar
# (presumably the cluster's Pixar/Tractor environment setup -- confirm).
PIXAR_INIT = "source /etc/sysconfig/pixar"

# Spooler invocation: the Python 2.6 interpreter under the tractor-blade
# install runs tractor-spool.py against the engine at fly:8000. The job file
# path is appended by the caller.
PIXAR_CMD = " ".join(
    (
        "/opt/pixar/tractor-blade-1.7.2/python/bin/python2.6",
        "/opt/pixar/tractor-blade-1.7.2/tractor-spool.py",
        "--engine=fly:8000",
    )
)
if __name__ == "__main__":
    # Script entry point: write the Alfred job file for the requested runs
    # and hand it to the Tractor spooler.
    cli_parser = cli_opts()
    args = cli_parser.parse_args()

    # Expand "~" and make both paths absolute, since they are embedded in
    # commands that later run from a different working directory.
    args.out = os.path.abspath(os.path.expanduser(args.out))
    args.propeller = os.path.abspath(os.path.expanduser(args.propeller))
    if not os.path.isdir(args.propeller):
        raise ValueError(f"Propeller not found at {args.propeller}")
    # exist_ok avoids the check-then-create race of a separate isdir() test.
    os.makedirs(args.out, exist_ok=True)

    alf_file = os.path.join(args.out, "propeller_runs.alf")
    with open(alf_file, "w") as alf:
        alf.write(alf_job(args))

    # shell=True is needed because PIXAR_INIT must be sourced in the same
    # shell that runs the spooler; the job file path is quoted so an output
    # directory containing spaces is still passed as one argument.
    ret = subprocess.run(
        f"{PIXAR_INIT};{PIXAR_CMD} {shlex.quote(alf_file)}",
        shell=True,
    )
    # Propagate the spooler's exit status so a failed submission is visible
    # to the caller instead of the script always exiting with 0.
    raise SystemExit(ret.returncode)