118 lines
4.0 KiB
Python
118 lines
4.0 KiB
Python
"""Launcher for Propeller GP runs on the Hampshire College Fly cluster.
|
|
|
|
Setup
|
|
=====
|
|
|
|
1. Get access to an account on the Fly cluster.
|
|
2. SSH into the Fly cluster.
|
|
3. Clone `propeller` (probably your personal fork) in your user directory.
|
|
4. Make sure that your have Python 3.6 or later on your path.
|
|
5. Run `/share/apps/bin/lein --version` to do a 1-time setup of Leiningen.
|
|
|
|
How To Run
|
|
==========
|
|
|
|
1. Put your version of Propeller on the correct version you would like to run. For example, checkout your
|
|
feature branch.
|
|
|
|
2. Run this this script with Python 3 with `python3 scripts/fly_launcher [PARAMS]`.
|
|
|
|
Parameters
|
|
==========
|
|
|
|
-h, --help show this help message and exit
|
|
-n NUM_RUNS, --num-runs NUM_RUNS The number of runs of the problem to start.
|
|
-o OUT, --out OUT The path to put the log files of the run captured from stdout.
|
|
-p PROBLEM, --problem PROBLEM The namespaces of the problem file in the propeller repository.
|
|
-d PROPELLER, --propeller PROPELLER The path to propeller.
|
|
-i ID, --id ID The identifier for the overall flight of propeller runs.
|
|
-t TAG, --tag TAG An optional tag to add to the runs.
|
|
|
|
or run `python3 scripts/fly_launcher.py -h` for help.
|
|
|
|
Example
|
|
=======
|
|
|
|
python3 fly_launcher.py \
|
|
--num-runs 10 \
|
|
--out "~/runs/propeller/my-experiment/" \
|
|
--problem "propeller.problems.simple-regression" \
|
|
--propeller "~/propeller" \
|
|
--id my-gp-experiment
|
|
|
|
"""
|
|
|
|
# @todo Add support for n runs of a set of problems?
|
|
|
|
import argparse
|
|
import os
|
|
import subprocess
|
|
|
|
|
|
def alf_cmd(opts: argparse.Namespace, run_id: int) -> str:
|
|
log_file = os.path.join(opts.out, f"run{run_id}.txt")
|
|
cmds = [
|
|
"echo Starting run",
|
|
"export PATH=$PATH:/usr/java/latest/bin",
|
|
f"cd {opts.propeller}",
|
|
f"mkdir -p {opts.out}",
|
|
f"/share/apps/bin/lein with-profiles production trampoline run -m {opts.problem} > {log_file}",
|
|
"echo Finished Run"
|
|
]
|
|
return f"""RemoteCmd {{/bin/sh -c {{{"; ".join(cmds)}}}}}"""
|
|
|
|
|
|
def alf_task(opts: argparse.Namespace, run_id: int) -> str:
|
|
title = f"Run {run_id} - {opts.problem} - {opts.id}"
|
|
return f"""Task -title {{{title}}} -cmds {{
|
|
{alf_cmd(opts, run_id)} -service {{tom}} -tags {{{opts.tag}}}
|
|
}}
|
|
"""
|
|
|
|
|
|
def alf_job(opts: argparse.Namespace) -> str:
|
|
tasks = "\n ".join([alf_task(opts, i) for i in range(opts.num_runs)])
|
|
return f"""##AlfredToDo 3.0
|
|
Job -title {{{opts.id}}} -subtasks {{
|
|
{tasks}
|
|
}}
|
|
"""
|
|
|
|
|
|
def cli_opts() -> argparse.ArgumentParser:
|
|
parser = argparse.ArgumentParser()
|
|
parser.add_argument("-n", "--num-runs", type=int, help="The number of runs of the problem to start.")
|
|
parser.add_argument("-o", "--out", help="The path to put the log files of the run captured from stdout.")
|
|
parser.add_argument("-p", "--problem", help="The namespaces of the problem file in the propeller repository.")
|
|
parser.add_argument("-d", "--propeller", help="The path to propeller.")
|
|
parser.add_argument("-i", "--id", help="The identifier for the overall flight of propeller runs.")
|
|
parser.add_argument("-t", "--tag", default="", help="An optional tag to add to the runs.")
|
|
return parser
|
|
|
|
|
|
PIXAR_INIT = "source /etc/sysconfig/pixar"
|
|
PIXAR_CMD = "/opt/pixar/tractor-blade-1.7.2/python/bin/python2.6 /opt/pixar/tractor-blade-1.7.2/tractor-spool.py --engine=fly:8000"
|
|
|
|
|
|
if __name__ == "__main__":
|
|
cli_parser = cli_opts()
|
|
args = cli_parser.parse_args()
|
|
|
|
args.out = os.path.abspath(os.path.expanduser(args.out))
|
|
args.propeller = os.path.abspath(os.path.expanduser(args.propeller))
|
|
|
|
if not os.path.isdir(args.propeller):
|
|
raise ValueError(f"Propeller not found at {args.propeller}")
|
|
|
|
if not os.path.isdir(args.out):
|
|
os.makedirs(args.out)
|
|
|
|
alf_file = os.path.join(args.out, "propeller_runs.alf")
|
|
with open(alf_file, "w") as alf:
|
|
alf.write(alf_job(args))
|
|
|
|
ret = subprocess.run(
|
|
f"{PIXAR_INIT};{PIXAR_CMD} {alf_file}",
|
|
shell=True
|
|
)
|