-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathhal-docker.py
executable file
·140 lines (110 loc) · 5.38 KB
/
hal-docker.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
#!/usr/bin/python3
import argparse
import subprocess
import sys,os
import random
# wrap a script in the docker environment and put it in output_script
def make_docker_script(args, uid, gid, input_script, output_script, verbose):
    """Write a bash wrapper that runs ``input_script`` inside a docker container.

    The generated wrapper:
      1. starts a detached container from ``args.image`` with ``args.dir``
         mounted read-write as ``/host`` and ``/home/<args.user>`` as the
         working directory;
      2. installs traps that stop and remove the container when the wrapper
         receives one of the listed signals;
      3. runs the lines of ``input_script``, joined with ``;``, through
         ``docker exec $DOCKER_ID /bin/bash -c '...'`` in the background and
         waits for it;
      4. stops and removes the container.

    Args:
        args: parsed options; the attributes ``user``, ``dir``, ``image``,
            ``args`` and ``result_dir`` are read here.
        uid: numeric user id passed to ``docker run -u``.
        gid: numeric group id passed to ``docker run -u``.
        input_script: path of the script whose lines are executed in the
            container. Lines containing ``#`` are rejected.
        output_script: path the wrapper is written to. It may be the same
            path as ``input_script``: the input is fully read and closed
            before the output is opened for writing.
        verbose: when true, add ``set -x`` and ``docker ps`` to the wrapper
            and print the wrapper to stdout.

    Returns:
        ``output_script``, unchanged.

    Raises:
        SystemExit: with status 1 if any line of ``input_script`` contains
            a ``#`` character.
    """
    # start (run) the docker image
    script = ''
    if verbose:
        script += 'set -x\n'
    script += "DOCKER_ID=`docker run -t -u " + str(uid) + ":" + str(gid) + " -w /home/{} -v /dev/urandom:/dev/random --privileged -d -v {}:/host:rw {}`\n".format(args.user, args.dir, args.image)
    if verbose:
        script += "docker ps\n"

    # this is so we can control-c/oardel a process and close the docker;
    # each trap reports the signal it is actually registered for
    for signal_name in ('SIGINT', 'SIGKILL', 'SIGTERM', 'SIGQUIT', 'SIGABRT', 'SIGCHLD'):
        script += 'trap "echo stopping $DOCKER_ID with {0}; docker stop $DOCKER_ID; docker rm $DOCKER_ID;exit 1" {0}\n'.format(signal_name)
    script += 'trap\n'

    # build the single-line payload handed to `bash -c` inside the container
    payload = 'set -x;' if verbose else ''
    payload += 'RAND=' + str(random.randint(1, 10000)) + ';'
    if args.args:
        payload += "ARGS=\"{}\";".format(" ".join(args.args))
    if args.result_dir:
        payload += "RESULT_DIR=\"{}\";".format(args.result_dir)
    with open(input_script) as source:
        for line in source:
            if '#' in line:
                print("ERROR: comments are not allowed in scripts!")
                sys.exit(1)
            statement = line.replace('\n', '')
            # a blank line would become an empty statement (";;"), which
            # bash rejects as a syntax error, so it is skipped
            if not statement.strip():
                continue
            payload += statement + ';'

    script += "docker exec $DOCKER_ID /bin/bash -c \'{}\' & \n".format(payload)
    script += "CHILD=$!\n"
    script += "wait \"$CHILD\"\n"
    # stop and remove the docker image
    script += "docker stop $DOCKER_ID;\n"
    script += "docker rm $DOCKER_ID;\n"

    if verbose:
        print(script)
    with open(output_script, 'w') as f:
        f.write(script)
    return output_script
def run(cmd, verbose):
    """Execute ``cmd`` through the shell, echoing it first when ``verbose``.

    The command's exit status is not inspected and nothing is returned.
    """
    if verbose:
        banner = "CMD: " + cmd
        print(banner)
    subprocess.run(cmd, shell=True)
def parse_args():
    """Declare the command-line options and parse ``sys.argv``.

    Returns:
        A ``(namespace, parser)`` pair: the parsed options and the
        ``ArgumentParser`` that produced them (callers use the parser to
        print the help text on invalid input).
    """
    cli = argparse.ArgumentParser()
    # (flags, add_argument keyword settings), in the order they appear in --help
    option_table = (
        (("-a", "--args"), dict(help="arguments to the run script", type=str, nargs='+')),
        (("-c", "--cmd"), dict(help="command to run", type=str)),
        (("-C", "--compile"), dict(help="compilation script", type=str)),
        (("-d", "--dir"), dict(help="directory to be mounted as /host", type=str, default="exp")),
        (("-i", "--image"), dict(help="DOCKER image")),
        (("-k", "--kill"), dict(help="kill a job [--kill job_number]", type=str, nargs='+')),
        (("-n", "--cores"), dict(help="number of cores for OAR [use 24 for a full node, 32 for the 'fat nodes']", type=str, default="1")),
        (("-r", "--replicates"), dict(help="number of replicates", type=int, default=1)),
        (("-R", "--result_dir"), dict(help="set $RESULT_DIR in your execution script", type=str)),
        (("-S", "--script"), dict(help="script to compile and run", type=str)),
        (("-s", "--submit"), dict(help="submit the job to OAR", action="store_true")),
        (("-u", "--user"), dict(help="user name to connect to in the docker", type=str, default="user")),
        (("-v", "--verbose"), dict(help="print more information", action="store_true")),
        (("-w", "--walltime"), dict(help="walltime for the OAR job (warning the job will be killed after this time)", type=str, default="24:00")),
    )
    for flags, settings in option_table:
        cli.add_argument(*flags, **settings)
    return cli.parse_args(), cli
### main logic
# Dispatch on the parsed options:
#   --kill            -> forward the job ids to `oardel` and exit
#   --compile         -> wrap the compilation script and run it locally
#   --cmd             -> write the command to a file, wrap it and run it locally
#   --script          -> wrap the script and run it locally, or, with --submit,
#                        hand the wrapper to `oarsub` once per replicate
args, parser = parse_args()
uid = os.getuid()
gid = os.getgid()

if args.kill:
    run("oardel -s SIGTERM " + ' '.join(args.kill), args.verbose)
    sys.exit(0)

if not args.image:
    print("ERROR: we need a docker image!")
    parser.print_help()
    sys.exit(1)

if not args.dir:
    print("ERROR: please specify a directory to be mounted in the image as /host!")
    parser.print_help()
    sys.exit(1)

if not args.cmd and not args.script and not args.compile:
    print("ERROR: we need a command or a script!")
    parser.print_help()
    sys.exit(1)

# generated wrapper scripts are written to $HOME/tmp/
pwd = os.environ['HOME'] + '/tmp/'
# exist_ok avoids the check-then-create race when two invocations start together
os.makedirs(pwd, exist_ok=True)

if args.compile:
    s = make_docker_script(args, uid, gid, args.compile, pwd + "compile.sh", args.verbose)
    run("/bin/bash " + s, args.verbose)

if args.cmd:
    # the command is first stored as a one-line script, then replaced in
    # place by its docker wrapper
    with open(pwd + "cmd.sh", 'w') as f:
        f.write(args.cmd + "\n")
    s = make_docker_script(args, uid, gid, pwd + "cmd.sh", pwd + "cmd.sh", args.verbose)
    run("/bin/bash " + s, args.verbose)

if args.script and not args.submit:
    print("script:", args.script)
    s = make_docker_script(args, uid, gid, args.script, pwd + "script.sh", args.verbose)
    run("/bin/bash " + s, args.verbose)
elif args.script:
    oarsub_args = "-l/nodes=1/core={},walltime={}".format(args.cores, args.walltime)
    s = make_docker_script(args, uid, gid, args.script, pwd + "script.sh", args.verbose)
    cmd = "oarsub " + oarsub_args + " \"/bin/bash " + s + "\""
    # every replicate submits the same wrapper script as a separate OAR job
    for _ in range(args.replicates):
        run(cmd, args.verbose)