-
Notifications
You must be signed in to change notification settings - Fork 48
/
Copy pathec2.py
374 lines (337 loc) · 12.2 KB
/
ec2.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
"""
ec2.py
~~~~~~
Simple EC2 cluster management with Python, designed to make it easy to
name and work with clusters, and to integrate with `fabric`.
For usage information see README.md.
"""
#### Library imports
# Standard library
import os
import shelve
import subprocess
import sys
import time
# Third party libraries
from boto.ec2.connection import EC2Connection
# My libraries
import ec2_classes
#### Constants and globals
# The list of EC2 AMIs to use, from alestic.com.  Keys are EC2 instance
# type names, values are the id of the image launched for that type.
AMIS = {
    # Instance types launched from the first image
    "m1.small": "ami-e2af508b",
    "c1.medium": "ami-e2af508b",
    # Instance types launched from the second image
    "m1.large": "ami-68ad5201",
    "m1.xlarge": "ami-68ad5201",
    "m2.xlarge": "ami-68ad5201",
    "m2.2xlarge": "ami-68ad5201",
    "m2.4xlarge": "ami-68ad5201",
    "c1.xlarge": "ami-68ad5201",
    # This instance type has an image of its own
    "cc1.4xlarge": "ami-1cad5275",
}
# The most important data structure we use is a persistent shelf which
# is used to represent all the clusters.  The keys in this shelf are
# the `cluster_names`, and the values will be ec2_classes.Cluster
# objects, which represent named EC2 clusters.
#
# The shelf will be stored at "HOME/.ec2-shelf", where HOME is the home
# directory of the user running this module (previously a single
# hard-coded path, which only worked for one account).
HOME = os.path.expanduser("~")
# Check that the required environment variables exist
def check_environment_variables_exist(*args):
    """
    Check that the environment variables named in `*args` have all
    been defined.  For every one that is missing print a message; if
    any are missing, print "Exiting" and exit with status 1.  Returns
    `None` when every variable is present.
    """
    missing = [var for var in args if var not in os.environ]
    for var in missing:
        print("Need to set $%s environment variable" % var)
    if missing:
        print("Exiting")
        # Non-zero status so that calling shells and scripts can tell
        # the check failed.
        sys.exit(1)
# Stop at import time, before the connection object is built, if any
# of the settings this module reads from the environment is missing.
check_environment_variables_exist(
    "AWS_HOME",
    "AWS_KEYPAIR",
    "AWS_ACCESS_KEY_ID",
    "AWS_SECRET_ACCESS_KEY",
)

# EC2 connection object, built from the access key pair in the
# environment and used by the functions below.
ec2_conn = EC2Connection(
    os.environ["AWS_ACCESS_KEY_ID"],
    os.environ["AWS_SECRET_ACCESS_KEY"],
)
#### The following are the functions corresponding to the command line
#### API calls: create, show, show_all etc.
def create(cluster_name, n, instance_type):
    """
    Create an EC2 cluster with name `cluster_name`, and `n` instances
    of type `instance_type`.  Update the `clusters` shelf to include a
    description of the new cluster.

    Prints a message and exits if a cluster called `cluster_name`
    already exists, or if `n` is not between 1 and 20.  An
    `instance_type` which is not a key of `AMIS` is replaced by
    "m1.small".
    """
    # Parameter check
    if exists(cluster_name):
        print("A cluster with name %s already exists. Exiting."
              % cluster_name)
        sys.exit()
    if n < 1 or n > 20:
        print("Clusters must contain between 1 and 20 instances. Exiting.")
        sys.exit()
    if instance_type not in AMIS:
        print("Instance type not recognized, setting it to be 'm1.small'.")
        instance_type = "m1.small"
    # Open the shelf before launching anything, so that a problem with
    # the shelf shows up before any instances have been started.
    clusters = shelve.open("%s/.ec2-shelf" % HOME, writeback=True)
    try:
        # Create the EC2 instances
        instances = create_ec2_instances(n, instance_type)
        # Update clusters
        clusters[cluster_name] = ec2_classes.Cluster(
            cluster_name, instance_type, instances)
    finally:
        # Release the shelf even if launching the instances fails
        clusters.close()
def show(cluster_name):
    """
    Write a description of cluster `cluster_name` to stdout: its name,
    its instance type, and a table with one row per instance giving
    the instance's index, EC2 id and public dns name.  Exits (via
    `get_cluster`) if no such cluster exists.
    """
    cluster = get_cluster(cluster_name)
    # Every table row, header included, uses the same column widths
    row = "{0:8}{1:13}{2:35}".format
    print("Displaying instances from cluster: %s" % cluster_name)
    print("Instances of type: %s" % cluster.instance_type)
    print(row("index", "EC2 id", "public dns name"))
    for position, member in enumerate(cluster.instances):
        print(row(str(position), member.id, member.public_dns_name))
def show_all():
    """
    Print the details of all clusters to stdout.  If the shelf holds
    no clusters, say so and exit.
    """
    clusters = shelve.open("%s/.ec2-shelf" % HOME, writeback=True)
    try:
        # Take a snapshot of the names so that the shelf can be closed
        # before `show` reopens the same file through `get_cluster`.
        cluster_names = list(clusters.keys())
    finally:
        clusters.close()
    if not cluster_names:
        print("No clusters present.")
        sys.exit()
    print("Showing all clusters.")
    for cluster_name in cluster_names:
        show(cluster_name)
def shutdown(cluster_name):
    """
    Shutdown all EC2 instances in ``cluster_name``, and remove
    ``cluster_name`` from the shelf of clusters.  Prints a message and
    exits if there is no cluster with that name.
    """
    if not exists(cluster_name):
        print("No cluster with that name.")
        sys.exit()
    print("Shutting down cluster %s." % cluster_name)
    clusters = shelve.open("%s/.ec2-shelf" % HOME, writeback=True)
    try:
        ec2_conn.terminate_instances(
            [instance.id for instance in clusters[cluster_name].instances])
        # Only forget the cluster once the terminate request has been
        # issued without raising.
        del clusters[cluster_name]
    finally:
        # close() also syncs the shelf, so no separate sync() is
        # needed; the shelf is released even if termination fails.
        clusters.close()
def shutdown_all():
    """
    Shutdown all EC2 instances in all clusters, and remove all
    clusters from the `clusters` shelf.  If there are no clusters,
    say so and exit.
    """
    clusters = shelve.open("%s/.ec2-shelf" % HOME, writeback=True)
    try:
        # Snapshot the names and close the shelf first: `shutdown`
        # opens the same shelf file itself and deletes entries from
        # it, which must not happen underneath an open handle that is
        # still being iterated.
        cluster_names = list(clusters.keys())
    finally:
        clusters.close()
    if not cluster_names:
        print("No clusters to shut down. Exiting.")
        sys.exit()
    for cluster_name in cluster_names:
        shutdown(cluster_name)
def login(cluster_name, instance_index):
    """
    Open an ssh session, as user `ubuntu`, on instance number
    `instance_index` of `cluster_name`.  The identity file is
    "$AWS_HOME/$AWS_KEYPAIR.pem".  Exits (via the lookup helpers) if
    the cluster or the instance index does not exist.
    """
    target = get_instance(get_cluster(cluster_name), instance_index)
    print("SSHing to instance with address %s" % target.public_dns_name)
    key_file = "%s/%s.pem" % (
        os.environ["AWS_HOME"], os.environ["AWS_KEYPAIR"])
    command = "ssh -i %s ubuntu@%s" % (key_file, target.public_dns_name)
    os.system(command)
def kill(cluster_name, instance_index):
    """
    Shutdown instance `instance_index` in cluster `cluster_name`, and
    remove from the clusters shelf.  If we're killing off the last
    instance in the cluster then it runs `shutdown(cluster_name)`
    instead.

    Exits (via the lookup helpers) if the cluster or the instance
    index does not exist.  Returns `None` once the work is done; it
    does not terminate the calling process on success.
    """
    cluster = get_cluster(cluster_name)
    instance = get_instance(cluster, instance_index)
    # The cluster is already loaded, so count its instances directly
    # rather than reading the shelf again.
    if len(cluster.instances) == 1:
        print("Last machine in cluster, shutting down entire cluster.")
        shutdown(cluster_name)
        return
    print("Shutting down instance %s on cluster %s." %
          (instance_index, cluster_name))
    ec2_conn.terminate_instances([instance.id])
    del cluster.instances[instance_index]
    clusters = shelve.open("%s/.ec2-shelf" % HOME, writeback=True)
    try:
        clusters[cluster_name] = cluster
    finally:
        # Release the shelf even if storing the cluster fails
        clusters.close()
def add(cluster_name, n):
    """
    Grow `cluster_name` by `n` new instances, launched with the
    instance type already recorded for the cluster, and store the
    enlarged cluster back in the shelf.  Exits if the cluster does not
    exist (via `get_cluster`) or if `n` is less than 1.
    """
    cluster = get_cluster(cluster_name)
    if n < 1:
        print("Must be adding at least 1 instance to the cluster. Exiting.")
        sys.exit()
    # Launch the new machines and attach them to the in-memory cluster
    new_instances = create_ec2_instances(n, cluster.instance_type)
    cluster.add(new_instances)
    # Persist the updated cluster
    shelf = shelve.open("%s/.ec2-shelf" % HOME, writeback=True)
    shelf[cluster_name] = cluster
    shelf.close()
def ssh(cluster_name, instance_index, cmd, background=False):
    """
    Run `cmd` on instance number `instance_index` on `cluster_name`.
    Runs in the background if `background` is true.  This feature is
    not currently exposed from the command line API, but may be useful
    in future.

    `cmd` is run remotely under `nohup` as user `ubuntu`, with stdout
    sent to `foo.out`, stderr to `foo.err` and stdin taken from
    `/dev/null`.  Exits (via the lookup helpers) if the cluster or the
    instance index does not exist.
    """
    cluster = get_cluster(cluster_name)
    instance = get_instance(cluster, instance_index)
    keypair = "%s/%s.pem" % (os.environ["AWS_HOME"], os.environ["AWS_KEYPAIR"])
    # Any truthy value selects background mode
    append = " &" if background else ""
    remote_cmd = ("nohup %s > foo.out 2> foo.err < /dev/null %s" %
                  (cmd, append))
    # Hand ssh an argument list instead of a shell string: the remote
    # command then reaches ssh as exactly one argument, so quotes and
    # other shell metacharacters inside `cmd` are interpreted only by
    # the remote shell and never by a local one.
    subprocess.call(
        ["ssh", "-o", "BatchMode=yes", "-i", keypair,
         "ubuntu@%s" % instance.public_dns_name, remote_cmd])
def ssh_all(cluster_name, cmd):
    """
    Run `cmd` on all instances in `cluster_name`, one instance after
    another in index order.  Exits (via `get_cluster`) if the cluster
    does not exist.
    """
    cluster = get_cluster(cluster_name)
    # Use the cluster just loaded to enumerate the indices, instead of
    # discarding it and reading the shelf again to find the size.
    for index, _ in enumerate(cluster.instances):
        ssh(cluster_name, index, cmd)
def scp(cluster_name, instance_index, local_filename, remote_filename=False):
    """
    Recursively copy (`scp -r`) `local_filename` to `remote_filename`
    on instance `instance_index` of cluster `cluster_name`, logging in
    as user `ubuntu`.  If `remote_filename` is not given, or is
    otherwise false, the destination is "." on the remote side.  Exits
    (via the lookup helpers) if the cluster or the instance index does
    not exist.
    """
    target = get_instance(get_cluster(cluster_name), instance_index)
    key_file = "%s/%s.pem" % (
        os.environ["AWS_HOME"], os.environ["AWS_KEYPAIR"])
    destination = remote_filename if remote_filename else "."
    command = "scp -r -i %s %s ubuntu@%s:%s" % (
        key_file, local_filename, target.public_dns_name, destination)
    os.system(command)
def scp_all(cluster_name, local_filename, remote_filename=False):
    """
    Call `scp` with the given filenames once for every instance in
    `cluster_name`, in index order.
    """
    instance_count = size(cluster_name)
    for index in range(instance_count):
        scp(cluster_name, index, local_filename, remote_filename)
#### Helper functions
def create_ec2_instances(n, instance_type):
    """
    Launch `n` EC2 instances of type `instance_type`, using the image
    listed for that type in `AMIS` and the keypair named by
    $AWS_KEYPAIR, and block until none of them reports the state
    'pending'.  Returns the boto `reservation.instances` object.

    Shared by `create` and `add`, which is why it is a separate
    function.
    """
    image_id = AMIS[instance_type]
    matching_images = ec2_conn.get_all_images(image_ids=[image_id])
    # `n` is passed twice -- presumably the minimum and maximum number
    # of instances to launch; confirm against the boto documentation.
    reservation = matching_images[0].run(
        n, n, os.environ["AWS_KEYPAIR"], instance_type=instance_type)
    # Wait for the cluster to come up, polling each instance once a
    # second while it is still pending.
    for machine in reservation.instances:
        while machine.update() == u'pending':
            time.sleep(1)
    return reservation.instances
def get_cluster(cluster_name):
    """
    Look up `cluster_name` in the shelf and return the stored Cluster
    object.  If no cluster has that name, print a message and exit.
    The shelf is closed again before returning or exiting.
    """
    shelf = shelve.open("%s/.ec2-shelf" % HOME, writeback=True)
    if cluster_name in shelf:
        found = shelf[cluster_name]
        shelf.close()
        return found
    print("No cluster with the name %s exists. Exiting." % cluster_name)
    shelf.close()
    sys.exit()
def get_instance(cluster, instance_index):
    """
    Return the entry at position ``instance_index`` of
    ``cluster.instances``.  If that position does not exist, print the
    range of valid indices and exit.
    """
    members = cluster.instances
    try:
        chosen = members[instance_index]
    except IndexError:
        highest = len(members) - 1
        print("The instance index must be in the range 0 to %s. Exiting." %
              (highest,))
        sys.exit()
    else:
        return chosen
#### Methods to export externally
def exists(cluster_name):
    """
    Report whether the shelf has an entry named ``cluster_name``:
    ``True`` if it does, ``False`` if it does not.
    """
    shelf = shelve.open("%s/.ec2-shelf" % HOME, writeback=True)
    is_known = cluster_name in shelf
    shelf.close()
    return is_known
def public_dns_names(cluster_name):
    """
    Return the public dns names of the instances in `cluster_name`,
    as a list in instance order.  If the cluster is not in the shelf,
    print a message and exit.  See README.md for how this is used to
    integrate with Fabric.
    """
    shelf = shelve.open("%s/.ec2-shelf" % HOME, writeback=True)
    if cluster_name not in shelf:
        print(
            "Cluster name %s not recognized. Exiting ec2.public_dns_names()." %
            cluster_name)
        shelf.close()
        sys.exit()
    cluster = shelf[cluster_name]
    shelf.close()
    names = []
    for member in cluster.instances:
        names.append(member.public_dns_name)
    return names
def size(cluster_name):
    """
    Return the number of instances recorded for the cluster named
    ``cluster_name``.  Exits (via `get_cluster`) if there is no such
    cluster.
    """
    cluster = get_cluster(cluster_name)
    return len(cluster.instances)
#### External interface
# Command line dispatch.  The first argument names the command; the
# command name together with the total number of arguments selects the
# function to call.  Numeric arguments (instance counts and instance
# indices) are converted with int() before being passed on.
if __name__ == "__main__":
    args = sys.argv[1:]
    argc = len(args)
    # With no arguments at all there is no command; fall through to
    # the "not recognized" message below.
    cmd = args[0] if args else None
    if cmd == "create" and argc == 4:
        create(args[1], int(args[2]), args[3])
    elif cmd == "show" and argc == 2:
        show(args[1])
    elif cmd == "show_all" and argc == 1:
        show_all()
    elif cmd == "shutdown" and argc == 2:
        shutdown(args[1])
    elif cmd == "shutdown_all" and argc == 1:
        shutdown_all()
    elif cmd == "login" and argc == 2:
        # No index given: log in to the first instance
        login(args[1], 0)
    elif cmd == "login" and argc == 3:
        login(args[1], int(args[2]))
    elif cmd == "kill" and argc == 3:
        kill(args[1], int(args[2]))
    elif cmd == "add" and argc == 3:
        add(args[1], int(args[2]))
    elif cmd == "ssh" and argc == 4:
        ssh(args[1], int(args[2]), args[3])
    elif cmd == "ssh_all" and argc == 3:
        ssh_all(args[1], args[2])
    elif cmd == "scp" and argc == 4:
        scp(args[1], int(args[2]), args[3])
    elif cmd == "scp" and argc == 5:
        scp(args[1], int(args[2]), args[3], args[4])
    elif cmd == "scp_all" and argc == 3:
        scp_all(args[1], args[2])
    elif cmd == "scp_all" and argc == 4:
        scp_all(args[1], args[2], args[3])
    else:
        print("Command not recognized. "
              "For usage information, see README.md.")