#
# BonFIRE Virtual Clusters on Federated Clouds Demonstration Kit
#
# Copyright (c) Fundacion Centro Tecnologico de Supercomputacion de Galicia 2012
#
# License Apache Software
#
# The research leading to these results has received funding from
# the European Community's Seventh Framework Programme (FP7/2007-2013)
# under agreement number 257386
#
# This software is provided with ABSOLUTELY NO WARRANTY
#
# Purpose: builds the Virtual Cluster client image.
#
# The script creates a short-lived experiment, boots one VM from the base
# image, installs the client software and the Virtual Cluster scripts over
# SSH, saves the VM disk under NEW_IMAGE_NAME, waits for the VM to finish
# and finally deletes the experiment.
#
# It expects 'killproc.sh' and the 'vc/*.py' scripts to be reachable from the
# current working directory, because they are uploaded with relative paths.
require 'rubygems'
require 'restfully'
require 'restfully/addons/bonfire'

## Editable parameters
#LOCATION = "de-hlrs"
LOCATION = "fr-inria"
#LOCATION = "uk-epcc"
##

EXPERIMENT_NAME = "Build image client"
EXPERIMENT_DESCRIPTION = "Build image client for virtual cluster."
EXPERIMENT_WALLTIME = 3600
IMAGE_NAME = "BonFIRE Debian Squeeze 2G v3"
NEW_IMAGE_DESCRIPTION = "VirtualCluster Client image."
WAN_NAME = "BonFIRE WAN"

# NOTE(review): the SSH gateway is fixed to the fr-inria host even when
# LOCATION is changed above -- confirm that this is intended.
session = Restfully::Session.new(
  :configuration_file => "~/.restfully/api.bonfire-project.eu",
  :cache => false,
  :gateway => "ssh.fr-inria.bonfire-project.eu",
  :keys => ["~/.ssh/id_rsa"]
)
session.logger.level = Logger::INFO
#session.logger.level = Logger::DEBUG

# The saved image is named after the user found in the session configuration.
NEW_IMAGE_NAME = "VirtualClusterClient-#{session.config[:username]}-v0.1"

# Kept outside the begin block so the rescue clause can clean it up.
experiment = nil

begin
  # Resolve every remote resource the VM needs before creating anything, so
  # that a wrong LOCATION, IMAGE_NAME or WAN_NAME is reported with a clear
  # message instead of a NoMethodError on nil or a rejected submission.
  location = session.root.locations[LOCATION.to_sym]
  fail "Can't select the machine location" if location.nil?
  session.logger.info "Chosen location is: #{location['name']}"

  base_image = location.storages.find { |s| s['name'] == IMAGE_NAME }
  fail "Can't find the base image '#{IMAGE_NAME}'" if base_image.nil?

  wan = location.networks.find { |n| n['name'] == WAN_NAME }
  fail "Can't find the network '#{WAN_NAME}'" if wan.nil?

  session.logger.info "Deploying experiment..."
  experiment = session.root.experiments.submit(
    :name => EXPERIMENT_NAME,
    :description => "#{EXPERIMENT_DESCRIPTION} - #{Time.now}",
    :walltime => EXPERIMENT_WALLTIME
  )

  # An image with the same name left over from a previous run is removed
  # before the new one is saved.
  session.logger.info "Deleting previous version"
  previous_image = location.storages.find { |s| s['name'] == NEW_IMAGE_NAME }
  previous_image.delete unless previous_image.nil?

  session.logger.info "Launching machine..."
  machine = experiment.computes.submit(
    :name => "machine-experiment#{experiment['id']}",
    :instance_type => "small",
    :disk => [{:storage => base_image}],
    :nic => [{:network => wan}],
    :location => location,
    :context => {}
  )
  hostname = "#{machine['name']}-#{machine['id']}"
  session.logger.info "Machine: #{hostname} #{machine['nic'][0]['ip']}"

  session.logger.info "Starting experiment..."
  experiment.update(:status => "running")

  # Poll every 20 seconds until the VM is running and reachable over SSH.
  session.logger.info "Checking if machine is ready..."
  until machine.reload['state'] == 'RUNNING' && machine.ssh.accessible?
    fail "Machine has failed" if machine['state'] == 'FAILED'
    session.logger.info "Machine is not ready. Waiting..."
    sleep 20
  end

  session.logger.info "Machine is ready"

  # Commands run on the VM as a single newline-separated script. The literals
  # are kept exactly as they were; note that "\ " inside a double-quoted Ruby
  # string is a plain space, so sed receives the one-line form "2 i sleep 5".
  install_script = [
    "apt-get update",
    "apt-get install -y -q nfs-common",
    "apt-get autoclean",
    "mkdir -p /root/vc",
    "mkdir -p /shared",
    "echo 'source /etc/default/bonfire' >> /root/.bashrc",
    "sed '2 i\ sleep 5' /etc/rc.local > /tmp/rc.local",
    "sed -i '2 i\ sleep 5' /etc/rc.local",
    "sed -i '2 i\ /root/killproc.sh &' /etc/rc.local",
    "sed -i '/^exit/ i\ nohup python -u /root/vc/vc-node-init.py /var/log/vc-node-init.log &' /etc/rc.local",
    "chmod 755 /etc/rc.local",
    "chmod u+x /root/killproc.sh"
  ].join("\n")

  machine.ssh do |ssh|
    session.logger.info "Preinstallation..."
    output = ssh.scp.upload!('killproc.sh', '/root/')
    session.logger.info output unless output.nil?

    session.logger.info "Installing software..."
    output = ssh.exec!(install_script)
    session.logger.info output unless output.nil?

    session.logger.info "Uploading Virtual Cluster scripts..."
    output = ssh.exec!("mkdir -p /root/vc")
    session.logger.info output unless output.nil?
    Dir.glob("vc/*.py").each do |file|
      output = ssh.scp.upload!(file, '/root/vc/')
      session.logger.info output unless output.nil?
    end
  end
  session.logger.warn "Image installation finished"

  # Request the disk to be saved under the new name, then shut the VM down.
  session.logger.warn "Saving image and shutting down"
  machine.update(:disk => [{:save_as => {:name => NEW_IMAGE_NAME}}])
  machine.update(:state => 'SHUTDOWN')

  # Poll every 20 seconds until the VM reports DONE. A FAILED VM aborts the
  # wait instead of looping forever.
  until machine.reload['state'] == 'DONE'
    fail "Machine has failed while saving the image" if machine['state'] == 'FAILED'
    session.logger.info "Machine is #{machine['state']}."
    sleep 20
  end

  experiment.delete

  session.logger.info "Image built: #{NEW_IMAGE_NAME}"
  session.logger.warn "Experiment terminated!"

# Exception (not just StandardError) is rescued on purpose: pressing CTRL-C
# during the run must still reach this cleanup path. A second CTRL-C during
# the 30-second pause below leaves the rescue clause before the delete call,
# which is how the user keeps the VMs for inspection.
rescue Exception => e
  session.logger.error "#{e.class.name}: #{e.message}"
  session.logger.error e.backtrace.join("\n")
  session.logger.warn "Cleaning up in 30 seconds. Hit CTRL-C now to keep your VMs..."
  sleep 30
  experiment.delete unless experiment.nil?
end