Log In | Get Help   
Home My Page Projects Code Snippets Project Openings BonFIRE VCOC Demonstration Kit
Summary Activity SCM Files Wiki
[bonfiredemokit] Annotation of /virt-cluster/build-master.rb
[bonfiredemokit] / virt-cluster / build-master.rb Repository:
ViewVC logotype

Annotation of /virt-cluster/build-master.rb

Parent Directory | Revision Log


Revision 1 - (view) (download)

1 : agomez 1 require 'rubygems'
2 :     require 'restfully'
3 :     require 'restfully/addons/bonfire'
4 :    
## Editable parameters
# Key of the BonFIRE site looked up in session.root.locations further down.
# Uncomment exactly one of the lines below to pick the site.
#LOCATION = "de-hlrs"
LOCATION = "fr-inria".freeze
#LOCATION = "uk-epcc"
##

# Name and description given to the experiment; the script appends the
# current time to the description when it submits the experiment.
EXPERIMENT_NAME = "Build image master".freeze
EXPERIMENT_DESCRIPTION = "Build image master for virtual cluster".freeze
# Passed as :walltime when the experiment is submitted.
# NOTE(review): presumably seconds (one hour) -- confirm against the API.
EXPERIMENT_WALLTIME = 3600
# Name of the existing storage used as the disk of the build machine.
IMAGE_NAME = "BonFIRE Debian Squeeze 2G v3".freeze
# Name under which the customised disk is saved; a storage already carrying
# this name at the chosen location is deleted by the script first.
NEW_IMAGE_NAME = "VirtualClusterMaster-vcocdemo-v0.1".freeze
# Name of the network the build machine's only NIC is attached to.
WAN_NAME = "BonFIRE WAN".freeze
17 :    
# Options handed to Restfully::Session.new. Caching is switched off, so the
# state polling done later in the script is not answered from a cache.
# NOTE(review): :gateway and :keys look like the SSH hop and private key used
# for the later machine.ssh calls -- confirm against the Restfully BonFIRE
# addon. The gateway host is fixed to fr-inria whatever LOCATION is set to;
# verify that this is intended.
session_options = {
  :configuration_file => "~/.restfully/api.bonfire-project.eu",
  :cache => false,
  :gateway => "ssh.fr-inria.bonfire-project.eu",
  :keys => ["~/.ssh/id_rsa"]
}

session = Restfully::Session.new(session_options)

# Log at INFO by default; swap in the DEBUG line below for more detail.
session.logger.level = Logger::INFO
#session.logger.level = Logger::DEBUG
26 :    
# Build the virtual-cluster master image:
#   1. submit an experiment and start one "small" machine from IMAGE_NAME,
#   2. wait until the machine is RUNNING and reachable over SSH,
#   3. install packages and upload killproc.sh, sge_root.tar.gz and vc/*.py,
#   4. save the disk as NEW_IMAGE_NAME, shut the machine down and delete the
#      experiment.
# Any exception is logged and, after a 30 second grace period, the experiment
# is deleted.

# Shell command run on the machine before package installation: it pipes the
# ocfs2-tools answers into debconf-set-selections. The continuation lines are
# part of the string and must stay unindented so that the closing EOF ends the
# shell here-document.
ocfs_debconf = "cat << EOF | debconf-set-selections
ocfs2-tools ocfs2-tools/idle_timeout select 30000
ocfs2-tools ocfs2-tools/reconnect_delay select 2000
ocfs2-tools ocfs2-tools/init select true
ocfs2-tools ocfs2-tools/clustername select ocfs2
ocfs2-tools ocfs2-tools/heartbeat_threshold select 31
ocfs2-tools ocfs2-tools/keepalive_delay select 2000

ocfs2-tools ocfs2-tools/idle_timeout seen true
ocfs2-tools ocfs2-tools/reconnect_delay seen true
ocfs2-tools ocfs2-tools/init seen true
ocfs2-tools ocfs2-tools/clustername seen true
ocfs2-tools ocfs2-tools/heartbeat_threshold seen true
ocfs2-tools ocfs2-tools/keepalive_delay seen true
EOF"

# Shell commands that install the packages and edit /etc/rc.local so that
# killproc.sh and vc-main-init.py are listed in it.
# NOTE(review): inside this double-quoted Ruby string the sequences "\ " and
# "\p" lose their backslash, so sed receives "2 i sleep 5" style commands;
# confirm that the sed on the image accepts this one-line form of "i".
install_script = "apt-get update
apt-get install -y -q python-paramiko
apt-get install -y -q drbd8-utils ocfs2-tools nfs-kernel-server
apt-get autoclean
dpkg-reconfigure --frontend=noninteractive ocfs2-tools
apt-get install -y -q ocfs2-tools
echo 'source /etc/default/bonfire' >> /root/.bashrc
sed -i '2 i\ sleep 5' /etc/rc.local
sed -i '2 i\ /root/killproc.sh &' /etc/rc.local
sed -i '/^exit/ i\python -u /root/vc/vc-main-init.py /var/log/vc-main-init.log' /etc/rc.local
chmod 755 /etc/rc.local
chmod u+x /root/killproc.sh"

# Logs whatever a remote command or upload returned, skipping nil results.
log_output = lambda do |output|
  session.logger.info output unless output.nil?
end

# Kept outside the begin block so the rescue handler can delete the experiment.
experiment = nil

begin
  session.logger.info "Deploying experiment..."
  experiment = session.root.experiments.submit(
    :name => EXPERIMENT_NAME,
    :description => EXPERIMENT_DESCRIPTION + " - " + Time.now.to_s,
    # :status => "waiting",
    :walltime => EXPERIMENT_WALLTIME
  )

  # Check for nil before reading the name: an unknown LOCATION must produce
  # the explicit failure below, not a NoMethodError on nil.
  location = session.root.locations[LOCATION.to_sym]
  fail "Can't select the machine location" if location.nil?
  session.logger.info "Chosen location is: #{location['name']}"

  # Resolve the base image and the network before anything is deleted, so a
  # missing resource aborts the run while the previous image still exists.
  base_image = location.storages.find { |s| s['name'] == IMAGE_NAME }
  fail "Can't find the base image '#{IMAGE_NAME}'" if base_image.nil?
  wan = location.networks.find { |n| n['name'] == WAN_NAME }
  fail "Can't find the network '#{WAN_NAME}'" if wan.nil?

  session.logger.info "Deleting previous version"
  previous_image = location.storages.find { |s| s['name'] == NEW_IMAGE_NAME }
  previous_image.delete unless previous_image.nil?

  session.logger.info "Launching machine..."
  machine = experiment.computes.submit(
    :name => "machine-experiment#{experiment['id']}",
    :instance_type => "small",
    :disk => [{:storage => base_image}],
    :nic => [{:network => wan}],
    :location => location,
    :context => {}
  )
  hostname = "#{machine['name']}-#{machine['id']}"
  session.logger.info "Machine: #{hostname} #{machine['nic'][0]['ip']}"

  session.logger.info "Starting experiment..."
  experiment.update(:status => "running")

  # Disabled step: build an SSH key pair for the image.
  #session.logger.info "Building SSH keypair..."
  #ssh_priv = "/tmp/ssh-#{Random.rand(1000)}"
  #ssh_public = ssh_priv + ".pub"
  #`ssh-keygen -f #{ssh_priv} -t rsa -P ""`

  session.logger.info "Checking if machine is ready..."
  # reload refreshes the state on every pass; the FAILED check inside the
  # loop reads the state fetched by that reload.
  until machine.reload['state'] == 'RUNNING' && machine.ssh.accessible?
    fail "Machine has failed" if machine['state'] == 'FAILED'
    session.logger.info "Machine is not ready. Waiting..."
    sleep 20
  end

  session.logger.info "Machine is ready"
  machine.ssh do |ssh|
    session.logger.info "Preinstallation..."
    log_output.call(ssh.exec!(ocfs_debconf))
    log_output.call(ssh.scp.upload!('killproc.sh', '/root/'))

    session.logger.info "Installing software..."
    log_output.call(ssh.exec!(install_script))

    session.logger.info "Uploading OGS..."
    log_output.call(ssh.scp.upload!('sge_root.tar.gz', '/root/'))

    # Disabled step: upload the SSH key pair built above.
    #session.logger.info "Uploading SSH keys..."
    #output = ssh.exec!("mkdir -p /root/.ssh")
    #session.logger.info output unless output.nil?
    #output = ssh.scp.upload!(ssh_priv, '/root/.ssh/id_rsa')
    #session.logger.info output unless output.nil?
    #output = ssh.scp.upload!(ssh_public, '/root/.ssh/id_rsa.pub')
    #session.logger.info output unless output.nil?
    #output = ssh.exec!("cat /root/.ssh/id_rsa.pub >> /root/.ssh/authorized_keys")
    #session.logger.info output unless output.nil?

    session.logger.info "Uploading Virtual Cluster scripts..."
    log_output.call(ssh.exec!("mkdir -p /root/vc"))
    # The glob is relative to the directory the script is started from.
    Dir.glob("vc/*.py").each do |file|
      log_output.call(ssh.scp.upload!(file, '/root/vc/'))
    end
  end
  session.logger.warn "Image installation finished"

  session.logger.warn "Saving image and shutting down"
  machine.update(:disk => [{:save_as => {:name => NEW_IMAGE_NAME}}])
  machine.update(:state => 'SHUTDOWN')

  until machine.reload['state'] == 'DONE'
    # Without this check a machine that ends up FAILED would be polled forever.
    fail "Machine has failed while saving the image" if machine['state'] == 'FAILED'
    session.logger.info "Machine is #{machine['state']}."
    sleep 20
  end

  experiment.delete

  session.logger.info "Image built: #{NEW_IMAGE_NAME}"
  session.logger.warn "Experiment terminated!"

# Exception (not just StandardError) is rescued on purpose: this way CTRL-C
# during the run also reaches the cleanup below. A second CTRL-C during the
# 30 second sleep is not rescued here, so the experiment is left in place.
rescue Exception => e
  session.logger.error "#{e.class.name}: #{e.message}"
  session.logger.error e.backtrace.join("\n")
  session.logger.warn "Cleaning up in 30 seconds. Hit CTRL-C now to keep your VMs..."
  sleep 30
  experiment.delete unless experiment.nil?
end

root@forge.cesga.es
ViewVC Help
Powered by ViewVC 1.0.0  

Powered By FusionForge