Log In | Get Help   
Home My Page Projects Code Snippets Project Openings BonFIRE VCOC Demonstration Kit
Summary Activity SCM Files Wiki
[bonfiredemokit] Annotation of /virt-cluster/build-master.rb
[bonfiredemokit] / virt-cluster / build-master.rb Repository:
ViewVC logotype

Annotation of /virt-cluster/build-master.rb

Parent Directory | Revision Log


Revision 8 - (view) (download)

# Builds the "master" disk image for the BonFIRE virtual cluster.
#
# Steps performed:
#   1. Submit a short-lived experiment and start one VM from IMAGE_NAME.
#   2. Wait until the VM is RUNNING and reachable over SSH.
#   3. Preseed debconf, install the cluster packages and upload the helper
#      files (killproc.sh, sge_root.tar.gz, vc/*.py).
#   4. Save the VM disk as NEW_IMAGE_NAME, shut the VM down and delete the
#      experiment.
#
# The uploaded files are resolved relative to the current working directory.

require 'rubygems'
require 'restfully'
require 'restfully/addons/bonfire'

## Editable parameters
#LOCATION = "de-hlrs"
LOCATION = "fr-inria"
#LOCATION = "uk-epcc"
##

EXPERIMENT_NAME = "Build image master"
EXPERIMENT_DESCRIPTION = "Build image master for virtual cluster"
EXPERIMENT_WALLTIME = 3600
IMAGE_NAME = "BonFIRE Debian Squeeze 2G v3"
WAN_NAME = "BonFIRE WAN"

session = Restfully::Session.new(
  :configuration_file => "~/.restfully/api.bonfire-project.eu",
  :cache => false,
  # NOTE(review): the gateway is fixed to fr-inria even when LOCATION is
  # changed above -- confirm this is intended.
  :gateway => "ssh.fr-inria.bonfire-project.eu",
  :keys => ["~/.ssh/id_rsa"]
)
session.logger.level = Logger::INFO
#session.logger.level = Logger::DEBUG

# Name under which the finished disk is saved; includes the API user name.
NEW_IMAGE_NAME = "VirtualClusterMaster-#{session.config[:username]}-v0.1"

# Shell snippet run on the VM to preseed the ocfs2-tools debconf answers.
# The body is kept at column 0 on purpose: the shell here-document terminator
# (EOF) must start its line.
ocfs_debconf = "cat << EOF | debconf-set-selections
ocfs2-tools ocfs2-tools/idle_timeout select 30000
ocfs2-tools ocfs2-tools/reconnect_delay select 2000
ocfs2-tools ocfs2-tools/init select true
ocfs2-tools ocfs2-tools/clustername select ocfs2
ocfs2-tools ocfs2-tools/heartbeat_threshold select 31
ocfs2-tools ocfs2-tools/keepalive_delay select 2000

ocfs2-tools ocfs2-tools/idle_timeout seen true
ocfs2-tools ocfs2-tools/reconnect_delay seen true
ocfs2-tools ocfs2-tools/init seen true
ocfs2-tools ocfs2-tools/clustername seen true
ocfs2-tools ocfs2-tools/heartbeat_threshold seen true
ocfs2-tools ocfs2-tools/keepalive_delay seen true
EOF"

# Shell commands run on the VM to install the packages and hook the cluster
# start-up scripts into /etc/rc.local. Reproduced verbatim: the backslashes are
# processed by Ruby's double-quoted string rules before the shell sees them.
install_commands = "apt-get update
apt-get install -y -q python-paramiko
apt-get install -y -q drbd8-utils ocfs2-tools nfs-kernel-server
apt-get autoclean
dpkg-reconfigure --frontend=noninteractive ocfs2-tools
apt-get install -y -q ocfs2-tools
echo 'source /etc/default/bonfire' >> /root/.bashrc
sed -i '2 i\ sleep 5' /etc/rc.local
sed -i '2 i\ /root/killproc.sh &' /etc/rc.local
sed -i '/^exit/ i\python -u /root/vc/vc-main-init.py /var/log/vc-main-init.log' /etc/rc.local
chmod 755 /etc/rc.local
chmod u+x /root/killproc.sh"

# Logs the output of a remote command or upload, if it produced any.
log_output = lambda do |output|
  session.logger.info output unless output.nil?
end

experiment = nil

begin
  session.logger.info "Deploying experiment..."
  experiment = session.root.experiments.submit(
    :name => EXPERIMENT_NAME,
    :description => EXPERIMENT_DESCRIPTION + " - " + Time.now.to_s,
    # :status => "waiting",
    :walltime => EXPERIMENT_WALLTIME
  )

  location = session.root.locations[:"#{LOCATION}"]
  # Check for nil BEFORE reading location['name']; otherwise an unknown
  # LOCATION surfaces as a NoMethodError instead of this message.
  fail "Can't select the machine location" if location.nil?
  session.logger.info "Chosen location is: #{location['name']}"

  # Resolve the base image and network up front, so that a missing resource
  # aborts the run before the previous image is deleted and before a nil is
  # sent in the compute request.
  base_image = location.storages.find { |s| s['name'] == IMAGE_NAME }
  fail "Can't find the base image: #{IMAGE_NAME}" if base_image.nil?
  wan = location.networks.find { |n| n['name'] == WAN_NAME }
  fail "Can't find the network: #{WAN_NAME}" if wan.nil?

  session.logger.info "Deleting previous version"
  previous_image = location.storages.find { |s| s["name"] == NEW_IMAGE_NAME }
  previous_image.delete unless previous_image.nil?

  session.logger.info "Launching machine..."
  machine = experiment.computes.submit(
    :name => "machine-experiment#{experiment['id']}",
    :instance_type => "small",
    :disk => [{:storage => base_image}],
    :nic => [{:network => wan}],
    :location => location,
    :context => {}
  )
  hostname = "#{machine['name']}-#{machine['id']}"
  session.logger.info "Machine: #{hostname} #{machine['nic'][0]['ip']}"

  session.logger.info "Starting experiment..."
  experiment.update(:status => "running")

  # Build SSH keys (disabled)
  #session.logger.info "Building SSH keypair..."
  #ssh_priv = "/tmp/ssh-#{Random.rand(1000)}"
  #ssh_public = ssh_priv + ".pub"
  #`ssh-keygen -f #{ssh_priv} -t rsa -P ""`

  session.logger.info "Checking if machine is ready..."
  until machine.reload['state'] == 'RUNNING' && machine.ssh.accessible?
    fail "Machine has failed" if machine['state'] == 'FAILED'
    session.logger.info "Machine is not ready. Waiting..."
    sleep 20
  end

  session.logger.info "Machine is ready"
  machine.ssh do |ssh|
    session.logger.info "Preinstallation..."
    log_output.call(ssh.exec!(ocfs_debconf))
    log_output.call(ssh.scp.upload!('killproc.sh', '/root/'))

    session.logger.info "Installing software..."
    log_output.call(ssh.exec!(install_commands))

    session.logger.info "Uploading OGS..."
    log_output.call(ssh.scp.upload!('sge_root.tar.gz', '/root/'))

    # Upload SSH keys (disabled; goes with the keypair generation above)
    #session.logger.info "Uploading SSH keys..."
    #output = ssh.exec!("mkdir -p /root/.ssh")
    #session.logger.info output unless output.nil?
    #output = ssh.scp.upload!(ssh_priv, '/root/.ssh/id_rsa')
    #session.logger.info output unless output.nil?
    #output = ssh.scp.upload!(ssh_public, '/root/.ssh/id_rsa.pub')
    #session.logger.info output unless output.nil?
    #output = ssh.exec!("cat /root/.ssh/id_rsa.pub >> /root/.ssh/authorized_keys")
    #session.logger.info output unless output.nil?

    session.logger.info "Uploading Virtual Cluster scripts..."
    log_output.call(ssh.exec!("mkdir -p /root/vc"))
    Dir.glob("vc/*.py").each do |file|
      log_output.call(ssh.scp.upload!(file, '/root/vc/'))
    end
  end
  session.logger.warn "Image installation finished"

  session.logger.warn "Saving image and shutting down"
  machine.update(:disk => [{:save_as => {:name => NEW_IMAGE_NAME}}])
  machine.update(:state => 'SHUTDOWN')

  until machine.reload['state'] == 'DONE'
    # Same failure check as the readiness loop: without it a VM that ends up
    # FAILED would keep this loop spinning forever.
    fail "Machine has failed" if machine['state'] == 'FAILED'
    session.logger.info "Machine is #{machine['state']}."
    sleep 20
  end

  experiment.delete

  session.logger.info "Image built: #{NEW_IMAGE_NAME}"
  session.logger.warn "Experiment terminated!"

# Exception (not just StandardError) is rescued on purpose: a CTRL-C during the
# run must also reach the cleanup below. A second CTRL-C during the 30 second
# grace period raises out of this handler and skips the delete, which is how
# the user keeps the VMs for inspection.
rescue Exception => e
  session.logger.error "#{e.class.name}: #{e.message}"
  session.logger.error e.backtrace.join("\n")
  session.logger.warn "Cleaning up in 30 seconds. Hit CTRL-C now to keep your VMs..."
  sleep 30
  experiment.delete unless experiment.nil?
end

root@forge.cesga.es
ViewVC Help
Powered by ViewVC 1.0.0  

Powered By FusionForge