-
Notifications
You must be signed in to change notification settings - Fork 23
/
Copy pathrhev-hypervisor-autoupgrade.py
executable file
·326 lines (271 loc) · 12.7 KB
/
rhev-hypervisor-autoupgrade.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
#!/usr/bin/env python
#
# Author: Pablo Iranzo Gomez ([email protected])
#
# Description: Script for automatic RHEV-H hypervisor upgrade when there's a new
# version available on RHEV-M
#
# Requires rhevm-sdk to work
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, version 2 of the License.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
# Goals:
# - Automatically put RHEV-H hosts on maintenace for upgrade
# - Once on maintenance, deploy updated install image
# - After timeout, set host to active (actual bug in RHEV)
# tags behaviour
# elas_manage: manage this host by using the elastic management script (EMS)
# elas_upgrade: this host status has been set by automatic upgrade, so it can be installed/activated
# elas_maint: this host status has been set by rhev-elastic, so it can be installed/activated
import glob
import optparse
from random import choice
from rhev_functions import *
description = """
RHEV-hypervisor-autoupgrade is a script for automatically upgrade RHEV-H hosts under RHEV
It's goal is to try upgrading each host one after one, starting with the
ones with no VM's running on them.
"""
# Option parsing
p = optparse.OptionParser("rhev-hypevisor-autoupgrade.py [arguments]", description=description)
p.add_option("-u", "--user", dest="username", help="Username to connect to RHEVM API", metavar="admin@internal",
default="admin@internal")
p.add_option("-w", "--password", dest="password", help="Password to use with username", metavar="admin",
default="admin")
p.add_option("-k", action="store_true", dest="keyring", help="use python keyring for user/password", metavar="keyring",
default=False)
p.add_option("-W", action="store_true", dest="askpassword", help="Ask for password", metavar="admin", default=False)
p.add_option("-s", "--server", dest="server", help="RHEV-M server address/hostname to contact", metavar="127.0.0.1",
default="127.0.0.1")
p.add_option("-p", "--port", dest="port", help="API port to contact", metavar="443", default="443")
p.add_option('-v', "--verbosity", dest="verbosity", help="Show messages while running", metavar='[0-n]', default=0,
type='int')
p.add_option('-c', "--cluster", dest="cluster", help="Select cluster name to process", metavar='cluster', default=None)
p.add_option('-t', "--tagall", dest="tagall", help="Tag all hosts with elas_manage", metavar='0/1', default=0,
type='int')
p.add_option('-r', "--release", dest="release", help="Select release to deploy. Like 20130528.0.el6_4",
metavar='release', default="latest")
p.add_option('-d', "--delay", dest="delay", help="Set delay to way until activation after install is sent",
metavar='delay', default=900)
(options, args) = p.parse_args()
options.username, options.password = getuserpass(options)
baseurl = "https://%s:%s/ovirt-engine/api" % (options.server, options.port)
api = apilogin(url=baseurl, username=options.username, password=options.password)
# FUNCTIONS
def upgrade_host(target):
"""Deactivates hosts putting it on maintenance and associating required tags before upgrading
@param target: Host ID to upgrade
"""
host = api.hosts.get(id=target)
# Shutting down one host at a time...
if options.verbosity > 0:
print("Preparing target %s" % target)
# Add elas_maint TAG to host
host.tags.add(params.Tag(name="elas_upgrade"))
# Set host on maintenance
try:
host.deactivate()
except:
print("Error deactivating host %s" % api.hosts.get(id=target).name)
# Should wait until host state is 'maintenance'
i = 0
while i < 30:
if api.hosts.get(id=target).status.state == "maintenance":
if options.verbosity > 6:
print("Host is now on maintenance...")
i = 30
else:
if options.verbosity > 6:
print("Host still not on maintenance... sleeping")
time.sleep(2)
i += 1
if api.hosts.get(id=target).status.state == "maintenance":
# Execute upgrade for host with latest available version
image = "%s" % get_max_version()
try:
print("Trying to upgrade %s" % host.name)
host.install(params.Action(image=image))
except:
print("Host failed to install")
i = 0
while i < options.delay:
if api.hosts.get(id=target).status.state == "up":
if options.verbosity > 6:
print("Host is now up again...")
i = options.delay
else:
if options.verbosity > 6:
print("Host still not up... sleeping")
time.sleep(1)
i += 1
# if host is listed as installation failed, enable it as this is a pending BZ, and probably host is OK
if api.hosts.get(id=target).status.state == "install_failed":
api.hosts.get(id=target).activate()
# Remove tags no longer used
api.hosts.get(id=host.id).tags.get(name="elas_upgrade").delete()
api.hosts.get(id=host.id).tags.get(name="elas_maint").delete()
return
def get_max_version():
"""Get maximum hipervisor version, checking first on disk, and if not, on higher version from hypervisors"""
version = None
# Check all available hypervisor versions on disk (only on RHEV-M host)
for fichero in glob.glob("/usr/share/rhev-hypervisor/rhevh-6.*.iso"):
fileversion = fichero.split("/")[-1]
if fileversion > version:
version = fileversion
# Couldn't get version from disk, get it from the API
if not version:
maxversion = None
release = None
version = None
# FIXME only query rhev-h hosts
for host in paginate(api.hosts, oquery=""):
if host.os.version.full_version > maxversion:
maxversion = host.os.version.full_version
version = maxversion.split("-")[1].strip() # 20130528.0.el6_4
release = maxversion.split("-")[0].strip() # 6.4
try:
version = "rhevh-%s-%s.iso" % (release, version)
except:
version = None
return version
def process_cluster(clusid):
"""Processes cluster
@param clusid: Cluster ID to process
"""
if options.verbosity > 1:
print("\nProcessing cluster with id %s and name %s" % (clusid, api.clusters.get(id=clusid).name))
print("#############################################################################")
# Emptying maintanable and activable hosts list
upgradable = []
upgradable_prio = []
hosts_total = 0
hosts_up = 0
hosts_maintenance = 0
hosts_other = 0
hosts_without_vms = 0
hosts_with_vms = 0
version = get_max_version()
# FIXME: only RHEV-H hosts
query = "cluster = %s" % api.clusters.get(id=clusid).name
for host in paginate(api.hosts, query):
if host.tags.get(name="elas_manage"):
vms = api.hosts.get(id=host.id).summary.total
inc = 1
if host.cluster.id != clusid:
# Not process this host if doesn't pertain to cluster
if options.verbosity >= 3:
print("Host %s doesn't pertain to cluster %s, discarding" % (host.id, clusid))
else:
# Preparing list of valid hosts
hostver = "rhevh-%s-%s.iso" % (
host.os.version.full_version.split("-")[0].strip(),
host.os.version.full_version.split("-")[1].strip())
if version > hostver:
status = "accepted upgrading from %s to %s" % (hostver, version)
if host.status.state == "up":
upgradable.append(host.id)
# Prioritize non-SPM host and hosts without VM's
if api.hosts.get(id=host.id).storage_manager.valueOf_ != "true" or vms == 0:
upgradable_prio.append(host.id)
if host.status.state == "maintenance":
# Add to prio list hosts set to maintenance by rhev-elastic
if host.tags.get(name="elas_maint") or host.tags.get(name="elas_upgrade"):
upgradable.append(host.id)
upgradable_prio.append(host.id)
else:
status = "No elas_maint tag discarded"
inc = 0
else:
# Host already upgraded
status = "already done"
if options.verbosity >= 2:
print("Host (%s) %s with %s vms detected with status %s and spm status %s (%s for operation)" % (
host.name, host.id, vms, api.hosts.get(id=host.id).status.state,
api.hosts.get(id=host.id).storage_manager.valueOf_, status))
# Counters
hosts_total += inc
if host.status.state == "up":
hosts_up += inc
if vms == 0:
hosts_without_vms += inc
else:
hosts_with_vms += inc
else:
if host.status.state == "maintenance":
hosts_maintenance += inc
else:
hosts_other += inc
if options.verbosity >= 1:
if hosts_total > 0:
print("\nMax version: %s" % version)
print("\nHost list to manage:")
print("\tCandidates to upgrade: %s" % upgradable)
print("\tPriority to upgrade: %s" % upgradable_prio)
print("\nHosts TOTAL (Total/Up/Maintenance/other): %s/%s/%s/%s" % (
hosts_total, hosts_up, hosts_maintenance, hosts_other))
print("Hosts UP (with VM's/ without): %s/%s" % (hosts_with_vms, hosts_without_vms))
else:
print("\nNo hosts in cluster %s, skipping" % clusid)
# CODE TO CHECK HOST COUNT, Host still active, etc
# Useful vars: hosts_total,hosts_up,hosts_maintenance,hosts_other,hosts_with_vms,hosts_without_vms
# Useful arrays: enablable / upgradable
# UPGRADE SECTION
if len(upgradable) != 0:
if len(upgradable_prio) != 0:
target = choice(upgradable_prio)
else:
target = choice(upgradable)
if options.verbosity >= 2:
print("\nPutting host %s into upgrade because there are more than 1 host without vm's\n" % target)
upgrade_host(target)
return 0
else:
print("\nNo host to put into maintenance for upgrade\n")
return 1
# MAIN PROGRAM
if __name__ == "__main__":
# Check if we have defined needed tags and create them if missing
check_tags(api, options)
# TAGALL?
# Add elas_upgrade TAG to every single host to automate the management
if options.tagall == 1:
if options.verbosity >= 1:
print("Tagging all hosts with elas_manage")
for host in paginate(api.hosts):
try:
host.tags.add(params.Tag(name="elas_manage"))
except:
print("Error adding elas_manage tag to host %s" % host.name)
# Sanity checks
# Check hosts with elas_upgrade tag and status active
query = "status = up"
for host in paginate(api.hosts, query):
if host.status.state == "up":
if api.hosts.get(id=host.id).tags.get(name="elas_upgrade"):
if options.verbosity >= 1:
print("Host %s is tagged as elas_upgrade and it's active, removing tag..." % host.id)
api.hosts.get(id=host.id).tags.get(name="elas_upgrade").delete()
# Check hosts with elas_maint tag and status active
query = "status = up"
for host in paginate(api.hosts, query):
if host.status.state == "up":
if api.hosts.get(id=host.id).tags.get(name="elas_maint"):
if options.verbosity >= 1:
print("Host %s is tagged as elas_maint and it's active, removing tag..." % host.id)
api.hosts.get(id=host.id).tags.get(name="elas_maint").delete()
if not check_version(api, major=3, minor=2):
print("This functionality requires api >= 3.2")
sys.exit(1)
if not options.cluster:
# Processing each cluster of our RHEVM
for cluster in api.clusters.list():
process_cluster(cluster.id)
else:
process_cluster(api.clusters.get(name=options.cluster).id)