X-Git-Url: http://xvm.mit.edu/gitweb/invirt/scripts/prod-migration.git/blobdiff_plain/b281a0601fda1a8793dcd793a168ffca7a1290dd..ee5b63f9fcb8dccb9ceb31cb96d5ca8aa30b1be0:/xvm-migrate-machine diff --git a/xvm-migrate-machine b/xvm-migrate-machine old mode 100644 new mode 100755 index 0403ff5..8d76225 --- a/xvm-migrate-machine +++ b/xvm-migrate-machine @@ -1,15 +1,17 @@ -#!/bin/python +#!/usr/bin/python # Migrates the machine passed as arguments from the dev cluster. # To be run on the prod cluster. -## The present version is NOT A REAL SCRIPT. -## Things may not even be tested. Copy and paste. -not_ready_yet_do_not_run_me - from invirt import remctl as r from lib import database import subprocess import sys +import time +import os + +sys.stdout = os.fdopen(sys.stdout.fileno(), 'w', 0) + +kinit = dict(principal='host/aperture-science.mit.edu', keytab='/etc/krb5.keytab') dev_db_uri = 'postgres://sipb-xen@sipb-xen-dev.mit.edu/sipb_xen' database.connect(dev_db_uri) @@ -27,12 +29,33 @@ def take_data(machine_name): machine.acl = [] dev_sess.update(machine) + print 'VM Info:' + print ' name: %s' % machine.name + print ' description: %s' % machine.description + print ' cpus: %s' % machine.cpus + print ' memory: %s' % machine.memory + print ' owner: %s' % machine.owner + print ' contact: %s' % machine.contact + print ' administrator: %s' % machine.administrator + print ' uuid: %s' % machine.uuid + print ' type: %s' % machine.type.type_id + print ' autorestart: %s' % machine.autorestart + print ' adminable: %s' % machine.adminable + print ' Disks:' + for disk in machine.disks: + print ' - %s (%s)' % (disk.guest_device_name, disk.size) + print ' NICs:' + for nic in machine.nics: + print ' - %s, %s, %s' % (nic.mac_addr, nic.ip, nic.hostname) + print '===============================================' + print + disks = machine.disks nics = machine.nics for r in disks + nics + [machine]: dev_sess.delete(r) - dev_sess.commit() + dev_sess.flush() for r in disks + nics + [machine]: dev_sess.expunge(r) @@ -41,43 +64,87 @@ def take_data(machine_name): return machine ## add to prod db -def restore_data(machine): +def restore_data(machine, session): # The machine's type is still the one attached to the dev database; # get the right one - machine.type = prod_sess.query(database.Type).filter_by(type_id=machine.type.type_id).one() - prod_sess.begin() - prod_sess.save(machine) - prod_sess.commit() + machine.type = session.query(database.Type).filter_by(type_id=machine.type.type_id).one() + session.begin() + session.save(machine) + session.commit() def migrate_vm(machine_name): # Power off the VM on dev # # This has to be done first, because once the machine is deleted # from the database, we can't remctl for it anymore - out, err = r.remctl('xvm-remote.mit.edu', 'control', machine_name, 'destroy', err=True) + out, err = r.remctl('xvm-remote.mit.edu', 'control', machine_name, 'destroy', err=True, **kinit) print out machine = take_data(machine_name) + subprocess.call(['zwrite', '-d', '-c', 'xvm-auto', '-i', 'migration', '-s', 'XVM Migration Script', '-m', + 'Migrating %s, disk size %0.2fG...' % (machine.name, sum(disk.size for disk in machine.disks) / 1024.0)]) + success = True ## copy disk image... copy, copy... for disk in machine.disks: lvname='d_%s_%s' % (machine.name, disk.guest_device_name) - subprocess.check_call(['lvcreate', '-L%sM' % str(disk.size), '-n', lvname, 'xenvg']) + if 0 != subprocess.call(['lvcreate', '-L%sM' % str(disk.size), '-n', lvname, 'xenvg']): + success = False + break - ssh = subprocess.Popen(['ssh', '-o', 'GSSAPIDelegateCredentials=no', - 'torchwood-institute.mit.edu', + ssh = subprocess.Popen(['rsh', + '10.6.0.165', 'dd', 'if=/dev/xenvg/%s' % lvname, 'bs=1M'], stdout=subprocess.PIPE) dd = subprocess.Popen(['dd', 'of=/dev/xenvg/%s' % lvname, 'bs=1M'], stdin=ssh.stdout) - dd.wait() + if 0 != dd.wait(): + success = False + break + if 0 != ssh.wait(): + success = False + break - restore_data(machine) + if not success: + dev_sess.rollback() + + print '===============================================' + print 'ERROR: VM %s failed to migrate' % machine.name + print '===============================================' + else: + restore_data(machine, prod_sess) + dev_sess.commit() + + return success if __name__ == '__main__': - for vm in sys.argv[1:]: + while True: + r.checkKinit(**kinit) + p = subprocess.Popen(['curl', '-s', '-k', '--negotiate', '-u', ':', 'https://xvm.mit.edu:442/offlist'], stdout=subprocess.PIPE) + if 0 != p.wait(): + subprocess.call(['zwrite', '-d', '-c', 'xvm', '-i', 'migration', '-s', 'XVM Migration Script', '-m', + 'Failed to get list of remaining VMs. Will try again in 15 seconds']) + time.sleep(15) + continue + + next_line = p.stdout.read().split('\n')[0] + if next_line == '': + subprocess.call(['zwrite', '-d', '-c', 'xvm', '-i', 'migration', '-s', 'XVM Migration Script', '-m', + 'XVM migration complete']) + break + + next, uptime = next_line.split('\t')[:2] + print '===============================================' - print 'Migrating %s' % vm + print 'Migrating %s' % next print '===============================================' - migrate_vm(vm.strip()) + if not migrate_vm(next): + subprocess.call(['zwrite', '-d', '-c', 'xvm', '-i', 'migration', '-s', 'XVM Migration Script', '-m', + 'Error in migrating %s' % next]) + sys.exit(1) + if uptime.strip() != '': + r.remctl('xvm-remote-dev.mit.edu', 'control', next, 'create', **kinit) + + subprocess.call(['zwrite', '-d', '-c', 'xvm-auto', '-i', 'migration', '-s', 'XVM Migration Script', '-m', + 'done'])