| [1629] | 1 | #!/usr/bin/python |
|---|
| [1626] | 2 | # Migrates VMs from the dev cluster one at a time, taking the next machine to move from the offlist URL polled below. |
|---|
| [1429] | 3 | # To be run on the prod cluster. |
|---|
| 4 | |
|---|
| [1626] | 5 | from invirt import remctl as r |
|---|
| [1611] | 6 | from lib import database |
|---|
| [1626] | 7 | import subprocess |
|---|
| 8 | import sys |
|---|
| [1662] | 9 | import time |
|---|
| 10 | import os |
|---|
| [1429] | 11 | |
|---|
# Reopen stdout with a buffer size of 0 (unbuffered) so output is not held back.
sys.stdout = os.fdopen(sys.stdout.fileno(), 'w', 0)

# Principal and keytab passed as keyword arguments to the remctl helpers.
kinit = {
    'principal': 'host/aperture-science.mit.edu',
    'keytab': '/etc/krb5.keytab',
}

# Connect to the dev database explicitly and hold on to that session ...
dev_db_uri = 'postgres://sipb-xen@sipb-xen-dev.mit.edu/sipb_xen'
database.connect(dev_db_uri)
dev_sess = database.session

# ... then connect again with the default settings; the session that
# results is the one used as the prod session.
database.connect()
prod_sess = database.session
|---|
| [1437] | 22 | |
|---|
| [1626] | 23 | ## dump from dev db |
|---|
def take_data(machine_name):
    """Pull a machine's records out of the dev database and return it.

    Begins a transaction on ``dev_sess``, looks the machine up by name,
    empties its ACL, prints a summary of the VM, then deletes the
    machine, its disks and its NICs and flushes the session.  The
    transaction is left open: nothing here commits or rolls back.

    Before returning, every deleted object is expunged from the dev
    session and stripped of its ``_instance_key`` attribute.

    Returns the machine object.
    """
    dev_sess.begin()
    machine = dev_sess.query(database.Machine).filter_by(name=machine_name).one()

    # Clean out the ACL just so we don't have to think about it
    machine.acl = []
    dev_sess.update(machine)

    # print(...) with a single argument prints the same text as the
    # Python 2 print statement.
    print('VM Info:')
    # Fields are read and printed one at a time, in this order.
    for field in ('name', 'description', 'cpus', 'memory', 'owner',
                  'contact', 'administrator', 'uuid'):
        print(' %s: %s' % (field, getattr(machine, field)))
    print(' type: %s' % machine.type.type_id)
    for field in ('autorestart', 'adminable'):
        print(' %s: %s' % (field, getattr(machine, field)))

    print(' Disks:')
    for disk in machine.disks:
        print(' - %s (%s)' % (disk.guest_device_name, disk.size))
    print(' NICs:')
    for nic in machine.nics:
        print(' - %s, %s, %s' % (nic.mac_addr, nic.ip, nic.hostname))
    print('===============================================')
    print('')

    disks = machine.disks
    nics = machine.nics

    # Delete the children and the machine itself, then push the deletes
    # to the database without ending the transaction.
    for record in disks + nics + [machine]:
        dev_sess.delete(record)

    dev_sess.flush()

    # Detach the same objects from the dev session.
    for record in disks + nics + [machine]:
        dev_sess.expunge(record)
        del record._instance_key

    return machine
|---|
| [1429] | 65 | |
|---|
| [1626] | 66 | ## add to prod db |
|---|
def restore_data(machine, session):
    """Save ``machine`` through ``session`` inside its own transaction.

    ``machine.type`` is first replaced by the ``database.Type`` row that
    ``session`` returns for the same ``type_id``; the machine is then
    saved and the transaction committed.
    """
    # The machine's type is still the one attached to the dev database;
    # get the right one
    wanted_type_id = machine.type.type_id
    type_query = session.query(database.Type).filter_by(type_id=wanted_type_id)
    machine.type = type_query.one()

    session.begin()
    session.save(machine)
    session.commit()
|---|
| [1626] | 74 | |
|---|
def _copy_disk(lvname, size):
    """Create logical volume ``lvname`` in xenvg and fill it over rsh.

    ``size`` is handed to lvcreate as ``-L<size>M``.  The volume of the
    same name is read with ``dd`` on 10.6.0.165 and piped into a local
    ``dd`` that writes the new volume.

    Returns True only if lvcreate and both dd processes exit with 0.
    """
    if 0 != subprocess.call(['lvcreate', '-L%sM' % str(size), '-n', lvname, 'xenvg']):
        return False

    ssh = subprocess.Popen(['rsh',
                            '10.6.0.165',
                            'dd', 'if=/dev/xenvg/%s' % lvname, 'bs=1M'],
                           stdout=subprocess.PIPE)
    dd = subprocess.Popen(['dd', 'of=/dev/xenvg/%s' % lvname, 'bs=1M'],
                          stdin=ssh.stdout)
    # Drop our copy of the pipe's read end: with it open, rsh would never
    # see SIGPIPE if the local dd exited early.
    ssh.stdout.close()

    # Always reap both children, even when the first one failed.
    dd_status = dd.wait()
    ssh_status = ssh.wait()
    return dd_status == 0 and ssh_status == 0


def migrate_vm(machine_name):
    """Migrate one VM: power it off, move its data, copy its disks.

    The machine's rows are removed from the dev database by
    ``take_data`` (transaction left open), each disk is copied into a
    new logical volume, and then either

    * every copy succeeded: the machine is saved to ``prod_sess`` and the
      dev transaction is committed, or
    * something failed: the dev transaction is rolled back and an error
      banner is printed.  Copying stops at the first failing disk.

    Returns True on success, False otherwise.
    """
    # Power off the VM on dev
    #
    # This has to be done first, because once the machine is deleted
    # from the database, we can't remctl for it anymore
    out, _err = r.remctl('xvm-remote.mit.edu', 'control', machine_name, 'destroy', err=True, **kinit)
    print(out)

    machine = take_data(machine_name)
    total_size = sum(disk.size for disk in machine.disks)
    subprocess.call(['zwrite', '-d', '-c', 'xvm-auto', '-i', 'migration', '-s', 'XVM Migration Script', '-m',
                     'Migrating %s, disk size %0.2fG...' % (machine.name, total_size / 1024.0)])

    success = True
    ## copy disk image... copy, copy...
    for disk in machine.disks:
        lvname = 'd_%s_%s' % (machine.name, disk.guest_device_name)
        if not _copy_disk(lvname, disk.size):
            success = False
            break

    if not success:
        dev_sess.rollback()

        print('===============================================')
        print('ERROR: VM %s failed to migrate' % machine.name)
        print('===============================================')
    else:
        restore_data(machine, prod_sess)
        dev_sess.commit()

    return success
|---|
| [1429] | 120 | |
|---|
if __name__ == '__main__':
    # Common prefix of the status messages sent to the 'xvm' zephyr class.
    zwrite_xvm = ['zwrite', '-d', '-c', 'xvm', '-i', 'migration', '-s', 'XVM Migration Script', '-m']

    # Each pass fetches the list of remaining VMs and migrates the first
    # one on it; the loop ends when the list comes back empty.
    while True:
        r.checkKinit(**kinit)
        p = subprocess.Popen(['curl', '-s', '-k', '--negotiate', '-u', ':', 'https://xvm.mit.edu:442/offlist'], stdout=subprocess.PIPE)
        # communicate() drains the pipe while waiting; calling wait()
        # before reading can deadlock once the output fills the pipe buffer.
        listing, _ = p.communicate()
        if 0 != p.returncode:
            subprocess.call(zwrite_xvm + ['Failed to get list of remaining VMs. Will try again in 15 seconds'])
            time.sleep(15)
            continue

        next_line = listing.split('\n')[0]
        if next_line == '':
            subprocess.call(zwrite_xvm + ['XVM migration complete'])
            break

        # Only the first two tab-separated fields are used.  A line
        # without a tab raises ValueError here, which stops the script
        # before any VM is touched.
        vm_name, uptime = next_line.split('\t')[:2]

        print('===============================================')
        print('Migrating %s' % vm_name)
        print('===============================================')
        if not migrate_vm(vm_name):
            subprocess.call(zwrite_xvm + ['Error in migrating %s' % vm_name])
            sys.exit(1)
        # NOTE(review): a non-empty uptime field presumably means the VM
        # was running before the move, so it is started again - confirm.
        if uptime.strip() != '':
            r.remctl('xvm-remote-dev.mit.edu', 'control', vm_name, 'create', **kinit)

        # NOTE(review): assumed to run once per migrated VM, pairing with
        # the 'Migrating ...' notice migrate_vm sends to xvm-auto - confirm.
        subprocess.call(['zwrite', '-d', '-c', 'xvm-auto', '-i', 'migration', '-s', 'XVM Migration Script', '-m',
                         'done'])
|---|