operations.py 62.9 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17
# Copyright 2014 Budapest University of Technology and Economics (BME IK)
#
# This file is part of CIRCLE Cloud.
#
# CIRCLE is free software: you can redistribute it and/or modify it under
# the terms of the GNU General Public License as published by the Free
# Software Foundation, either version 3 of the License, or (at your option)
# any later version.
#
# CIRCLE is distributed in the hope that it will be useful, but WITHOUT ANY
# WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
# FOR A PARTICULAR PURPOSE.  See the GNU General Public License for more
# details.
#
# You should have received a copy of the GNU General Public License along
# with CIRCLE.  If not, see <http://www.gnu.org/licenses/>.

18
from __future__ import absolute_import, unicode_literals
Bach Dániel committed
19 20
from base64 import encodestring
from hashlib import md5
Dudás Ádám committed
21
from logging import getLogger
Bach Dániel committed
22
import os
23
from re import search
Őry Máté committed
24
from string import ascii_lowercase
Bach Dániel committed
25 26 27
from StringIO import StringIO
from tarfile import TarFile, TarInfo
import time
Kálmán Viktor committed
28
from urlparse import urlsplit
Dudás Ádám committed
29

30
from django.core.exceptions import PermissionDenied, SuspiciousOperation
31
from django.core.urlresolvers import reverse
Dudás Ádám committed
32
from django.utils import timezone
33
from django.utils.translation import ugettext_lazy as _, ugettext_noop
Kálmán Viktor committed
34
from django.conf import settings
Bach Dániel committed
35
from django.db.models import Q
Dudás Ádám committed
36

37 38
from sizefield.utils import filesizeformat

39 40
from celery.contrib.abortable import AbortableAsyncResult
from celery.exceptions import TimeLimitExceeded, TimeoutError
41

42 43 44
from common.models import (
    create_readable, humanize_exception, HumanReadableException
)
45
from common.operations import Operation, register_operation, SubOperationMixin
Bach Dániel committed
46
from manager.scheduler import SchedulerError
47 48 49
from .tasks.local_tasks import (
    abortable_async_instance_operation, abortable_async_node_operation,
)
50
from .models import (
51
    Instance, InstanceActivity, InstanceTemplate, Interface, Node,
52
    NodeActivity, pwgen
53
)
Bach Dániel committed
54
from .tasks import agent_tasks, vm_tasks
Dudás Ádám committed
55

Kálmán Viktor committed
56
from dashboard.store_api import Store, NoStoreException
Bach Dániel committed
57 58
from firewall.models import Host
from monitor.client import Client
59
from storage.tasks import storage_tasks
Kálmán Viktor committed
60

Dudás Ádám committed
61
logger = getLogger(__name__)
62 63


64 65 66 67 68
class RemoteOperationMixin(object):
    """Mixin running an operation as a single blocking remote task.

    The host class has to supply ``task`` (an object with ``apply_async``),
    ``_get_remote_args(**kwargs)`` and ``_get_remote_queue()``.
    """

    # Passed as ``timeout`` when waiting for the remote result.
    remote_timeout = 30

    def _operation(self, **kwargs):
        """Submit ``self.task`` to the remote queue and return its result."""
        remote_args = self._get_remote_args(**kwargs)
        pending = self.task.apply_async(
            args=remote_args, queue=self._get_remote_queue())
        return pending.get(timeout=self.remote_timeout)

    def check_precond(self):
        """Run the inherited checks, then resolve the remote queue.

        The queue lookup result is discarded; the call is made only so that
        any error it raises surfaces during the precondition check.
        """
        super(RemoteOperationMixin, self).check_precond()
        self._get_remote_queue()


79 80 81 82 83 84 85
class AbortableRemoteOperationMixin(object):
    """Mixin that polls a remote task so that the user can abort the wait.

    Relies on the host class for ``task``, ``remote_timeout``,
    ``_get_remote_args(**kwargs)`` and ``_get_remote_queue()``.
    """

    @property
    def remote_step(self):
        """Length of one polling slice: a tenth of ``remote_timeout``."""
        return self.remote_timeout / 10

    def _operation(self, task, **kwargs):
        """Start the remote task and wait for it in ``remote_step`` slices.

        After each slice that times out, ``task`` (may be None) is asked
        whether it was aborted; if so the remote task is aborted as well and
        a human readable exception is raised.  When every slice is used up
        ``TimeLimitExceeded`` is raised.
        """
        # NOTE(review): the argument list is deliberately kept wrapped in a
        # one-element tuple, i.e. the remote task receives the list as its
        # single positional argument -- confirm against the task signature.
        args = (self._get_remote_args(**kwargs), )
        remote = self.task.apply_async(
            args=args, queue=self._get_remote_queue())

        for _attempt in xrange(0, self.remote_timeout, self.remote_step):
            try:
                return remote.get(timeout=self.remote_step)
            except TimeoutError as e:
                if task is None or not task.is_aborted():
                    continue  # nobody asked to stop: keep polling
                AbortableAsyncResult(remote.id).abort()
                raise humanize_exception(ugettext_noop(
                    "Operation aborted by user."), e)

        raise TimeLimitExceeded()
95 96


97
class InstanceOperation(Operation):
    """Base class of the operations bound to a single VM instance.

    Subclasses tune the behaviour through class attributes:

    * ``acl_level`` -- level the user must hold on the instance,
    * ``accept_states`` / ``deny_states`` -- optional allow / deny lists of
      instance statuses evaluated by :meth:`check_precond`,
    * ``resultant_state`` -- passed on to the activity that gets created,
    * ``concurrency_check`` -- passed on to ``InstanceActivity.create``.
    """
    acl_level = 'owner'
    async_operation = abortable_async_instance_operation
    host_cls = Instance
    concurrency_check = True
    accept_states = None
    deny_states = None
    resultant_state = None

    def __init__(self, instance):
        super(InstanceOperation, self).__init__(subject=instance)
        self.instance = instance

    def check_precond(self):
        """Verify that the instance is in a state allowing the operation.

        Raises ``InstanceDestroyedError`` for destroyed instances and
        ``WrongStateError`` when the status is missing from
        ``accept_states`` or present in ``deny_states``.
        """
        if self.instance.destroyed_at:
            raise self.instance.InstanceDestroyedError(self.instance)
        if self.accept_states:
            if self.instance.status not in self.accept_states:
                logger.debug("precond failed for %s: %s not in %s",
                             unicode(self.__class__),
                             unicode(self.instance.status),
                             unicode(self.accept_states))
                raise self.instance.WrongStateError(self.instance)
        if self.deny_states:
            if self.instance.status in self.deny_states:
                # Log the list that was actually violated (deny_states).
                logger.debug("precond failed for %s: %s in %s",
                             unicode(self.__class__),
                             unicode(self.instance.status),
                             unicode(self.deny_states))
                raise self.instance.WrongStateError(self.instance)

    def check_auth(self, user):
        """Verify that ``user`` may run the operation on the instance.

        Raises a humanized ``PermissionDenied`` if the user lacks
        ``acl_level`` on the instance, and ``WrongStateError`` if the
        instance sits on an offline node and the user is not a superuser.
        """
        if not self.instance.has_level(user, self.acl_level):
            raise humanize_exception(ugettext_noop(
                "%(acl_level)s level is required for this operation."),
                PermissionDenied(), acl_level=self.acl_level)

        super(InstanceOperation, self).check_auth(user=user)

        if (self.instance.node and not self.instance.node.online and
                not user.is_superuser):
            raise self.instance.WrongStateError(self.instance)

    def create_activity(self, parent, user, kwargs):
        """Create the activity that records this run of the operation.

        With a ``parent`` activity a sub-activity is created, after checking
        that the parent belongs to the same instance and user (``ValueError``
        otherwise); without one a new ``InstanceActivity`` is created.
        """
        name = self.get_activity_name(kwargs)
        if parent:
            if parent.instance != self.instance:
                raise ValueError("The instance associated with the specified "
                                 "parent activity does not match the instance "
                                 "bound to the operation.")
            if parent.user != user:
                raise ValueError("The user associated with the specified "
                                 "parent activity does not match the user "
                                 "provided as parameter.")

            return parent.create_sub(
                code_suffix=self.get_activity_code_suffix(),
                readable_name=name, resultant_state=self.resultant_state)
        else:
            return InstanceActivity.create(
                code_suffix=self.get_activity_code_suffix(),
                instance=self.instance,
                readable_name=name, user=user,
                concurrency_check=self.concurrency_check,
                resultant_state=self.resultant_state)

    def is_preferred(self):
        """If this is the recommended op in the current state of the instance.
        """
        return False

168

169 170 171 172 173 174 175 176 177 178 179
class RemoteInstanceOperation(RemoteOperationMixin, InstanceOperation):
    """Instance operation carried out by a task sent to a remote queue."""

    # Positional arguments handed to ``instance.get_remote_queue_name``.
    remote_queue = ('vm', 'fast')

    def _get_remote_queue(self):
        """Return the queue name the instance reports for ``remote_queue``."""
        resolve_queue = self.instance.get_remote_queue_name
        return resolve_queue(*self.remote_queue)

    def _get_remote_args(self, **kwargs):
        """Return the base argument list of the task: the VM name only."""
        vm_name = self.instance.vm_name
        return [vm_name]


Bach Dániel committed
180 181 182 183 184 185 186 187 188 189 190 191 192 193
class EnsureAgentMixin(object):
    """Mixin refusing to run unless an agent start was logged since boot."""

    accept_states = ('RUNNING', )

    def check_precond(self):
        """Run the inherited checks, then look for an agent start activity.

        Raises ``NoAgentError`` when no "vm.Instance.agent.starting" activity
        of the instance started after the latest successful deploy, reset or
        reboot activity finished.
        """
        super(EnsureAgentMixin, self).check_precond()

        boot_codes = ("vm.Instance.deploy", "vm.Instance.reset",
                      "vm.Instance.reboot")
        last_boot = self.instance.activity_log.filter(
            succeeded=True, activity_code__in=boot_codes).latest("finished")
        last_boot_time = last_boot.finished

        try:
            agent_starts = InstanceActivity.objects.filter(
                activity_code="vm.Instance.agent.starting",
                started__gt=last_boot_time, instance=self.instance)
            agent_starts.latest("started")
        except InstanceActivity.DoesNotExist:  # no agent since last boot
            raise self.instance.NoAgentError(self.instance)


class RemoteAgentOperation(EnsureAgentMixin, RemoteInstanceOperation):
    """Remote operation sent to the 'agent' queue of the instance."""

    concurrency_check = False
    remote_queue = ('agent', )


205
@register_operation
class AddInterfaceOperation(InstanceOperation):
    """Create a network interface on a VLAN and attach it to the VM."""

    id = 'add_interface'
    name = _("add interface")
    description = _("Add a new network interface for the specified VLAN to "
                    "the VM.")
    required_perms = ()
    accept_states = ('STOPPED', 'PENDING', 'RUNNING')

    def rollback(self, net, activity):
        """Destroy and delete ``net``, recorded as a sub-activity."""
        rollback_name = ugettext_noop("destroy network (rollback)")
        with activity.sub_activity('destroying_net',
                                   readable_name=rollback_name):
            net.destroy()
            net.delete()

    def _operation(self, activity, user, system, vlan, managed=None):
        """Create the interface and, on a running VM, hot-plug it.

        ``managed`` falls back to ``vlan.managed`` when it is None.  Raises a
        humanized ``PermissionDenied`` if ``user`` has no 'user' level on
        ``vlan``.
        """
        if not vlan.has_level(user, 'user'):
            raise humanize_exception(ugettext_noop(
                "User acces to vlan %(vlan)s is required."),
                PermissionDenied(), vlan=vlan)

        if managed is None:
            managed = vlan.managed

        net = Interface.create(base_activity=activity, instance=self.instance,
                               managed=managed, owner=user, vlan=vlan)

        if not self.instance.is_running:
            return  # nothing to attach until the VM runs

        try:
            self.instance._attach_network(
                interface=net, parent_activity=activity)
        except Exception as e:
            # Only errors carrying a ``libvirtError`` attribute trigger the
            # rollback; the error is re-raised in either case.
            if hasattr(e, 'libvirtError'):
                self.rollback(net, activity)
            raise

        net.deploy()
        self.instance._change_ip(parent_activity=activity)
        self.instance._restart_networking(parent_activity=activity)

    def get_activity_name(self, kwargs):
        """Return the readable activity name mentioning the VLAN."""
        template = ugettext_noop("add %(vlan)s interface")
        return create_readable(template, vlan=kwargs['vlan'])

248

249
@register_operation
class CreateDiskOperation(InstanceOperation):
    """Create an empty disk and attach it to the virtual machine."""

    id = 'create_disk'
    name = _("create disk")
    description = _("Create and attach empty disk to the virtual machine.")
    required_perms = ('storage.create_empty_disk', )
    accept_states = ('STOPPED', 'PENDING', 'RUNNING')

    # Name given to the disk when the caller does not provide one.
    default_disk_name = "new disk"

    def _operation(self, user, size, activity, name=None):
        """Create a "qcow2-norm" disk of ``size`` and add it to the instance.

        The disk gets the first letter of a-z not used as ``dev_num`` by the
        disks already on the instance (``IndexError`` if none is left).  On a
        running instance the disk is deployed and attached right away.
        """
        from storage.models import Disk

        if not name:
            name = self.default_disk_name
        disk = Disk.create(size=size, name=name, type="qcow2-norm")
        disk.full_clean()

        # Collect the used letters into a set so that duplicated or
        # unexpected dev_num values cannot break the allocation (the
        # previous list.remove() raised ValueError on them).
        taken = set(d.dev_num for d in self.instance.disks.all())
        free = [letter for letter in ascii_lowercase if letter not in taken]
        disk.dev_num = free.pop(0)
        disk.save()
        self.instance.disks.add(disk)

        if self.instance.is_running:
            with activity.sub_activity(
                'deploying_disk',
                readable_name=ugettext_noop("deploying disk")
            ):
                disk.deploy()
            self.instance._attach_disk(parent_activity=activity, disk=disk)

    def get_activity_name(self, kwargs):
        """Return the readable activity name with disk name and size.

        ``name`` is optional for the operation, so a missing or empty value
        is replaced with the same default name ``_operation`` uses.
        """
        return create_readable(
            ugettext_noop("create disk %(name)s (%(size)s)"),
            size=filesizeformat(kwargs['size']),
            name=kwargs.get('name') or self.default_disk_name)
284 285


286
@register_operation
class ResizeDiskOperation(RemoteInstanceOperation):
    """Grow a virtual disk image through a remote task."""

    id = 'resize_disk'
    name = _("resize disk")
    description = _("Resize the virtual disk image. "
                    "Size must be greater value than the actual size.")
    required_perms = ('storage.resize_disk', )
    accept_states = ('RUNNING', )
    async_queue = "localhost.man.slow"
    remote_queue = ('vm', 'slow')
    task = vm_tasks.resize_disk

    def _get_remote_args(self, disk, size, **kwargs):
        """Extend the inherited arguments with the disk path and new size."""
        base_args = super(ResizeDiskOperation, self)._get_remote_args(
            **kwargs)
        return base_args + [disk.path, size]

    def get_activity_name(self, kwargs):
        """Return the readable activity name with disk name and new size."""
        readable_size = filesizeformat(kwargs['size'])
        return create_readable(
            ugettext_noop("resize disk %(name)s to %(size)s"),
            size=readable_size, name=kwargs['disk'].name)

    def _operation(self, disk, size):
        """Resize ``disk`` remotely, then store the new size on the model.

        Raises a ``HumanReadableException`` if the disk is not resizable.
        """
        if not disk.is_resizable:
            raise HumanReadableException.create(ugettext_noop(
                'Disk type "%(type)s" is not resizable.'), type=disk.type)

        super(ResizeDiskOperation, self)._operation(disk=disk, size=size)

        # Persist the size only after the remote call returned.
        disk.size = size
        disk.save()

316

317
@register_operation
class DownloadDiskOperation(InstanceOperation):
    """Download a disk image from a URL and add it to the instance."""

    id = 'download_disk'
    name = _("download disk")
    description = _("Download and attach disk image (ISO file) for the "
                    "virtual machine. Most operating systems do not detect a "
                    "new optical drive, so you may have to reboot the "
                    "machine.")
    abortable = True
    has_percentage = True
    required_perms = ('storage.download_disk', )
    accept_states = ('STOPPED', 'PENDING', 'RUNNING')
    async_queue = "localhost.man.slow"

    def _operation(self, user, url, task, activity, name=None):
        """Download the image, register it and attach it when possible.

        The disk gets the first letter of a-z not used as ``dev_num`` by the
        disks already on the instance (``IndexError`` if none is left).  The
        activity's readable name and result are updated with the disk name
        and checksum.
        """
        from storage.models import Disk

        disk = Disk.download(url=url, name=name, task=task)

        # Collect the used letters into a set so that duplicated or
        # unexpected dev_num values cannot fail the operation with a
        # ValueError after the download has already completed.
        taken = set(d.dev_num for d in self.instance.disks.all())
        free = [letter for letter in ascii_lowercase if letter not in taken]
        disk.dev_num = free.pop(0)
        disk.full_clean()
        disk.save()
        self.instance.disks.add(disk)

        activity.readable_name = create_readable(
            ugettext_noop("download %(name)s"), name=disk.name)

        activity.result = create_readable(ugettext_noop(
            "Downloading %(url)s is finished. The file md5sum "
            "is: '%(checksum)s'."),
            url=url, checksum=disk.checksum)

        # TODO iso (cd) hot-plug is not supported by kvm/guests
        if self.instance.is_running and disk.type not in ["iso"]:
            self.instance._attach_disk(parent_activity=activity, disk=disk)
352

353

354
@register_operation
class DeployOperation(InstanceOperation):
    """Deploy the disks, the VM and its network, then boot the machine."""

    id = 'deploy'
    name = _("deploy")
    description = _("Deploy and start the virtual machine (including storage "
                    "and network configuration).")
    required_perms = ()
    deny_states = ('SUSPENDED', 'RUNNING')
    resultant_state = 'RUNNING'

    def is_preferred(self):
        """Deploy is the suggested action for stopped/pending/error VMs."""
        return self.instance.status in (self.instance.STATUS.STOPPED,
                                        self.instance.STATUS.PENDING,
                                        self.instance.STATUS.ERROR)

    def on_abort(self, activity, error):
        """Record 'STOPPED' as the resultant state of the failed run."""
        activity.resultant_state = 'STOPPED'

    def on_commit(self, activity):
        """Record 'RUNNING' and a result message naming the node."""
        activity.resultant_state = 'RUNNING'
        activity.result = create_readable(
            ugettext_noop("virtual machine successfully "
                          "deployed to node: %(node)s"),
            node=self.instance.node)

    def _operation(self, activity, node=None):
        """Run the deployment steps in order.

        ``node`` pins the VM to a given node; when it is None the instance
        allocates one itself.
        """
        # Allocate VNC port and host node
        self.instance.allocate_vnc_port()
        if node is not None:
            self.instance.node = node
            self.instance.save()
        else:
            self.instance.allocate_node()

        # Deploy virtual images
        try:
            self.instance._deploy_disks(parent_activity=activity)
        except:  # noqa -- intentionally broad: release resources, re-raise
            self.instance.yield_node()
            self.instance.yield_vnc_port()
            raise

        # Deploy VM on remote machine
        if self.instance.state not in ['PAUSED']:
            self.instance._deploy_vm(parent_activity=activity)

        # Establish network connection (vmdriver)
        with activity.sub_activity(
            'deploying_net', readable_name=ugettext_noop(
                "deploy network")):
            self.instance.deploy_net()

        # Renewing is best effort: a failure must not abort the deployment,
        # but it is logged instead of vanishing, and SystemExit /
        # KeyboardInterrupt are no longer swallowed.
        try:
            self.instance.renew(parent_activity=activity)
        except Exception:
            logger.warning("could not renew %s during deploy",
                           self.instance, exc_info=True)

        self.instance._resume_vm(parent_activity=activity)

        if self.instance.has_agent:
            # Not used as a context manager here -- presumably the
            # interruptible activity is closed elsewhere; TODO confirm.
            activity.sub_activity('os_boot', readable_name=ugettext_noop(
                "wait operating system loading"), interruptible=True)

    @register_operation
    class DeployVmOperation(SubOperationMixin, RemoteInstanceOperation):
        """Sub-operation sending the VM description to the deploy task."""

        id = "_deploy_vm"
        name = _("deploy vm")
        description = _("Deploy virtual machine.")
        remote_queue = ("vm", "slow")
        task = vm_tasks.deploy

        def _get_remote_args(self, **kwargs):
            """Return the VM description as the only task argument."""
            return [self.instance.get_vm_desc()]
            # intentionally not calling super

        def get_activity_name(self, kwargs):
            """Return the readable activity name naming the node."""
            return create_readable(ugettext_noop("deploy virtual machine"),
                                   ugettext_noop("deploy vm to %(node)s"),
                                   node=self.instance.node)

    @register_operation
    class DeployDisksOperation(SubOperationMixin, InstanceOperation):
        """Sub-operation assigning device letters and deploying all disks."""

        id = "_deploy_disks"
        name = _("deploy disks")
        description = _("Deploy all associated disks.")

        def _operation(self):
            """Deploy every disk, fixing clashing device letters first."""
            devnums = list(ascii_lowercase)  # a-z
            for disk in self.instance.disks.all():
                # assign device numbers
                if disk.dev_num in devnums:
                    devnums.remove(disk.dev_num)
                else:
                    disk.dev_num = devnums.pop(0)
                    disk.save()
                # deploy disk
                disk.deploy()

    @register_operation
    class ResumeVmOperation(SubOperationMixin, RemoteInstanceOperation):
        """Sub-operation running the resume task for the VM."""

        id = "_resume_vm"
        name = _("boot virtual machine")
        remote_queue = ("vm", "slow")
        task = vm_tasks.resume

Dudás Ádám committed
459

460
@register_operation
class DestroyOperation(InstanceOperation):
    """Tear down the network, the VM and the disks of an instance."""

    id = 'destroy'
    name = _("destroy")
    description = _("Permanently destroy virtual machine, its network "
                    "settings and disks.")
    required_perms = ()
    resultant_state = 'DESTROYED'

    def on_abort(self, activity, error):
        """Clear the resultant state of a failed run."""
        activity.resultant_state = None

    def _operation(self, activity, system):
        """Destroy everything belonging to the instance and mark it so."""
        # Destroy networks
        with activity.sub_activity(
                'destroying_net',
                readable_name=ugettext_noop("destroy network")):
            if self.instance.node:
                self.instance.shutdown_net()
            self.instance.destroy_net()

        if self.instance.node:
            self.instance._delete_vm(parent_activity=activity)

        # Destroy disks
        with activity.sub_activity(
                'destroying_disks',
                readable_name=ugettext_noop("destroy disks")):
            self.instance.destroy_disks()

        # Delete mem. dump if exists.  Best effort: a failure must not stop
        # the destroy, but it is logged, and SystemExit / KeyboardInterrupt
        # are no longer swallowed.
        try:
            self.instance._delete_mem_dump(parent_activity=activity)
        except Exception:
            logger.debug("could not delete memory dump of %s",
                         self.instance, exc_info=True)

        # Clear node and VNC port association
        self.instance.yield_node()
        self.instance.yield_vnc_port()

        self.instance.destroyed_at = timezone.now()
        self.instance.save()

    @register_operation
    class DeleteVmOperation(SubOperationMixin, RemoteInstanceOperation):
        """Sub-operation running the destroy task for the VM."""

        id = "_delete_vm"
        name = _("destroy virtual machine")
        task = vm_tasks.destroy
        # NOTE(review): a leftover hint here suggested tolerating libvirt
        # "Domain not found" errors; that handling is not implemented.

    @register_operation
    class DeleteMemDumpOperation(RemoteOperationMixin, SubOperationMixin,
                                 InstanceOperation):
        """Sub-operation removing the stored memory dump of the instance."""

        id = "_delete_mem_dump"
        name = _("removing memory dump")
        task = storage_tasks.delete_dump

        def _get_remote_queue(self):
            """Return the 'storage'/'fast' queue of the dump's datastore."""
            return self.instance.mem_dump['datastore'].get_remote_queue_name(
                "storage", "fast")

        def _get_remote_args(self, **kwargs):
            """Return the path of the memory dump as the task argument."""
            return [self.instance.mem_dump['path']]

Dudás Ádám committed
524

525
@register_operation
class MigrateOperation(RemoteInstanceOperation):
    """Move a running VM to another node and rebuild its network there."""

    id = 'migrate'
    name = _("migrate")
    description = _("Move a running virtual machine to an other worker node "
                    "keeping its full state.")
    required_perms = ()
    superuser_required = True
    accept_states = ('RUNNING', )
    async_queue = "localhost.man.slow"
    task = vm_tasks.migrate
    remote_queue = ("vm", "slow")
    remote_timeout = 1000

    def _get_remote_args(self, to_node, live_migration, **kwargs):
        """Extend the inherited arguments with target host and live flag."""
        base_args = super(MigrateOperation, self)._get_remote_args(**kwargs)
        return base_args + [to_node.host.hostname, live_migration]

    def rollback(self, activity):
        """Redeploy the network of the instance as a sub-activity."""
        rollback_name = ugettext_noop("redeploy network (rollback)")
        with activity.sub_activity('rollback_net',
                                   readable_name=rollback_name):
            self.instance.deploy_net()

    def _operation(self, activity, to_node=None, live_migration=True):
        """Migrate the VM, then move its network to the new node.

        Without ``to_node`` the instance selects the target node itself in a
        'scheduling' sub-activity.
        """
        if not to_node:
            schedule_name = ugettext_noop("schedule")
            with activity.sub_activity('scheduling',
                                       readable_name=schedule_name) as sa:
                to_node = self.instance.select_node()
                sa.result = to_node

        try:
            migrate_name = create_readable(
                ugettext_noop("migrate to %(node)s"), node=to_node)
            with activity.sub_activity('migrate_vm',
                                       readable_name=migrate_name):
                super(MigrateOperation, self)._operation(
                    to_node=to_node, live_migration=live_migration)
        except Exception as e:
            # Only errors carrying a ``libvirtError`` attribute trigger the
            # network rollback; the error is re-raised in either case.
            if hasattr(e, 'libvirtError'):
                self.rollback(activity)
            raise

        # Shutdown networks
        shutdown_name = ugettext_noop("shutdown network")
        with activity.sub_activity('shutdown_net',
                                   readable_name=shutdown_name):
            self.instance.shutdown_net()

        # Refresh node information
        self.instance.node = to_node
        self.instance.save()

        # Establish network connection (vmdriver)
        deploy_name = ugettext_noop("deploy network")
        with activity.sub_activity('deploying_net',
                                   readable_name=deploy_name):
            self.instance.deploy_net()
Dudás Ádám committed
583 584


585
@register_operation
class RebootOperation(RemoteInstanceOperation):
    """Warm reboot of a running VM through the reboot task."""

    id = 'reboot'
    name = _("reboot")
    description = _("Warm reboot virtual machine by sending Ctrl+Alt+Del "
                    "signal to its console.")
    required_perms = ()
    accept_states = ('RUNNING', )
    task = vm_tasks.reboot

    def _operation(self, activity):
        """Run the remote task; open an 'os_boot' activity if agent exists."""
        super(RebootOperation, self)._operation()
        if not self.instance.has_agent:
            return
        boot_name = ugettext_noop("wait operating system loading")
        activity.sub_activity('os_boot', readable_name=boot_name,
                              interruptible=True)
Dudás Ádám committed
600 601


602
@register_operation
class RemoveInterfaceOperation(InstanceOperation):
    """Detach (when running) and delete a network interface of the VM."""

    id = 'remove_interface'
    name = _("remove interface")
    description = _("Remove the specified network interface and erase IP "
                    "address allocations, related firewall rules and "
                    "hostnames.")
    required_perms = ()
    accept_states = ('STOPPED', 'PENDING', 'RUNNING')

    def _operation(self, activity, user, system, interface):
        """Remove ``interface``; a running VM gets it unplugged first."""
        vm_is_running = self.instance.is_running
        if vm_is_running:
            self.instance._detach_network(interface=interface,
                                          parent_activity=activity)
            interface.shutdown()

        interface.destroy()
        interface.delete()

    def get_activity_name(self, kwargs):
        """Return the readable activity name naming the interface's VLAN."""
        template = ugettext_noop("remove %(vlan)s interface")
        return create_readable(template, vlan=kwargs['interface'].vlan)
624

625

626
@register_operation
class RemovePortOperation(InstanceOperation):
    """Delete a port forwarding rule that belongs to the instance."""

    id = 'remove_port'
    name = _("close port")
    description = _("Close the specified port.")
    concurrency_check = False
    acl_level = "operator"
    required_perms = ('vm.config_ports', )

    def _operation(self, activity, rule):
        """Delete ``rule`` after checking that it targets this instance.

        Raises ``SuspiciousOperation`` if the interface of the rule's host
        belongs to another instance.
        """
        rule_owner = rule.host.interface_set.get().instance
        if rule_owner != self.instance:
            raise SuspiciousOperation()

        template = ugettext_noop("close %(proto)s/%(port)d on %(host)s")
        activity.readable_name = create_readable(
            template, proto=rule.proto, port=rule.dport, host=rule.host)
        rule.delete()


@register_operation
class AddPortOperation(InstanceOperation):
    """Open a port on a host that belongs to the instance."""

    id = 'add_port'
    name = _("open port")
    description = _("Open the specified port.")
    concurrency_check = False
    acl_level = "operator"
    required_perms = ('vm.config_ports', )

    def _operation(self, activity, host, proto, port):
        """Add the port to ``host`` after checking that it is ours.

        Raises ``SuspiciousOperation`` if the interface of ``host`` belongs
        to another instance.
        """
        host_owner = host.interface_set.get().instance
        if host_owner != self.instance:
            raise SuspiciousOperation()

        host.add_port(proto, private=port)

        template = ugettext_noop("open %(proto)s/%(port)d on %(host)s")
        activity.readable_name = create_readable(
            template, proto=proto, port=port, host=host)


@register_operation
class RemoveDiskOperation(InstanceOperation):
    """Detach a disk from the VM and destroy it."""

    id = 'remove_disk'
    name = _("remove disk")
    description = _("Remove the specified disk from the virtual machine, and "
                    "destroy the data.")
    required_perms = ()
    accept_states = ('STOPPED', 'PENDING', 'RUNNING')

    def _operation(self, activity, user, system, disk):
        """Detach ``disk`` when needed, destroy it and unlink it.

        Disks of type "iso" are never detached.  Returns whatever the
        ``disks.remove`` call of the instance returns.
        """
        if self.instance.is_running:
            if disk.type not in ["iso"]:
                self.instance._detach_disk(
                    disk=disk, parent_activity=activity)

        destroy_name = ugettext_noop('destroy disk')
        with activity.sub_activity('destroy_disk',
                                   readable_name=destroy_name):
            disk.destroy()
            removal_result = self.instance.disks.remove(disk)
        return removal_result

    def get_activity_name(self, kwargs):
        """Return the readable activity name naming the disk."""
        template = ugettext_noop('remove disk %(name)s')
        return create_readable(template, name=kwargs["disk"].name)
685 686


687
@register_operation
class ResetOperation(RemoteInstanceOperation):
    """Cold reboot of a running VM through the reset task."""

    id = 'reset'
    name = _("reset")
    description = _("Cold reboot virtual machine (power cycle).")
    required_perms = ()
    accept_states = ('RUNNING', )
    task = vm_tasks.reset

    def _operation(self, activity):
        """Run the remote task; open an 'os_boot' activity if agent exists."""
        super(ResetOperation, self)._operation()
        if not self.instance.has_agent:
            return
        boot_name = ugettext_noop("wait operating system loading")
        activity.sub_activity('os_boot', readable_name=boot_name,
                              interruptible=True)
Dudás Ádám committed
701 702


703
@register_operation
class SaveAsTemplateOperation(InstanceOperation):
    """Save the instance (parameters, disks, interfaces) as a template."""

    id = 'save_as_template'
    name = _("save as template")
    description = _("Save virtual machine as a template so they can be shared "
                    "with users and groups.  Anyone who has access to a "
                    "template (and to the networks it uses) will be able to "
                    "start an instance of it.")
    has_percentage = True
    abortable = True
    required_perms = ('vm.create_template', )
    accept_states = ('RUNNING', 'STOPPED')
    async_queue = "localhost.man.slow"

    def is_preferred(self):
        """Saving is the suggested action for running base instances."""
        return (self.instance.is_base and
                self.instance.status == self.instance.STATUS.RUNNING)

    @staticmethod
    def _rename(name):
        """Return ``name`` with its trailing " v<N>" version incremented.

        Names without such a suffix get " v1" appended.  A single regular
        expression is used, so a name that does not match as a whole simply
        takes the "no suffix" path instead of failing.
        """
        m = search(r"^(.*) v(\d+)$", name)
        if m:
            name = m.group(1)
            v = int(m.group(2)) + 1
        else:
            v = 1
        return "%s v%d" % (name, v)

    def on_abort(self, activity, error):
        """Destroy the disks collected so far by the failed run."""
        # NOTE(review): ``self.disks`` may also hold original disks of the
        # instance (those that raised WrongDiskTypeError on save) -- confirm
        # that destroying them here is intended.
        if hasattr(self, 'disks'):
            for disk in self.disks:
                disk.destroy()

    def _operation(self, activity, user, system, name=None,
                   with_shutdown=True, clone=False, task=None, **kwargs):
        """Create a template from the instance and return a result message.

        ``name`` defaults to the versioned name of the instance; extra
        ``kwargs`` override the template parameters copied from the instance.
        With ``with_shutdown`` the VM is shut down first; with ``clone`` the
        ACL of the instance's template is copied to the new one.
        """
        # Cleanup is best effort: a failure must not block saving, but it is
        # logged, and SystemExit / KeyboardInterrupt are no longer swallowed.
        try:
            self.instance._cleanup(parent_activity=activity, user=user)
        except Exception:
            logger.debug("cleanup of %s failed before saving as template",
                         self.instance, exc_info=True)

        if with_shutdown:
            try:
                self.instance.shutdown(parent_activity=activity,
                                       user=user, task=task)
            except Instance.WrongStateError:
                pass  # not in a state that allows shutdown; carry on

        # prepare parameters
        params = {
            'access_method': self.instance.access_method,
            'arch': self.instance.arch,
            'boot_menu': self.instance.boot_menu,
            'description': self.instance.description,
            'lease': self.instance.lease,  # Can be problem in new VM
            'max_ram_size': self.instance.max_ram_size,
            'name': name or self._rename(self.instance.name),
            'num_cores': self.instance.num_cores,
            'owner': user,
            'parent': self.instance.template or None,  # Can be problem
            'priority': self.instance.priority,
            'ram_size': self.instance.ram_size,
            'raw_data': self.instance.raw_data,
            'system': self.instance.system,
        }
        params.update(kwargs)
        params.pop("parent_activity", None)

        from storage.models import Disk

        def _try_save_disk(disk):
            """Return a saved copy of ``disk``, or the disk itself when its
            type cannot be saved."""
            try:
                return disk.save_as(task)
            except Disk.WrongDiskTypeError:
                return disk

        self.disks = []
        for disk in self.instance.disks.all():
            with activity.sub_activity(
                'saving_disk',
                readable_name=create_readable(
                    ugettext_noop("saving disk %(name)s"),
                    name=disk.name)
            ):
                self.disks.append(_try_save_disk(disk))

        # create template and do additional setup
        tmpl = InstanceTemplate(**params)
        tmpl.full_clean()  # Avoiding database errors.
        tmpl.save()
        # Copy traits from the VM instance
        tmpl.req_traits.add(*self.instance.req_traits.all())
        if clone:
            tmpl.clone_acl(self.instance.template)
            # Add permission for the original owner of the template
            tmpl.set_level(self.instance.template.owner, 'owner')
            tmpl.set_level(user, 'owner')
        try:
            tmpl.disks.add(*self.disks)
            # create interface templates
            for i in self.instance.interface_set.all():
                i.save_as_template(tmpl)
        except:  # noqa -- intentionally broad: drop the template, re-raise
            tmpl.delete()
            raise
        else:
            return create_readable(
                ugettext_noop("New template: %(template)s"),
                template=reverse('dashboard.views.template-detail',
                                 kwargs={'pk': tmpl.pk}))
Dudás Ádám committed
812 813


814
@register_operation
class ShutdownOperation(AbortableRemoteOperationMixin,
                        RemoteInstanceOperation):
    """Abortable remote operation bound to ``vm_tasks.shutdown``.

    Accepted only for ``RUNNING`` instances; the declared resultant state
    is ``STOPPED``.
    """
    id = 'shutdown'
    name = _("shutdown")
    description = _("Try to halt virtual machine by a standard ACPI signal, "
                    "allowing the operating system to keep a consistent "
                    "state. The operation will fail if the machine does not "
                    "turn itself off in a period.")
    abortable = True
    required_perms = ()
    accept_states = ('RUNNING', )
    resultant_state = 'STOPPED'
    task = vm_tasks.shutdown
    remote_queue = ("vm", "slow")
    remote_timeout = 180

    def _operation(self, task):
        """Run the inherited remote operation, then call ``yield_node()``.

        :param task: forwarded unchanged to the parent ``_operation``.
        """
        super(ShutdownOperation, self)._operation(task=task)
        self.instance.yield_node()

    def on_abort(self, activity, error):
        """Handle an aborted shutdown.

        A ``TimeLimitExceeded`` error gets a human readable explanation and
        clears the activity's resultant state; every other error is handed
        to the parent implementation.
        """
        if not isinstance(error, TimeLimitExceeded):
            super(ShutdownOperation, self).on_abort(activity, error)
            return

        activity.result = humanize_exception(ugettext_noop(
            "The virtual machine did not switch off in the provided time "
            "limit. Most of the time this is caused by incorrect ACPI "
            "settings. You can also try to power off the machine from the "
            "operating system manually."), error)
        activity.resultant_state = None

Dudás Ádám committed
846

847
@register_operation
class ShutOffOperation(InstanceOperation):
    """Forced power-off of an instance.

    Accepted for ``RUNNING`` and ``PAUSED`` instances; the declared
    resultant state is ``STOPPED``.
    """
    id = 'shut_off'
    name = _("shut off")
    description = _("Forcibly halt a virtual machine without notifying the "
                    "operating system. This operation will even work in cases "
                    "when shutdown does not, but the operating system and the "
                    "file systems are likely to be in an inconsistent state,  "
                    "so data loss is also possible. The effect of this "
                    "operation is the same as interrupting the power supply "
                    "of a physical machine.")
    required_perms = ()
    accept_states = ('RUNNING', 'PAUSED')
    resultant_state = 'STOPPED'

    def _operation(self, activity):
        """Shut down networking, delete the VM and yield the node.

        :param activity: parent activity; the network shutdown is recorded
                         as its ``shutdown_net`` sub-activity.
        """
        net_label = ugettext_noop("shutdown network")
        with activity.sub_activity('shutdown_net', readable_name=net_label):
            self.instance.shutdown_net()

        self.instance._delete_vm(parent_activity=activity)
        self.instance.yield_node()
Dudás Ádám committed
871 872


873
@register_operation
class SleepOperation(InstanceOperation):
    """Suspend a ``RUNNING`` instance; the resultant state is ``SUSPENDED``."""
    id = 'sleep'
    name = _("sleep")
    description = _("Suspend virtual machine. This means the machine is "
                    "stopped and its memory is saved to disk, so if the "
                    "machine is waked up, all the applications will keep "
                    "running. Most of the applications will be able to "
                    "continue even after a long suspension, but those which "
                    "need a continous network connection may fail when "
                    "resumed. In the meantime, the machine will only use "
                    "storage resources, and keep network resources allocated.")
    required_perms = ()
    accept_states = ('RUNNING', )
    resultant_state = 'SUSPENDED'
    async_queue = "localhost.man.slow"

    def is_preferred(self):
        """Return whether the instance is a running, non-base machine."""
        vm = self.instance
        if vm.is_base:
            return False
        return vm.status == vm.STATUS.RUNNING

    def on_abort(self, activity, error):
        """Clear the resultant state on a time limit, else mark ``ERROR``."""
        timed_out = isinstance(error, TimeLimitExceeded)
        activity.resultant_state = None if timed_out else 'ERROR'

    def _operation(self, activity, system):
        """Shut down networking, suspend the VM and yield the node.

        :param activity: parent activity of the recorded sub-steps.
        :param system: accepted but not used by this method.
        """
        net_label = ugettext_noop("shutdown network")
        with activity.sub_activity('shutdown_net', readable_name=net_label):
            self.instance.shutdown_net()
        self.instance._suspend_vm(parent_activity=activity)
        self.instance.yield_node()

    @register_operation
    class SuspendVmOperation(SubOperationMixin, RemoteInstanceOperation):
        """Sub-operation running ``vm_tasks.sleep`` on the remote queue."""
        id = "_suspend_vm"
        name = _("suspend virtual machine")
        task = vm_tasks.sleep
        remote_queue = ("vm", "slow")
        remote_timeout = 1000

        def _get_remote_args(self, **kwargs):
            """Append the memory dump path to the inherited remote args."""
            base_args = super(SleepOperation.SuspendVmOperation,
                              self)._get_remote_args(**kwargs)
            return base_args + [self.instance.mem_dump['path']]
Dudás Ádám committed
920 921


922
@register_operation
class WakeUpOperation(InstanceOperation):
    """Resume a ``SUSPENDED`` instance; the resultant state is ``RUNNING``."""
    id = 'wake_up'
    name = _("wake up")
    description = _("Wake up sleeping (suspended) virtual machine. This will "
                    "load the saved memory of the system and start the "
                    "virtual machine from this state.")
    required_perms = ()
    accept_states = ('SUSPENDED', )
    resultant_state = 'RUNNING'
    async_queue = "localhost.man.slow"

    def is_preferred(self):
        """Return whether the instance is currently suspended."""
        return self.instance.status == self.instance.STATUS.SUSPENDED

    def on_abort(self, activity, error):
        """Clear the resultant state on ``SchedulerError``, else ``ERROR``."""
        if isinstance(error, SchedulerError):
            activity.resultant_state = None
        else:
            activity.resultant_state = 'ERROR'

    def _operation(self, activity):
        """Allocate resources, resume the VM, deploy its network and renew.

        :param activity: parent activity of the recorded sub-steps.
        """
        # Schedule vm
        self.instance.allocate_vnc_port()
        self.instance.allocate_node()

        # Resume vm
        self.instance._wake_up_vm(parent_activity=activity)

        # Establish network connection (vmdriver)
        with activity.sub_activity(
            'deploying_net', readable_name=ugettext_noop(
                "deploy network")):
            self.instance.deploy_net()

        # Renewal is best effort: a failure must not undo the wake up, but
        # it is logged instead of being dropped silently.  Catching
        # Exception (not a bare except) lets SystemExit and
        # KeyboardInterrupt propagate.
        try:
            self.instance.renew(parent_activity=activity)
        except Exception:
            logger.exception('Unhandled error in renew() after wake up')

    @register_operation
    class WakeUpVmOperation(SubOperationMixin, RemoteInstanceOperation):
        """Sub-operation running ``vm_tasks.wake_up`` on the remote queue."""
        id = "_wake_up_vm"
        name = _("resume virtual machine")
        task = vm_tasks.wake_up
        remote_queue = ("vm", "slow")
        remote_timeout = 1000

        def _get_remote_args(self, **kwargs):
            """Append the memory dump path to the inherited remote args."""
            return (super(WakeUpOperation.WakeUpVmOperation, self)
                    ._get_remote_args(**kwargs) +
                    [self.instance.mem_dump['path']])
974

Dudás Ádám committed
975

976
@register_operation
class RenewOperation(InstanceOperation):
    """Recompute and store the suspend and delete times of an instance."""
    id = 'renew'
    name = _("renew")
    description = _("Virtual machines are suspended and destroyed after they "
                    "expire. This operation renews expiration times according "
                    "to the lease type. If the machine is close to the "
                    "expiration, its owner will be notified.")
    acl_level = "operator"
    required_perms = ()
    concurrency_check = False

    def set_time_of_suspend(self, activity, suspend, force):
        """Set ``instance.time_of_suspend`` inside a sub-activity.

        :param activity: parent activity.
        :param suspend: new suspension time (may be falsy).
        :param force: when true, allow moving the time earlier.
        :raises HumanReadableException: if ``force`` is false and the new
            time is earlier than the currently stored one.
        """
        with activity.sub_activity(
            'renew_suspend', concurrency_check=False,
                readable_name=ugettext_noop('set time of suspend')):
            if (not force and suspend and self.instance.time_of_suspend and
                    suspend < self.instance.time_of_suspend):
                raise HumanReadableException.create(ugettext_noop(
                    "Renewing the machine with the selected lease would "
                    "result in its suspension time get earlier than before."))
            self.instance.time_of_suspend = suspend

    def set_time_of_delete(self, activity, delete, force):
        """Set ``instance.time_of_delete`` inside a sub-activity.

        :param activity: parent activity.
        :param delete: new deletion time (may be falsy).
        :param force: when true, allow moving the time earlier.
        :raises HumanReadableException: if ``force`` is false and the new
            time is earlier than the currently stored one.
        """
        with activity.sub_activity(
            'renew_delete', concurrency_check=False,
                readable_name=ugettext_noop('set time of delete')):
            if (not force and delete and self.instance.time_of_delete and
                    delete < self.instance.time_of_delete):
                raise HumanReadableException.create(ugettext_noop(
                    "Renewing the machine with the selected lease would "
                    "result in its delete time get earlier than before."))
            self.instance.time_of_delete = delete

    def _operation(self, activity, lease=None, force=False, save=False):
        """Renew both expiration times and save the instance.

        :param activity: parent activity.
        :param lease: passed to ``instance.get_renew_times()``; stored on
                      the instance only when ``save`` is true.
        :param force: allow the times to move earlier.
        :param save: also persist ``lease`` as the instance's lease.
        :returns: readable message with the resulting suspend/delete times.
        """
        suspend, delete = self.instance.get_renew_times(lease)
        # Each time is updated independently: a rejected suspend time must
        # not prevent the delete time from being renewed, and vice versa.
        try:
            self.set_time_of_suspend(activity, suspend, force)
        except HumanReadableException:
            pass
        try:
            self.set_time_of_delete(activity, delete, force)
        except HumanReadableException:
            pass

        if save:
            self.instance.lease = lease

        self.instance.save()

        # Report the delete time in the "destroy at" slot (the suspend time
        # used to be reported twice here).
        return create_readable(ugettext_noop(
            "Renewed to suspend at %(suspend)s and destroy at %(delete)s."),
            suspend=self.instance.time_of_suspend,
            delete=self.instance.time_of_delete)
1030 1031


1032
@register_operation
class ChangeStateOperation(InstanceOperation):
    """Force the state recorded for an instance (``NOSTATE`` by default)."""
    id = 'emergency_change_state'
    name = _("emergency state change")
    description = _("Change the virtual machine state to NOSTATE. This "
                    "should only be used if manual intervention was needed in "
                    "the virtualization layer, and the machine has to be "
                    "redeployed without losing its storage and network "
                    "resources.")
    acl_level = "owner"
    required_perms = ('vm.emergency_change_state', )
    concurrency_check = False

    def _operation(self, user, activity, new_state="NOSTATE", interrupt=False,
                   reset_node=False):
        """Set the resultant state and optionally clean up around it.

        :param user: accepted but not used by this method.
        :param activity: activity whose ``resultant_state`` is set.
        :param new_state: value stored as the resultant state.
        :param interrupt: finish every unfinished activity of the instance
                          as failed.
        :param reset_node: clear the instance's node and save the instance.
        """
        activity.resultant_state = new_state

        if interrupt:
            text = ugettext_noop("Activity is forcibly interrupted.")
            reason = create_readable(text, text)
            unfinished = InstanceActivity.objects.filter(
                finished__isnull=True, instance=self.instance)
            for pending in unfinished:
                pending.finish(False, result=reason)
                logger.error('Forced finishing activity %s', pending)

        if reset_node:
            self.instance.node = None
            self.instance.save()

1060

1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085
@register_operation
class RedeployOperation(InstanceOperation):
    """Reset or shut off an instance, then deploy it again."""
    id = 'redeploy'
    name = _("redeploy")
    description = _("Change the virtual machine state to NOSTATE "
                    "and redeploy the VM. This operation allows starting "
                    "machines formerly running on a failed node.")
    acl_level = "owner"
    required_perms = ('vm.redeploy', )
    concurrency_check = False

    def _operation(self, user, activity, with_emergency_change_state=True):
        """Run the preparatory operation followed by a deploy.

        :param user: user passed on to the chained operations.
        :param activity: parent activity of the chained operations.
        :param with_emergency_change_state: when true, force ``NOSTATE``
            with a node reset; otherwise shut the machine off.
        """
        shared = dict(parent_activity=activity, user=user)

        if not with_emergency_change_state:
            ShutOffOperation(self.instance).call(**shared)
        else:
            ChangeStateOperation(self.instance).call(
                new_state='NOSTATE', interrupt=False, reset_node=True,
                **shared)

        self.instance._update_status()

        DeployOperation(self.instance).call(**shared)

1086

1087
class NodeOperation(Operation):
    """Base class of operations whose subject is a ``Node``."""
    async_operation = abortable_async_node_operation
    host_cls = Node
    online_required = True
    superuser_required = True

    def __init__(self, node):
        """Bind the operation to ``node`` (also passed on as the subject)."""
        super(NodeOperation, self).__init__(subject=node)
        self.node = node

    def check_precond(self):
        """Run the inherited checks, then reject offline nodes if required."""
        super(NodeOperation, self).check_precond()
        if not self.online_required or self.node.online:
            return
        raise humanize_exception(ugettext_noop(
            "You cannot call this operation on an offline node."),
            Exception())

    def create_activity(self, parent, user, kwargs):
        """Create the activity that records this operation.

        :param parent: parent activity, or a falsy value for a top-level
                       activity.
        :param user: user the activity is created for.
        :param kwargs: operation arguments, used to build the readable name.
        :returns: sub-activity of ``parent`` or a new ``NodeActivity``.
        :raises ValueError: if ``parent`` belongs to another node or user.
        """
        name = self.get_activity_name(kwargs)

        if not parent:
            return NodeActivity.create(
                code_suffix=self.get_activity_code_suffix(), node=self.node,
                user=user, readable_name=name)

        if parent.node != self.node:
            raise ValueError("The node associated with the specified "
                             "parent activity does not match the node "
                             "bound to the operation.")
        if parent.user != user:
            raise ValueError("The user associated with the specified "
                             "parent activity does not match the user "
                             "provided as parameter.")

        return parent.create_sub(
            code_suffix=self.get_activity_code_suffix(),
            readable_name=name)
1123 1124


1125
@register_operation
class ResetNodeOperation(NodeOperation):
    """Redeploy every instance of a node, then disable the node."""
    id = 'reset'
    name = _("reset")
    description = _("Disable missing node and redeploy all instances "
                    "on other ones.")
    required_perms = ()
    online_required = False
    async_queue = "localhost.man.slow"

    def check_precond(self):
        """Allow the reset only for an enabled node that is not online."""
        super(ResetNodeOperation, self).check_precond()
        node = self.node
        if not node.enabled or node.online:
            raise humanize_exception(ugettext_noop(
                "You cannot reset a disabled or online node."), Exception())

    def _operation(self, activity, user):
        """Redeploy each hosted instance and switch the node off.

        :param activity: parent activity; one sub-activity per instance.
        :param user: user passed to every ``redeploy`` call.
        """
        for vm in self.node.instance_set.all():
            label = create_readable(
                ugettext_noop("redeploy %(instance)s (%(pk)s)"),
                instance=vm.name, pk=vm.pk)
            with activity.sub_activity('migrate_instance_%d' % vm.pk,
                                       readable_name=label):
                vm.redeploy(user=user)

        self.node.enabled = False
        self.node.schedule_enabled = False
        self.node.save()

1153 1154

@register_operation
class FlushOperation(NodeOperation):
    """Passivate a node if needed and migrate all of its instances."""
    id = 'flush'
    name = _("flush")
    description = _("Passivate node and move all instances to other ones.")
    required_perms = ()
    async_queue = "localhost.man.slow"

    def _operation(self, activity, user):
        """Passivate the node when scheduling is on, then migrate each VM.

        :param activity: parent activity; one sub-activity per instance.
        :param user: user passed to the chained operations.
        """
        if self.node.schedule_enabled:
            PassivateOperation(self.node).call(
                parent_activity=activity, user=user)

        for vm in self.node.instance_set.all():
            label = create_readable(
                ugettext_noop("migrate %(instance)s (%(pk)s)"),
                instance=vm.name, pk=vm.pk)
            with activity.sub_activity('migrate_instance_%d' % vm.pk,
                                       readable_name=label):
                vm.migrate(user=user)
1172 1173


1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190
@register_operation
class ActivateOperation(NodeOperation):
    """Enable a node and allow scheduling onto it."""
    id = 'activate'
    name = _("activate")
    description = _("Make node active, i.e. scheduler is allowed to deploy "
                    "virtual machines to it.")
    required_perms = ()

    def check_precond(self):
        """Run the inherited checks, then reject an already active node."""
        super(ActivateOperation, self).check_precond()
        node = self.node
        if node.enabled and node.schedule_enabled:
            raise humanize_exception(ugettext_noop(
                "You cannot activate an active node."), Exception())

    def _operation(self):
        """Set both flags, refresh the node info cache and save the node."""
        node = self.node
        node.enabled = True
        node.schedule_enabled = True
        node.get_info(invalidate_cache=True)
        node.save()


@register_operation
class PassivateOperation(NodeOperation):
    """Keep a node enabled but exclude it from scheduling."""
    id = 'passivate'
    name = _("passivate")
    description = _("Make node passive, i.e. scheduler is denied to deploy "
                    "virtual machines to it, but remaining instances and "
                    "the ones manually migrated will continue running.")
    required_perms = ()

    def check_precond(self):
        """Reject an already passive node, then run the inherited checks."""
        node = self.node
        if node.enabled and not node.schedule_enabled:
            raise humanize_exception(ugettext_noop(
                "You cannot passivate a passive node."), Exception())
        super(PassivateOperation, self).check_precond()

    def _operation(self):
        """Enable the node, turn scheduling off, refresh info and save."""
        node = self.node
        node.enabled = True
        node.schedule_enabled = False
        node.get_info(invalidate_cache=True)
        node.save()


@register_operation
class DisableOperation(NodeOperation):
    """Turn off both the ``enabled`` and ``schedule_enabled`` node flags."""
    id = 'disable'
    name = _("disable")
    description = _("Disable node.")
    required_perms = ()
    online_required = False

    def check_precond(self):
        """Reject disabled nodes and nodes that still host instances.

        The inherited checks run only after both local checks passed.
        """
        node = self.node
        if not node.enabled:
            raise humanize_exception(ugettext_noop(
                "You cannot disable a disabled node."), Exception())
        if node.instance_set.exists():
            raise humanize_exception(ugettext_noop(
                "You cannot disable a node which is hosting instances."),
                Exception())
        super(DisableOperation, self).check_precond()

    def _operation(self):
        """Clear both flags and save the node."""
        node = self.node
        node.enabled = False
        node.schedule_enabled = False
        node.save()
1239 1240


1241
@register_operation
class UpdateNodeOperation(NodeOperation):
    """Upgrade packages and apply the ``node`` Salt state on a node."""
    id = 'update_node'
    name = _("update node")
    description = _("Upgrade or install node software (vmdriver, agentdriver, "
                    "monitor-client) with Salt.")
    required_perms = ()
    online_required = False
    async_queue = "localhost.man.slow"

    def minion_cmd(self, module, params, timeout=3600):
        """Run a Salt module on the node's host and return its result dict.

        :param module: Salt module name passed to ``LocalClient.cmd``.
        :param params: argument list for the module.
        :param timeout: timeout passed to ``LocalClient.cmd``.
        :raises HumanReadableException: if the reply has no entry for the
            host name, or that entry is not a dict.
        """
        # see https://git.ik.bme.hu/circle/cloud/issues/377
        from salt.client import LocalClient
        hostname = self.node.host.hostname
        client = LocalClient()
        reply = client.cmd(hostname, module, params, timeout=timeout)

        try:
            result = reply[hostname]
        except KeyError:
            raise HumanReadableException.create(ugettext_noop(
                "No minions matched the target (%(target)s). "
                "Data: (%(data)s)"), target=hostname, data=reply)

        if isinstance(result, dict):
            return result

        raise HumanReadableException.create(ugettext_noop(
            "Unhandled exception: %(msg)s"), msg=unicode(result))

    def _operation(self, activity):
        """Upgrade packages, then apply the ``node`` state.

        Each state entry that failed or reported changes is recorded as its
        own sub-activity.

        :param activity: parent activity.
        :raises HumanReadableException: if the upgrade reply has no truthy
            ``result`` or at least one state failed.
        """
        with activity.sub_activity(
                'upgrade_packages',
                readable_name=ugettext_noop('upgrade packages')) as sa:
            reply = self.minion_cmd('pkg.upgrade', [])
            if not reply.get('result'):
                raise HumanReadableException.create(ugettext_noop(
                    "Unhandled exception: %(msg)s"), msg=unicode(reply))

            # reply = {'vim': {'new': '1.2.7', 'old': '1.3.7'}}
            upgraded = installed = removed = 0
            for change in reply.values():
                if not isinstance(change, dict):
                    continue
                old, new = change.get('old'), change.get('new')
                if old and new:
                    upgraded += 1
                elif new:
                    installed += 1
                elif old:
                    removed += 1
            sa.result = create_readable(ugettext_noop(
                "Upgraded: %(upgraded)s, Installed: %(installed)s, "
                "Removed: %(removed)s"), upgraded=upgraded,
                installed=installed, removed=removed)

        states = self.minion_cmd('state.sls', ['node'])
        failed = 0
        for state_id, outcome in states.iteritems():
            logger.debug('salt state %s %s', state_id, outcome)
            act_name = ': '.join(state_id.split('_|-')[:2])
            if outcome["result"] and not outcome["changes"]:
                # Successful entries without changes are not recorded.
                continue
            act = activity.create_sub(
                act_name[:70], readable_name=act_name)
            act.result = create_readable(ugettext_noop(
                "Changes: %(changes)s Comment: %(comment)s"),
                changes=outcome["changes"], comment=outcome["comment"])
            act.finish(outcome["result"])
            if not outcome["result"]:
                failed += 1

        if failed:
            raise HumanReadableException.create(ugettext_noop(
                "Failed: %(failed)s"), failed=failed)


@register_operation
class ScreenshotOperation(RemoteInstanceOperation):
    """Remote operation bound to ``vm_tasks.screenshot``.

    Accepted only for ``RUNNING`` instances and requires owner level.
    """
    # identification and user-facing texts
    id = 'screenshot'
    name = _("screenshot")
    description = _("Get a screenshot about the virtual machine's console. A "
                    "key will be pressed on the keyboard to stop "
                    "screensaver.")

    # access control and state constraints
    acl_level = "owner"
    required_perms = ()
    accept_states = ('RUNNING', )

    # remote task to execute
    task = vm_tasks.screenshot
1325 1326


1327
@register_operation
class RecoverOperation(InstanceOperation):
    """Bring a ``DESTROYED`` instance back to the ``PENDING`` state."""
    id = 'recover'
    name = _("recover")
    description = _("Try to recover virtual machine disks from destroyed "
                    "state. Network resources (allocations) are already lost, "
                    "so you will have to manually add interfaces afterwards.")
    acl_level = "owner"
    required_perms = ('vm.recover', )
    accept_states = ('DESTROYED', )
    resultant_state = 'PENDING'

    def check_precond(self):
        """Run the inherited checks, tolerating a destroyed instance."""
        try:
            super(RecoverOperation, self).check_precond()
        except Instance.InstanceDestroyedError:
            # A destroyed instance is exactly what this operation expects.
            pass

    def _operation(self, user, activity):
        """Restore the disks, reset the instance, renew and re-add NICs.

        :param user: user passed to the ``add_interface`` calls.
        :param activity: parent activity of the recorded sub-steps.
        """
        with activity.sub_activity(
            'recover_instance',
                readable_name=ugettext_noop("recover instance")):
            self.instance.destroyed_at = None
            for disk in self.instance.disks.all():
                disk.destroyed = None
                disk.restore()
                disk.save()
            self.instance.status = 'PENDING'
            self.instance.save()

        # Renewal is best effort: a failure must not abort the recovery,
        # but it is logged instead of being dropped silently.  Catching
        # Exception (not a bare except) lets SystemExit and
        # KeyboardInterrupt propagate.
        try:
            self.instance.renew(parent_activity=activity)
        except Exception:
            logger.exception('Unhandled error in renew() during recover')

        # Recreate one interface per interface template of the template.
        if self.instance.template:
            for net in self.instance.template.interface_set.all():
                self.instance.add_interface(
                    parent_activity=activity, user=user, vlan=net.vlan)
Bach Dániel committed
1366 1367


1368
@register_operation
class ResourcesOperation(InstanceOperation):
    """Change the core count, RAM sizes and priority of an instance."""
    id = 'resources_change'
    name = _("resources change")
    description = _("Change resources of a stopped virtual machine.")
    acl_level = "owner"
    required_perms = ('vm.change_resources', )
    accept_states = ('STOPPED', 'PENDING', 'RUNNING')

    def _operation(self, user, activity,
                   num_cores, ram_size, max_ram_size, priority,
                   with_shutdown=False, task=None):
        """Shut the machine down if possible and store the new resources.

        :param user: accepted but not used by this method.
        :param activity: parent activity of the shutdown.
        :param num_cores: new value of ``instance.num_cores``.
        :param ram_size: new value of ``instance.ram_size``.
        :param max_ram_size: new value of ``instance.max_ram_size``.
        :param priority: new value of ``instance.priority``.
        :param with_shutdown: must be true to allow a running machine.
        :param task: forwarded to ``instance.shutdown``.
        :raises Instance.WrongStateError: if the machine is running and
            ``with_shutdown`` is false.
        :returns: readable summary of priority, cores and RAM size.
        """
        vm = self.instance

        if vm.status == 'RUNNING' and not with_shutdown:
            raise Instance.WrongStateError(vm)

        try:
            vm.shutdown(parent_activity=activity, task=task)
        except Instance.WrongStateError:
            # Shutdown refused because of the current state: carry on.
            pass

        vm._update_status()

        vm.num_cores = num_cores
        vm.ram_size = ram_size
        vm.max_ram_size = max_ram_size
        vm.priority = priority

        vm.full_clean()
        vm.save()

        summary = ugettext_noop(
            "Priority: %(priority)s, Num cores: %(num_cores)s, "
            "Ram size: %(ram_size)s")
        return create_readable(
            summary, priority=priority, num_cores=num_cores,
            ram_size=ram_size)

1404

1405
@register_operation
class PasswordResetOperation(RemoteAgentOperation):
    """Agent operation bound to ``agent_tasks.change_password``."""
    id = 'password_reset'
    name = _("password reset")
    description = _("Generate and set a new login password on the virtual "
                    "machine. This operation requires the agent running. "
                    "Resetting the password is not warranted to allow you "
                    "logging in as other settings are possible to prevent "
                    "it.")
    acl_level = "owner"
    task = agent_tasks.change_password
    required_perms = ()

    def _get_remote_args(self, password, **kwargs):
        """Append ``password`` to the inherited remote arguments."""
        inherited = super(
            PasswordResetOperation, self)._get_remote_args(**kwargs)
        return inherited + [password]

    def _operation(self, password=None):
        """Set the password remotely and store it on the instance.

        :param password: password to set; a falsy value makes ``pwgen()``
                         supply one.
        """
        password = password or pwgen()
        super(PasswordResetOperation, self)._operation(password=password)
        self.instance.pw = password
        self.instance.save()
1428 1429


1430
@register_operation
class InstallKeysOperation(RemoteAgentOperation):
    """Agent operation bound to ``agent_tasks.add_keys``."""
    id = 'install_keys'
    name = _("install SSH keys")
    description = _("Copy your public keys to the virtual machines. "
                    "Only works on UNIX-like operating systems.")
    acl_level = "user"
    task = agent_tasks.add_keys
    required_perms = ()

    def _get_remote_args(self, user, keys=None, **kwargs):
        """Append the key list to the inherited remote arguments.

        :param user: user whose stored keys are used when ``keys`` is None.
        :param keys: explicit list of keys, or None.
        """
        selected = keys
        if selected is None:
            selected = list(user.userkey_set.values_list('key', flat=True))
        inherited = super(
            InstallKeysOperation, self)._get_remote_args(**kwargs)
        return inherited + [selected]
1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455


@register_operation
class RemoveKeysOperation(RemoteAgentOperation):
    """Agent operation bound to ``agent_tasks.del_keys``."""
    id = 'remove_keys'
    name = _("remove SSH keys")
    acl_level = "user"
    task = agent_tasks.del_keys
    required_perms = ()

    def _get_remote_args(self, user, keys, **kwargs):
        """Append ``keys`` to the inherited remote arguments.

        :param user: accepted but not used by this method.
        :param keys: keys handed to the remote task.
        """
        inherited = super(
            RemoveKeysOperation, self)._get_remote_args(**kwargs)
        return inherited + [keys]
1458 1459 1460


@register_operation
class AgentStartedOperation(InstanceOperation):
    """Operation run when the guest agent reports that it has started."""
    id = 'agent_started'
    name = _("agent")
    acl_level = "owner"
    required_perms = ()
    concurrency_check = False

    @classmethod
    def get_activity_code_suffix(cls):
        """Return the fixed activity code suffix ``'agent'``."""
        return 'agent'

    @property
    def initialized(self):
        """Whether a ``vm.Instance.agent._cleanup`` activity already exists."""
        return self.instance.activity_log.filter(
            activity_code='vm.Instance.agent._cleanup').exists()

    def measure_boot_time(self):
        """Send the time elapsed since the latest deploy as a metric.

        Does nothing when the instance has no template.
        """
        if not self.instance.template:
            return

        deploy_time = InstanceActivity.objects.filter(
            instance=self.instance, activity_code="vm.Instance.deploy"
        ).latest("finished").finished

        total_boot_time = (timezone.now() - deploy_time).total_seconds()

        Client().send([
            "template.%(pk)d.boot_time %(val)f %(time)s" % {
                'pk': self.instance.template.pk,
                'val': total_boot_time,
                'time': time.time(),
            }
        ])

    def finish_agent_wait(self):
        """Finish the unfinished ``.os_boot``/``.agent_wait`` activities."""
        for i in InstanceActivity.objects.filter(
                (Q(activity_code__endswith='.os_boot') |
                 Q(activity_code__endswith='.agent_wait')),
                instance=self.instance, finished__isnull=True):
            i.finish(True)

    def _operation(self, user, activity, old_version=None, agent_system=None):
        """Configure the guest after its agent has started.

        :param user: accepted but not used by this method.
        :param activity: parent activity of the recorded sub-steps.
        :param old_version: agent version reported by the guest, if any.
        :param agent_system: forwarded to ``instance.update_agent``.
        """
        with activity.sub_activity('starting', concurrency_check=False,
                                   readable_name=ugettext_noop('starting')):
            pass

        self.finish_agent_wait()

        self.instance._change_ip(parent_activity=activity)
        self.instance._restart_networking(parent_activity=activity)

        new_version = settings.AGENT_VERSION
        if new_version and old_version and new_version != old_version:
            try:
                self.instance.update_agent(
                    parent_activity=activity, agent_system=agent_system)
            except TimeoutError:
                pass
            else:
                # NOTE(review): called without ``with``; presumably this
                # only opens the sub-activity so that finish_agent_wait()
                # can close it after the agent restarted -- confirm.
                activity.sub_activity(
                    'agent_wait', readable_name=ugettext_noop(
                        "wait agent restarting"), interruptible=True)
                return  # agent is going to restart

        if not self.initialized:
            # Measuring the boot time is best effort.  Catching Exception
            # (not a bare except) keeps SystemExit and KeyboardInterrupt
            # from being swallowed.
            try:
                self.measure_boot_time()
            except Exception:
                logger.exception('Unhandled error in measure_boot_time()')
            self.instance._cleanup(parent_activity=activity)
            self.instance.password_reset(
                parent_activity=activity, password=self.instance.pw)
            self.instance.install_keys(parent_activity=activity)
            self.instance._set_time(parent_activity=activity)
            self.instance._set_hostname(parent_activity=activity)

    @register_operation
    class CleanupOperation(SubOperationMixin, RemoteAgentOperation):
        """Sub-operation bound to ``agent_tasks.cleanup``."""
        id = '_cleanup'
        name = _("cleanup")
        task = agent_tasks.cleanup

    @register_operation
    class SetTimeOperation(SubOperationMixin, RemoteAgentOperation):
        """Sub-operation bound to ``agent_tasks.set_time``."""
        id = '_set_time'
        name = _("set time")
        task = agent_tasks.set_time

        def _get_remote_args(self, **kwargs):
            """Append the current ``time.time()`` to the inherited args."""
            cls = AgentStartedOperation.SetTimeOperation
            return (super(cls, self)._get_remote_args(**kwargs) +
                    [time.time()])

    @register_operation
    class SetHostnameOperation(SubOperationMixin, RemoteAgentOperation):
        """Sub-operation bound to ``agent_tasks.set_hostname``."""
        id = '_set_hostname'
        name = _("set hostname")
        task = agent_tasks.set_hostname

        def _get_remote_args(self, **kwargs):
            """Append the instance's short hostname to the inherited args."""
            cls = AgentStartedOperation.SetHostnameOperation
            return (super(cls, self)._get_remote_args(**kwargs) +
                    [self.instance.short_hostname])

    @register_operation
    class RestartNetworkingOperation(SubOperationMixin, RemoteAgentOperation):
        """Sub-operation bound to ``agent_tasks.restart_networking``."""
        id = '_restart_networking'
        name = _("restart networking")
        task = agent_tasks.restart_networking

    @register_operation
    class ChangeIpOperation(SubOperationMixin, RemoteAgentOperation):
        """Sub-operation bound to ``agent_tasks.change_ip``."""
        id = '_change_ip'
        name = _("change ip")
        task = agent_tasks.change_ip

        def _get_remote_args(self, **kwargs):
            """Append the per-MAC network configs and the rdns IP setting."""
            hosts = Host.objects.filter(interface__instance=self.instance)
            interfaces = {str(host.mac): host.get_network_config()
                          for host in hosts}
            cls = AgentStartedOperation.ChangeIpOperation
            return (super(cls, self)._get_remote_args(**kwargs) +
                    [interfaces, settings.FIREWALL_SETTINGS['rdns_ip']])
Bach Dániel committed
1584 1585 1586 1587 1588 1589 1590 1591 1592 1593 1594 1595 1596 1597 1598 1599 1600 1601 1602 1603 1604 1605 1606 1607 1608 1609 1610 1611 1612 1613 1614 1615 1616 1617 1618 1619 1620 1621 1622 1623 1624 1625 1626 1627 1628 1629 1630 1631 1632 1633 1634 1635 1636 1637 1638 1639 1640 1641 1642 1643 1644 1645 1646 1647 1648 1649 1650 1651 1652 1653 1654 1655 1656 1657 1658 1659 1660 1661 1662 1663 1664 1665 1666 1667 1668 1669 1670 1671 1672 1673 1674 1675


@register_operation
class UpdateAgentOperation(RemoteAgentOperation):
    """Upload the agent bundle for ``settings.AGENT_VERSION`` to an instance.

    The bundle is a gzip-compressed tar of the platform's agent directory
    below ``settings.AGENT_DIR`` plus a generated ``version.txt``, encoded
    as base64 text without newlines.  It is sent to the agent in pieces of
    at most 1 MiB and then applied with a single ``update`` task.
    """
    id = 'update_agent'
    name = _("update agent")
    acl_level = "owner"
    required_perms = ()

    def get_activity_name(self, kwargs):
        """Return the readable activity name with the target version."""
        return create_readable(
            ugettext_noop('update agent to %(version)s'),
            version=settings.AGENT_VERSION)

    @staticmethod
    def _create_agent_tar(dirname, mode, tar_filter=None):
        """Build the base64 text of a gzipped tar of one agent directory.

        :param dirname: directory name below ``settings.AGENT_DIR``
        :param mode: ``TarFile.open`` write mode (``'w:gz'`` or ``'w|gz'``)
        :param tar_filter: optional filter callable for ``TarFile.add``
        :return: base64 encoded archive with every newline removed
        """
        buf = StringIO()
        agent_path = os.path.join(settings.AGENT_DIR, dirname)
        with TarFile.open(fileobj=buf, mode=mode) as tar:
            tar.add(agent_path, arcname='.', filter=tar_filter)

            version_fileobj = StringIO(settings.AGENT_VERSION)
            version_info = TarInfo(name='version.txt')
            # addfile() reads exactly ``size`` bytes, so it has to be set
            version_info.size = len(version_fileobj.buf)
            tar.addfile(version_info, version_fileobj)

        # the archive is only complete once the ``with`` block closed it
        return encodestring(buf.getvalue()).replace('\n', '')

    @staticmethod
    def create_linux_tar():
        """Return the base64 encoded Linux agent bundle.

        Members whose archive name starts with ``./.``, ``./misc`` or
        ``./windows`` are left out of the archive.
        """
        ignored = ('./.', './misc', './windows')

        def exclude(tarinfo):
            # TarFile.add() skips a member when its filter returns None
            return None if tarinfo.name.startswith(ignored) else tarinfo

        return UpdateAgentOperation._create_agent_tar(
            "agent-linux", 'w:gz', exclude)

    @staticmethod
    def create_windows_tar():
        """Return the base64 encoded Windows agent bundle.

        Unlike the Linux bundle nothing is filtered out and the archive is
        opened with the ``'w|gz'`` mode instead of ``'w:gz'``.
        """
        return UpdateAgentOperation._create_agent_tar("agent-win", 'w|gz')

    def _operation(self, user, activity, agent_system):
        """Send the agent bundle matching ``agent_system`` to the instance.

        :param user: not used by this method
        :param activity: not used by this method
        :param agent_system: ``"Windows"`` or ``"Linux"``; any other value
                             selects the legacy single-task update
        :return: the result of the legacy update task, otherwise ``None``
        """
        queue = self._get_remote_queue()
        instance = self.instance
        if agent_system == "Windows":
            # NOTE(review): takes whichever entry os.listdir() lists first;
            # presumably agent-win holds a single executable -- confirm.
            executable = os.listdir(
                os.path.join(settings.AGENT_DIR, "agent-win"))[0]
            data = self.create_windows_tar()
        elif agent_system == "Linux":
            executable = ""
            data = self.create_linux_tar()
        else:
            # Legacy update method: the whole Linux bundle in one task
            return agent_tasks.update_legacy.apply_async(
                queue=queue,
                args=(instance.vm_name, self.create_linux_tar())
            ).get(timeout=60)

        # the checksum covers the base64 text that is actually transferred
        checksum = md5(data).hexdigest()
        chunk_size = 1024 * 1024
        filename = settings.AGENT_VERSION + ".tar"
        offsets = range(0, len(data), chunk_size)
        for chunk_number, offset in enumerate(offsets):
            # each piece is sent only after the previous task has returned
            agent_tasks.append.apply_async(
                queue=queue,
                args=(instance.vm_name, data[offset:offset + chunk_size],
                      filename, chunk_number)).get(timeout=60)

        # all pieces are sent (none for empty data); apply the upload
        agent_tasks.update.apply_async(
            queue=queue,
            args=(instance.vm_name, filename, executable, checksum)
        ).get(timeout=60)


@register_operation
class MountStoreOperation(EnsureAgentMixin, InstanceOperation):
    """Ask the agent of an instance to mount the calling user's store."""
    id = 'mount_store'
    name = _("mount store")
    description = _(
        "This operation attaches your personal file store. Other users who "
        "have access to this machine can see these files as well."
    )
    acl_level = "owner"
    required_perms = ()

    def check_auth(self, user):
        """Run the inherited checks, then require that ``user`` has a store.

        :raises PermissionDenied: when ``Store(user)`` raises
                                  ``NoStoreException``
        """
        super(MountStoreOperation, self).check_auth(user)
        try:
            Store(user)
        except NoStoreException:
            # no store for this user: do not show the button at all
            raise PermissionDenied()

    def _operation(self, user):
        """Submit the ``mount_store`` agent task with the store credentials.

        The task is only queued; its result is not waited for.
        """
        instance = self.instance
        agent_queue = self.instance.get_remote_queue_name("agent")
        store_host = urlsplit(settings.STORE_URL).hostname
        store_user = Store(user).username
        smb_password = user.profile.smb_password
        task_args = (instance.vm_name, store_host, store_user, smb_password)
        agent_tasks.mount_store.apply_async(queue=agent_queue, args=task_args)
1701 1702 1703 1704 1705 1706


class AbstractDiskOperation(SubOperationMixin, RemoteInstanceOperation):
    """Common base of the disk attach/detach sub-operations."""
    required_perms = ()

    def _get_remote_args(self, disk, **kwargs):
        """Return the inherited remote args plus the disk description.

        ``disk`` is consumed here and not passed on; its
        ``get_vmdisk_desc()`` value becomes the last argument.
        """
        parent = super(AbstractDiskOperation, self)
        inherited = parent._get_remote_args(**kwargs)
        return inherited + [disk.get_vmdisk_desc()]
1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724 1725 1726 1727 1728 1729 1730 1731 1732 1733 1734 1735 1736 1737 1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 1750 1751 1752 1753 1754 1755 1756 1757 1758


@register_operation
class AttachDisk(AbstractDiskOperation):
    """Disk sub-operation bound to ``vm_tasks.attach_disk``.

    Remote arguments come from ``AbstractDiskOperation._get_remote_args``,
    which appends the disk's ``get_vmdisk_desc()`` value.
    """
    id = "_attach_disk"
    name = _("attach disk")
    task = vm_tasks.attach_disk


class DetachMixin(object):
    """Mixin that tolerates a "not found" error raised while detaching."""

    def _operation(self, activity, **kwargs):
        """Run the next ``_operation`` in the MRO, tolerating "not found".

        ``activity`` is not forwarded.  An exception that has a
        ``libvirtError`` attribute and whose text contains "not found" is
        swallowed and reported through ``activity.result``; any other
        exception is re-raised unchanged.  The wrapped call's return value
        is discarded.
        """
        try:
            super(DetachMixin, self)._operation(**kwargs)
        except Exception as error:
            # the text is only inspected when the attribute check passes
            missing = (hasattr(error, "libvirtError") and
                       "not found" in unicode(error))
            if not missing:
                raise
            activity.result = create_readable(
                ugettext_noop("Resource was not found."),
                ugettext_noop("Resource was not found. %(exception)s"),
                exception=unicode(error))


@register_operation
class DetachDisk(DetachMixin, AbstractDiskOperation):
    """Disk sub-operation bound to ``vm_tasks.detach_disk``.

    ``DetachMixin`` comes first in the bases, so its ``_operation`` wraps
    the inherited one and reports a "not found" failure through the
    activity result instead of raising.
    """
    id = "_detach_disk"
    name = _("detach disk")
    task = vm_tasks.detach_disk


class AbstractNetworkOperation(SubOperationMixin, RemoteInstanceOperation):
    """Common base of the network attach/detach sub-operations."""
    required_perms = ()

    def _get_remote_args(self, interface, **kwargs):
        """Return the inherited remote args plus the interface description.

        ``interface`` is consumed here and not passed on; its
        ``get_vmnetwork_desc()`` value becomes the last argument.
        """
        parent = super(AbstractNetworkOperation, self)
        inherited = parent._get_remote_args(**kwargs)
        return inherited + [interface.get_vmnetwork_desc()]


@register_operation
class AttachNetwork(AbstractNetworkOperation):
    """Network sub-operation bound to ``vm_tasks.attach_network``.

    Remote arguments come from
    ``AbstractNetworkOperation._get_remote_args``, which appends the
    interface's ``get_vmnetwork_desc()`` value.
    """
    id = "_attach_network"
    name = _("attach network")
    task = vm_tasks.attach_network


@register_operation
class DetachNetwork(DetachMixin, AbstractNetworkOperation):
    """Network sub-operation bound to ``vm_tasks.detach_network``.

    ``DetachMixin`` comes first in the bases, so its ``_operation`` wraps
    the inherited one and reports a "not found" failure through the
    activity result instead of raising.
    """
    id = "_detach_network"
    name = _("detach network")
    task = vm_tasks.detach_network