// Copyright 2016-2017 VMware, Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

package exec

import (
	"context"
	"errors"
	"fmt"
	"strconv"
	"time"

	"golang.org/x/crypto/ssh"

	"github.com/vmware/govmomi/guest"
	"github.com/vmware/govmomi/task"
	"github.com/vmware/govmomi/vim25/mo"
	"github.com/vmware/govmomi/vim25/types"
	"github.com/vmware/vic/lib/config/executor"
	"github.com/vmware/vic/lib/migration"
	"github.com/vmware/vic/lib/tether/shared"
	"github.com/vmware/vic/pkg/trace"
	"github.com/vmware/vic/pkg/vsphere/extraconfig"
	"github.com/vmware/vic/pkg/vsphere/extraconfig/vmomi"
	"github.com/vmware/vic/pkg/vsphere/tasks"
	"github.com/vmware/vic/pkg/vsphere/vm"
)
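
// extraconfigIDKey is the guestinfo key at which the container ID
// (ExecutorConfigCommon.ID) is stored; refreshes assert its presence before
// decoding the rest of the configuration.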
var extraconfigIDKey = extraconfig.CalculateKey(executor.ExecutorConfig{}, "ExecutorConfigCommon.ID", "")

// NotYetExistError is returned when a call that requires a VM to exist is made
type NotYetExistError struct {
ID string
}

func (e NotYetExistError) Error() string {
return fmt.Sprintf("%s is not completely created", e.ID)
}

// containerBase holds fields common between Handle and Container. The fields and
// methods in containerBase should not require locking as their primary use is:
// a. for read-only reference when used in Container
// b. single use/no concurrent modification when used in Handle
type containerBase struct {
ExecConfig *executor.ExecutorConfig
	// Migrated indicates, for in-memory migration, whether an execConfig is viable for a commit phase
	Migrated bool
	// MigrationError records any error encountered during data migration; some operations might fail
	// because we cannot extract the whole container configuration
	MigrationError error
DataVersion int
// original - can be pointers so long as refreshes
// use different instances of the structures
Config *types.VirtualMachineConfigInfo
Runtime *types.VirtualMachineRuntimeInfo
// doesn't change so can be copied here
vm *vm.VirtualMachine
}
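
// newBase constructs a containerBase from the supplied VM and its current
// config and runtime info, decoding the executor config from extraconfig and
// applying any pending data migration to it.
//
// A minimal sketch of intended use (hypothetical caller, names assumed):
//
//	base := newBase(vm, o.Config, &o.Runtime)
//	op.Debugf("loaded container %s", base)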
func newBase(vm *vm.VirtualMachine, c *types.VirtualMachineConfigInfo, r *types.VirtualMachineRuntimeInfo) *containerBase {
base := &containerBase{
ExecConfig: &executor.ExecutorConfig{},
Config: c,
Runtime: r,
vm: vm,
}
// construct a working copy of the exec config
if c != nil && c.ExtraConfig != nil {
var migratedConf map[string]string
containerExecKeyValues := vmomi.OptionValueMap(c.ExtraConfig)
// #nosec: Errors unhandled.
base.DataVersion, _ = migration.ContainerDataVersion(containerExecKeyValues)
migratedConf, base.Migrated, base.MigrationError = migration.MigrateContainerConfig(containerExecKeyValues)
extraconfig.Decode(extraconfig.MapSource(migratedConf), base.ExecConfig)
}
return base
}

// String returns the string representation of containerBase: the container ID
func (c *containerBase) String() string {
return c.ExecConfig.ID
}

// VMReference provides the vSphere VM managed object reference; the zero value
// is returned if the VM does not yet exist
func (c *containerBase) VMReference() types.ManagedObjectReference {
var moref types.ManagedObjectReference
if c.vm != nil {
moref = c.vm.Reference()
}
return moref
}

// unlocked refresh of container state
func (c *containerBase) refresh(op trace.Operation) error {
base, err := c.updates(op)
if err != nil {
op.Errorf("Update: unable to update container %s: %s", c, err)
return err
}
// copy over the new state
*c = *base
return nil
}
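
// GetContainerVM returns the underlying VirtualMachine; this may be nil if the
// containerVM has not yet been created.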
func (c *containerBase) GetContainerVM() *vm.VirtualMachine {
return c.vm
}

// updates acquires updates from the infrastructure without holding a lock
func (c *containerBase) updates(op trace.Operation) (*containerBase, error) {
defer trace.End(trace.Begin(c.ExecConfig.ID, op))
var o mo.VirtualMachine
// make sure we have vm
if c.vm == nil {
return nil, NotYetExistError{c.ExecConfig.ID}
}
if c.Config != nil {
op.Debugf("Update: for %s, refreshing from change version %s", c, c.Config.ChangeVersion)
}
if err := c.vm.Properties(op, c.vm.Reference(), []string{"config", "runtime"}, &o); err != nil {
return nil, err
}
base := &containerBase{
vm: c.vm,
Config: o.Config,
Runtime: &o.Runtime,
ExecConfig: &executor.ExecutorConfig{},
}
// Get the ExtraConfig
var migratedConf map[string]string
containerExecKeyValues := vmomi.OptionValueMap(o.Config.ExtraConfig)
if containerExecKeyValues[extraconfigIDKey] == "" {
return nil, fmt.Errorf("Update: change version %s failed assertion extraconfig id != nil", o.Config.ChangeVersion)
}
op.Debugf("Update: for %s, change version %s, extraconfig id: %+v", c, o.Config.ChangeVersion, containerExecKeyValues[extraconfigIDKey])
// #nosec: Errors unhandled.
base.DataVersion, _ = migration.ContainerDataVersion(containerExecKeyValues)
migratedConf, base.Migrated, base.MigrationError = migration.MigrateContainerConfig(containerExecKeyValues)
extraconfig.Decode(extraconfig.MapSource(migratedConf), base.ExecConfig)
return base, nil
}

// determine if the containerVM has started - this could pick up stale data in the started field for an out-of-band
// power change such as HA or user intervention where we have not had an opportunity to reset the entry.
func (c *containerBase) cleanStart(op trace.Operation) bool {
if len(c.ExecConfig.Sessions) == 0 {
op.Warnf("Container %c has no sessions stored in in-memory config", c.ExecConfig.ID)
return true
}
for _, session := range c.ExecConfig.Sessions {
if session.Started != "true" {
return false
}
}
return true
}

// determine if the containerVM has ever been started - we use the session started time for this as we have no
// cVM global record to indicate the fact.
func (c *containerBase) hasStarted(op trace.Operation) bool {
if len(c.ExecConfig.Sessions) == 0 {
op.Warnf("Container %c has no sessions stored in in-memory config", c.ExecConfig.ID)
return true
}
for _, session := range c.ExecConfig.Sessions {
if session.Detail.StartTime != 0 || session.Detail.StopTime != 0 {
return true
}
}
return false
}

// State returns the state of the containerVM based on data in the handle, with no refresh
func (c *containerBase) State(op trace.Operation) State {
powerState := c.Runtime.PowerState
state := StateUnknown
switch powerState {
case types.VirtualMachinePowerStatePoweredOn:
if c.cleanStart(op) {
state = StateRunning
} else {
// could be stopping but this is a better guess and is still transient
state = StateStarting
}
case types.VirtualMachinePowerStatePoweredOff:
if c.hasStarted(op) {
state = StateStopped
} else {
state = StateCreated
}
case types.VirtualMachinePowerStateSuspended:
state = StateSuspended
}
return state
}
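
// ReloadConfig asks the tether in the guest to reload its configuration via a
// guest program invocation.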
func (c *containerBase) ReloadConfig(op trace.Operation) error {
defer trace.End(trace.Begin(c.ExecConfig.ID, op))
return c.startGuestProgram(op, shared.GuestActionReload, "")
}

// WaitForExec waits for the exec'ed task to set its started field, or for the timeout to expire
func (c *containerBase) WaitForExec(op trace.Operation, id string) error {
defer trace.End(trace.Begin(id, op))
return c.waitForExec(op, id)
}

// WaitForSession waits for the non-exec'ed task to set its started field, or for the timeout to expire
func (c *containerBase) WaitForSession(ctx context.Context, id string) error {
defer trace.End(trace.Begin(id, ctx))
return c.waitForSession(ctx, id)
}
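
// startGuestProgram invokes the named tether action in the guest via the
// vSphere guest operations ProcessManager, authenticating with the container
// ID as the username, e.g. a hypothetical invocation:
//
//	err := c.startGuestProgram(op, shared.GuestActionKill, string(ssh.SIGTERM))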
func (c *containerBase) startGuestProgram(op trace.Operation, name string, args string) error {
// make sure we have vm
if c.vm == nil {
return NotYetExistError{c.ExecConfig.ID}
}
defer trace.End(trace.Begin(c.ExecConfig.ID+":"+name, op))
o := guest.NewOperationsManager(c.vm.Client.Client, c.vm.Reference())
m, err := o.ProcessManager(op)
if err != nil {
return err
}
spec := types.GuestProgramSpec{
ProgramPath: name,
Arguments: args,
}
auth := types.NamePasswordAuthentication{
Username: c.ExecConfig.ID,
}
_, err = m.StartProgram(op, &auth, &spec)
if tasks.IsInvalidPowerStateError(err) {
return err
}
if tasks.IsInvalidStateError(err) {
// we special case this for now as we _presume_ that it's either a conflict
// of reconfigure with guest operation, or a conflict with another guest operation.
// These cases do not return a TaskInProgress or concurrent modification.
op.Debugf("Transforming invalid state error into concurrent access for start guest program call: %#v", err)
return ConcurrentAccessError{errors.New("invalid state from start guest program")}
}
return err
}
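
// start powers on the containerVM.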
func (c *containerBase) start(op trace.Operation) error {
defer trace.End(trace.Begin(c.ExecConfig.ID, op))
// make sure we have vm
if c.vm == nil {
return NotYetExistError{c.ExecConfig.ID}
}
return c.vm.PowerOn(op)
}
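
// stop attempts a graceful shutdown of the containerVM via guest signals,
// falling back to a hard power off if that fails.
//
// A hypothetical caller (waitTime is in seconds):
//
//	wait := int32(30)
//	if err := c.stop(op, &wait); err != nil {
//		op.Errorf("stop of %s failed: %s", c, err)
//	}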
func (c *containerBase) stop(op trace.Operation, waitTime *int32) error {
// make sure we have vm
if c.vm == nil {
return NotYetExistError{c.ExecConfig.ID}
}
	// attempt a graceful shutdown first; if it fails we fall back to a hard power off below
	err := c.shutdown(op, waitTime)
if err == nil {
return nil
}
op.Warnf("stopping %s via hard power off due to: %s", c, err.Error())
return c.poweroff(op)
}
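
// kill sends SIGKILL to the container process via the tether, then waits for
// the VM to power off, resorting to a hard power off if it does not.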
func (c *containerBase) kill(op trace.Operation) error {
// make sure we have vm
if c.vm == nil {
return NotYetExistError{c.ExecConfig.ID}
}
wait := 10 * time.Second // default
timeout, cancel := trace.WithTimeout(&op, wait, "kill")
defer cancel()
sig := string(ssh.SIGKILL)
timeout.Infof("sending kill -%s %s", sig, c)
err := c.startGuestProgram(timeout, shared.GuestActionKill, sig)
if err == nil && timeout.Err() != nil {
timeout.Warnf("timeout (%s) waiting for %s to power off via SIG%s", wait, c, sig)
}
if err != nil {
if tasks.IsAlreadyPoweredOffError(err) {
return nil
}
timeout.Warnf("killing %s attempt resulted in: %s", c, err.Error())
}
// Even if startGuestProgram failed above, it may actually have executed. If the container came up and then
// we kill it before VC gets a chance to detect the toolbox, vSphere can execute the kill but report an
// error 3016 indicating the guest toolbox wasn't found. If we then try to poweroff, it may throw vSphere
// into an invalid transition and will need to recover. If we try to grab properties at this time, the
// power state may be incorrect. We work around this by waiting on the power state, regardless of error
// from startGuestProgram. https://github.com/vmware/vic/issues/5803
timeout.Infof("waiting %s for %s to power off", wait, c)
err = c.vm.WaitForPowerState(timeout, types.VirtualMachinePowerStatePoweredOff)
if err == nil {
return nil // VM has powered off
}
timeout.Warnf("killing %s via hard power off", c)
// stop wait time is not applied for the hard kill
return c.poweroff(op)
}
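
// shutdown escalates from the session's stop signal (SIGTERM by default) to a
// group SIGKILL, waiting up to waitTime (default 10s) after each attempt for
// the VM to power off.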
func (c *containerBase) shutdown(op trace.Operation, waitTime *int32) error {
// make sure we have vm
if c.vm == nil {
return NotYetExistError{c.ExecConfig.ID}
}
wait := 10 * time.Second // default
if waitTime != nil && *waitTime > 0 {
wait = time.Duration(*waitTime) * time.Second
}
cs := c.ExecConfig.Sessions[c.ExecConfig.ID]
stopSignal := cs.StopSignal
if stopSignal == "" {
stopSignal = string(ssh.SIGTERM)
}
actionSignals := []struct {
action string
sig string
}{
{shared.GuestActionKill, stopSignal},
{shared.GuestActionGroupKill, string(ssh.SIGKILL)},
}
var killed bool
for _, actionSignal := range actionSignals {
msg := fmt.Sprintf("sending %s -%s %s", actionSignal.action, actionSignal.sig, c)
op.Infof(msg)
timeout, cancel := trace.WithTimeout(&op, wait, "shutdown")
defer cancel()
err := c.startGuestProgram(timeout, actionSignal.action, actionSignal.sig)
if err != nil {
// Just warn and proceed to waiting for power state per issue https://github.com/vmware/vic/issues/5803
// Description above in function kill()
timeout.Warnf("%s: %s", msg, err)
			// If the error tells us "The attempted operation cannot be performed in the current state (Powered off)"
			// (InvalidPowerState), we can avoid a hard poweroff (issues #6236 and #6252). Here we wait for the power
			// state to change instead of returning immediately, to avoid excess vSphere queries.
if tasks.IsAlreadyPoweredOffError(err) {
killed = true
}
}
timeout.Infof("waiting %s for %s to power off", wait, c)
err = c.vm.WaitForPowerState(timeout, types.VirtualMachinePowerStatePoweredOff)
if err == nil {
return nil // VM has powered off
}
if timeout.Err() == nil {
return err // error other than timeout
}
timeout.Warnf("timeout (%s) waiting for %s to power off via SIG%s", wait, c, actionSignal.sig)
if killed {
return nil
}
}
return fmt.Errorf("failed to shutdown %s via kill signals %s and %s", c, stopSignal, string(ssh.SIGKILL))
}
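
// poweroff performs a hard power off of the VM, tolerating faults that
// indicate the VM is already powered off or is concurrently shutting down.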
func (c *containerBase) poweroff(op trace.Operation) error {
// make sure we have vm
if c.vm == nil {
return NotYetExistError{c.ExecConfig.ID}
}
_, err := c.vm.WaitForResult(op, func(op context.Context) (tasks.Task, error) {
return c.vm.PowerOff(op)
})
if err != nil {
		// It is possible the VM has finally shut down in the meantime; ignore the error in that case
if terr, ok := err.(task.Error); ok {
switch terr := terr.Fault().(type) {
case *types.InvalidPowerState:
if terr.ExistingState == types.VirtualMachinePowerStatePoweredOff {
op.Warnf("power off %s task skipped (state was already %s)", c, terr.ExistingState)
return nil
}
op.Warnf("invalid power state during power off: %s", terr.ExistingState)
case *types.GenericVmConfigFault:
// Check if the poweroff task was canceled due to a concurrent guest shutdown
if len(terr.FaultMessage) > 0 {
k := terr.FaultMessage[0].Key
if k == vmNotSuspendedKey || k == vmPoweringOffKey {
op.Infof("power off %s task skipped due to guest shutdown", c)
return nil
}
}
op.Warnf("generic vm config fault during power off: %#v", terr)
default:
op.Warnf("hard power off failed due to: %#v", terr)
}
}
return err
}
return nil
}
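
// waitForPowerState waits up to max for the VM to reach the requested power
// state; the returned bool reports whether the failure was due to the timeout
// expiring.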
func (c *containerBase) waitForPowerState(ctx context.Context, max time.Duration, state types.VirtualMachinePowerState) (bool, error) {
defer trace.End(trace.Begin(c.ExecConfig.ID, ctx))
timeout, cancel := context.WithTimeout(ctx, max)
defer cancel()
err := c.vm.WaitForPowerState(timeout, state)
if err != nil {
return timeout.Err() != nil, err
}
return false, nil
}

func (c *containerBase) waitForSession(ctx context.Context, id string) error {
defer trace.End(trace.Begin(id, ctx))
// guestinfo key that we want to wait for
key := extraconfig.CalculateKey(c.ExecConfig, fmt.Sprintf("Sessions.%s.Started", id), "")
return c.waitFor(ctx, key)
}

// waitForExec waits for any kind of change in the state of a task, then returns, signifying that a
// refreshed handle must be obtained. Users can then inspect that handle to examine and act on the
// changes in the task.
func (c *containerBase) waitForExec(op trace.Operation, id string) error {
defer trace.End(trace.Begin(id, op))
// guestinfo keys that we want to wait for
startedKey := extraconfig.CalculateKey(c.ExecConfig, fmt.Sprintf("Execs.%s.Started", id), "")
startKey := extraconfig.CalculateKey(c.ExecConfig, fmt.Sprintf("Execs.%s.Detail.StartTime", id), "")
stopKey := extraconfig.CalculateKey(c.ExecConfig, fmt.Sprintf("Execs.%s.Detail.StopTime", id), "")
// targeted exec
execConf := c.ExecConfig.Execs[id]
// construct key filter for exec state changes
filter := map[string]string{
startedKey: execConf.Started,
startKey: strconv.FormatInt(execConf.Detail.StartTime, 10),
stopKey: strconv.FormatInt(execConf.Detail.StopTime, 10),
}
return c.vm.WaitForKeyChange(op, filter)
}
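
// waitFor blocks until the given extraconfig key is set in the guest, and
// returns an error unless its value is "true".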
func (c *containerBase) waitFor(ctx context.Context, key string) error {
detail, err := c.vm.WaitForKeyInExtraConfig(ctx, key)
if err != nil {
return fmt.Errorf("unable to wait for process launch status: %s", err)
}
if detail != "true" {
return fmt.Errorf("%s", detail)
}
return nil
}