# python3
# Copyright 2019 The gVisor Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""A machine producer which produces machine objects using `gcloud`.

Machine producers produce valid harness.Machine objects which are backed by
real machines. This producer produces those machines on the given user's GCP
account using the `gcloud` tool.

GCloudProducer creates instances on the given GCP account named like
`machine-XXXXXXXX-XXXX-XXXX-XXXX-XXXXXXXXXXXX` (a random uuid4 suffix), so name
collisions with existing user instances shouldn't happen.

  Typical usage example:

  producer = GCloudProducer(args)
  machines = producer.get_machines(NUM_MACHINES)
  # run stuff on machines with machines[i].run(CMD)
  producer.release_machines(machines)
"""
import datetime
import json
import subprocess
import threading
from typing import List, Dict, Any, Optional
import uuid

from benchmarks.harness import machine
from benchmarks.harness.machine_producers import gcloud_mock_recorder
from benchmarks.harness.machine_producers import machine_producer


class GCloudProducer(machine_producer.MachineProducer):
  """Implementation of MachineProducer backed by GCP.

  Produces Machine objects backed by GCP instances.

  Attributes:
    image: image name as a string.
    zone: name of a valid GCP zone.
    machine_type: GCP machine type to create (e.g. n1-standard-4).
    installers: list of installers to run post-boot.
    ssh_key_file: path to a valid ssh private key. See the README on valid
      ssh keys.
    ssh_user: username for the ssh key.
    ssh_password: password for the ssh key.
    internal: if true, use the internal IPs of instances. Used when bm-tools
      is running on a GCP VM and a firewall restricts access to external IPs.
    mock: a mock printer which will print mock data if required. Mock data is
      recorded output from subprocess calls (returncode, stdout, args).
    condition: mutex for this class around machine creation and deletion.
  """

  def __init__(self,
               image: str,
               zone: str,
               machine_type: str,
               installers: List[str],
               ssh_key_file: str,
               ssh_user: str,
               ssh_password: str,
               internal: bool,
               mock: Optional[gcloud_mock_recorder.MockPrinter] = None):
    self.image = image
    self.zone = zone
    self.machine_type = machine_type
    self.installers = installers
    self.ssh_key_file = ssh_key_file
    self.ssh_user = ssh_user
    self.ssh_password = ssh_password
    self.internal = internal
    self.mock = mock
    self.condition = threading.Condition()

  def get_machines(self, num_machines: int) -> List[machine.Machine]:
    """Returns requested number of machines backed by GCP instances."""
    if num_machines <= 0:
      raise ValueError(
          "Cannot ask for {num} machines!".format(num=num_machines))
    with self.condition:
      names = self._get_unique_names(num_machines)
      instances = self._build_instances(names)
    self._add_ssh_key_to_instances(names)
    machines = self._machines_from_instances(instances)

    # Install all bits in lock-step.
    #
    # This will perform parallel installations for however many machines we
    # have, but it's easy to track errors because if installing (a, b, c), we
    # won't install "c" until "b" is installed on all machines.
    for installer in self.installers:
      threads = [None] * len(machines)
      results = [False] * len(machines)
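      # machines[i].install is expected to record its success in results[i];
      # any False entry left after the joins below means that install failed.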
      for i in range(len(machines)):
        threads[i] = threading.Thread(
            target=machines[i].install, args=(installer, results, i))
        threads[i].start()
      for thread in threads:
        thread.join()
      for result in results:
        if not result:
          raise NotImplementedError(
              "Installers failed on at least one machine!")

    # Add this user to each machine's docker group.
    for m in machines:
      m.run("sudo setfacl -m user:$USER:rw /var/run/docker.sock")

    return machines

  def release_machines(self, machine_list: List[machine.Machine]):
    """Releases the requested number of machines, deleting the instances."""
    if not machine_list:
      return
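    # Fire the delete and return immediately (detach=True); deletion can take
    # a while and callers don't need the result.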
    cmd = "gcloud compute instances delete --quiet".split(" ")
    names = [str(m) for m in machine_list]
    cmd.extend(names)
    cmd.append("--zone={zone}".format(zone=self.zone))
    self._run_command(cmd, detach=True)

  def _machines_from_instances(
      self, instances: List[Dict[str, Any]]) -> List[machine.Machine]:
    """Creates Machine Objects from json data describing created instances."""
    machines = []
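    # Each instance dict is the JSON gcloud printed for a created instance;
    # its first network interface carries both the internal IP and the NAT'd
    # external IP.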
    for instance in instances:
      name = instance["name"]
      external = instance["networkInterfaces"][0]["accessConfigs"][0]["natIP"]
      internal = instance["networkInterfaces"][0]["networkIP"]
      kwargs = {
          "hostname": internal if self.internal else external,
          "key_path": self.ssh_key_file,
          "username": self.ssh_user,
          "key_password": self.ssh_password
      }
      machines.append(machine.RemoteMachine(name=name, **kwargs))
    return machines

  def _get_unique_names(self, num_names: int) -> List[str]:
    """Returns num_names unique names based on random uuid4 suffixes."""
    return ["machine-" + str(uuid.uuid4()) for _ in range(num_names)]

  def _build_instances(self, names: List[str]) -> List[Dict[str, Any]]:
    """Creates instances using gcloud command.

    Runs the command `gcloud compute instances create` and returns json data
    on created instances on success. Creates len(names) instances, one for each
    name.

    Args:
      names: list of names of instances to create.

    Returns:
      List of json data describing created machines.
    """
    if not names:
      raise ValueError(
          "_build_instances cannot create instances without names.")
    cmd = "gcloud compute instances create".split(" ")
    cmd.extend(names)
    cmd.append("--image=" + self.image)
    cmd.append("--zone=" + self.zone)
    cmd.append("--machine-type=" + self.machine_type)
    res = self._run_command(cmd)
    data = res.stdout
    data = str(data, "utf-8") if isinstance(data, (bytes, bytearray)) else data
    return json.loads(data)

  def _add_ssh_key_to_instances(self, names: List[str]) -> None:
    """Adds ssh key to instances by calling gcloud ssh command.

    Runs the command `gcloud compute ssh instance_name` on list of images by
    name. Tries to ssh into given instance.

    Args:
      names: list of machine names to which to add the ssh-key
        self.ssh_key_file.

    Raises:
      subprocess.CalledProcessError: when underlying subprocess call returns an
      error other than 255 (Connection closed by remote host).
      TimeoutError: when 3 unsuccessful tries to ssh into the host return 255.
    """
    for name in names:
      cmd = "gcloud compute ssh {user}@{name}".format(
          user=self.ssh_user, name=name).split(" ")
      if self.internal:
        cmd.append("--internal-ip")
      cmd.append("--ssh-key-file={key}".format(key=self.ssh_key_file))
      cmd.append("--zone={zone}".format(zone=self.zone))
      cmd.append("--command=uname")
      timeout = datetime.timedelta(seconds=5 * 60)
      start = datetime.datetime.now()
      while datetime.datetime.now() <= timeout + start:
        try:
          self._run_command(cmd)
          break
        except subprocess.CalledProcessError:
          if datetime.datetime.now() > timeout + start:
            raise TimeoutError(
                "Could not SSH into instance after 5 min: {name}".format(
                    name=name))

  def _run_command(
      self,
      cmd: List[str],
      detach: bool = False) -> Optional[subprocess.CompletedProcess]:
    """Runs command as a subprocess.

    Runs command as subprocess and returns the result.
    If this has a mock recorder, use the record method to record the subprocess
    call.

    Args:
      cmd: command to be run as a list of strings.
      detach: if True, run the child process and don't wait for it to return.

    Returns:
      Completed process object to be parsed by caller or None if detach=True.

    Raises:
      CalledProcessError: if subprocess.run returns an error.
    """
    cmd = cmd + ["--format=json"]
    if detach:
      p = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
      if self.mock:
        out, _ = p.communicate()
        self.mock.record(
            subprocess.CompletedProcess(
                returncode=p.returncode, stdout=out, args=p.args))
      return

    res = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    if self.mock:
      self.mock.record(res)
    if res.returncode != 0:
      raise subprocess.CalledProcessError(
          cmd=" ".join(res.args),
          output=res.stdout,
          stderr=res.stderr,
          returncode=res.returncode)
    return res