1
0
mirror of https://github.com/rancher/rke.git synced 2025-04-29 03:53:30 +00:00
rke/cmd/etcd.go

262 lines
7.7 KiB
Go
Raw Normal View History

2018-05-09 17:39:19 +00:00
package cmd
import (
"context"
"fmt"
2019-03-01 00:06:45 +00:00
"strings"
2018-05-17 22:27:35 +00:00
"time"
2018-05-09 17:39:19 +00:00
"github.com/rancher/rke/cluster"
"github.com/rancher/rke/hosts"
"github.com/rancher/rke/log"
"github.com/rancher/rke/pki"
2019-03-01 00:06:45 +00:00
v3 "github.com/rancher/types/apis/management.cattle.io/v3"
2018-05-17 22:27:35 +00:00
"github.com/sirupsen/logrus"
2018-05-09 17:39:19 +00:00
"github.com/urfave/cli"
)
// s3Endpoint is the default value of the "s3-endpoint" flag.
const s3Endpoint = "s3.amazonaws.com"
2018-05-09 17:39:19 +00:00
func EtcdCommand() cli.Command {
2018-05-17 22:27:35 +00:00
snapshotFlags := []cli.Flag{
2018-05-09 17:39:19 +00:00
cli.StringFlag{
Name: "name",
Usage: "Specify snapshot name",
2018-05-09 17:39:19 +00:00
},
cli.StringFlag{
Name: "config",
Usage: "Specify an alternate cluster YAML file",
Value: pki.ClusterConfig,
EnvVar: "RKE_CONFIG",
},
cli.BoolFlag{
Name: "s3",
2019-02-21 18:38:25 +00:00
Usage: "Enabled backup to s3",
},
cli.StringFlag{
Name: "s3-endpoint",
Usage: "Specify s3 endpoint url",
Value: s3Endpoint,
},
cli.StringFlag{
Name: "s3-endpoint-ca",
Usage: "Specify a custom CA cert to connect to S3 endpoint",
},
cli.StringFlag{
Name: "access-key",
Usage: "Specify s3 accessKey",
},
cli.StringFlag{
Name: "secret-key",
Usage: "Specify s3 secretKey",
},
cli.StringFlag{
Name: "bucket-name",
Usage: "Specify s3 bucket name",
},
cli.StringFlag{
Name: "region",
Usage: "Specify the s3 bucket location (optional)",
},
2019-07-18 16:43:07 +00:00
cli.StringFlag{
Name: "folder",
Usage: "Specify s3 folder name",
},
2018-05-09 17:39:19 +00:00
}
2018-05-17 22:27:35 +00:00
snapshotFlags = append(snapshotFlags, commonFlags...)
2018-05-09 17:39:19 +00:00
return cli.Command{
Name: "etcd",
2018-05-17 22:27:35 +00:00
Usage: "etcd snapshot save/restore operations in k8s cluster",
2018-05-09 17:39:19 +00:00
Subcommands: []cli.Command{
{
Name: "snapshot-save",
Usage: "Take snapshot on all etcd hosts",
2018-05-17 22:27:35 +00:00
Flags: snapshotFlags,
Action: SnapshotSaveEtcdHostsFromCli,
2018-05-09 17:39:19 +00:00
},
{
Name: "snapshot-restore",
Usage: "Restore existing snapshot",
2018-05-17 22:27:35 +00:00
Flags: snapshotFlags,
Action: RestoreEtcdSnapshotFromCli,
2018-05-09 17:39:19 +00:00
},
},
}
}
2018-05-17 22:27:35 +00:00
func SnapshotSaveEtcdHosts(
2018-05-09 17:39:19 +00:00
ctx context.Context,
rkeConfig *v3.RancherKubernetesEngineConfig,
dialersOptions hosts.DialersOptions,
flags cluster.ExternalFlags, snapshotName string) error {
2018-05-09 17:39:19 +00:00
log.Infof(ctx, "Starting saving snapshot on etcd hosts")
kubeCluster, err := cluster.InitClusterObject(ctx, rkeConfig, flags)
2018-05-09 17:39:19 +00:00
if err != nil {
return err
}
if err := kubeCluster.SetupDialers(ctx, dialersOptions); err != nil {
return err
}
2018-05-09 17:39:19 +00:00
if err := kubeCluster.TunnelHosts(ctx, flags); err != nil {
2018-05-09 17:39:19 +00:00
return err
}
if err := kubeCluster.SnapshotEtcd(ctx, snapshotName); err != nil {
return err
}
2019-08-21 21:08:30 +00:00
log.Infof(ctx, "Finished saving/uploading snapshot [%s] on all etcd hosts", snapshotName)
2018-05-09 17:39:19 +00:00
return nil
}
2018-05-17 22:27:35 +00:00
func RestoreEtcdSnapshot(
2018-05-09 17:39:19 +00:00
ctx context.Context,
rkeConfig *v3.RancherKubernetesEngineConfig,
dialersOptions hosts.DialersOptions,
flags cluster.ExternalFlags,
data map[string]interface{},
snapshotName string) (string, string, string, string, map[string]pki.CertificatePKI, error) {
var APIURL, caCrt, clientCert, clientKey string
2018-11-24 10:18:24 +00:00
log.Infof(ctx, "Restoring etcd snapshot %s", snapshotName)
2019-02-14 21:00:37 +00:00
kubeCluster, err := cluster.InitClusterObject(ctx, rkeConfig, flags)
2018-11-24 10:18:24 +00:00
if err != nil {
return APIURL, caCrt, clientCert, clientKey, nil, err
2018-11-24 10:18:24 +00:00
}
2019-02-14 21:00:37 +00:00
stateFilePath := cluster.GetStateFilePath(flags.ClusterFilePath, flags.ConfigDir)
rkeFullState, _ := cluster.ReadStateFile(ctx, stateFilePath)
if err := checkLegacyCluster(ctx, kubeCluster, rkeFullState, flags); err != nil {
return APIURL, caCrt, clientCert, clientKey, nil, err
2019-02-14 21:00:37 +00:00
}
2018-11-24 10:18:24 +00:00
rkeFullState.CurrentState = cluster.State{}
if err := rkeFullState.WriteStateFile(ctx, stateFilePath); err != nil {
return APIURL, caCrt, clientCert, clientKey, nil, err
2018-11-24 10:18:24 +00:00
}
if err := kubeCluster.SetupDialers(ctx, dialersOptions); err != nil {
return APIURL, caCrt, clientCert, clientKey, nil, err
}
if err := kubeCluster.TunnelHosts(ctx, flags); err != nil {
return APIURL, caCrt, clientCert, clientKey, nil, err
2018-05-09 17:39:19 +00:00
}
// if we fail after cleanup, we can't find the certs to do the download, we need to redeploy them
if err := kubeCluster.DeployRestoreCerts(ctx, rkeFullState.DesiredState.CertificatesBundle); err != nil {
return APIURL, caCrt, clientCert, clientKey, nil, err
}
2019-01-28 17:17:44 +00:00
// first download and check
if err := kubeCluster.PrepareBackup(ctx, snapshotName); err != nil {
return APIURL, caCrt, clientCert, clientKey, nil, err
2019-01-28 17:17:44 +00:00
}
2018-11-24 10:18:24 +00:00
log.Infof(ctx, "Cleaning old kubernetes cluster")
if err := kubeCluster.CleanupNodes(ctx); err != nil {
return APIURL, caCrt, clientCert, clientKey, nil, err
2018-11-24 10:18:24 +00:00
}
2018-05-17 22:27:35 +00:00
if err := kubeCluster.RestoreEtcdSnapshot(ctx, snapshotName); err != nil {
return APIURL, caCrt, clientCert, clientKey, nil, err
2018-05-09 17:39:19 +00:00
}
2018-11-24 10:18:24 +00:00
if err := ClusterInit(ctx, rkeConfig, dialersOptions, flags); err != nil {
return APIURL, caCrt, clientCert, clientKey, nil, err
2018-11-24 10:18:24 +00:00
}
APIURL, caCrt, clientCert, clientKey, certs, err := ClusterUp(ctx, dialersOptions, flags, data)
if err != nil {
2019-03-01 00:06:45 +00:00
if !strings.Contains(err.Error(), "Provisioning incomplete") {
return APIURL, caCrt, clientCert, clientKey, nil, err
2019-03-01 00:06:45 +00:00
}
log.Warnf(ctx, err.Error())
2018-11-24 10:18:24 +00:00
}
2019-03-01 00:06:45 +00:00
2018-11-24 10:18:24 +00:00
if err := cluster.RestartClusterPods(ctx, kubeCluster); err != nil {
return APIURL, caCrt, clientCert, clientKey, nil, err
2018-11-24 10:18:24 +00:00
}
if err := kubeCluster.RemoveOldNodes(ctx); err != nil {
return APIURL, caCrt, clientCert, clientKey, nil, err
2018-11-24 10:18:24 +00:00
}
2018-05-17 22:27:35 +00:00
log.Infof(ctx, "Finished restoring snapshot [%s] on all etcd hosts", snapshotName)
return APIURL, caCrt, clientCert, clientKey, certs, err
2018-05-09 17:39:19 +00:00
}
2018-05-17 22:27:35 +00:00
func SnapshotSaveEtcdHostsFromCli(ctx *cli.Context) error {
2019-09-03 20:01:22 +00:00
logrus.Infof("Running RKE version: %v", ctx.App.Version)
2018-05-09 17:39:19 +00:00
clusterFile, filePath, err := resolveClusterFile(ctx)
if err != nil {
return fmt.Errorf("failed to resolve cluster file: %v", err)
2018-05-09 17:39:19 +00:00
}
rkeConfig, err := cluster.ParseConfig(clusterFile)
if err != nil {
return fmt.Errorf("failed to parse cluster file: %v", err)
2018-05-09 17:39:19 +00:00
}
rkeConfig, err = setOptionsFromCLI(ctx, rkeConfig)
if err != nil {
return err
}
2018-05-17 22:27:35 +00:00
// Check snapshot name
etcdSnapshotName := ctx.String("name")
if etcdSnapshotName == "" {
etcdSnapshotName = fmt.Sprintf("rke_etcd_snapshot_%s", time.Now().Format(time.RFC3339))
logrus.Warnf("Name of the snapshot is not specified using [%s]", etcdSnapshotName)
}
// setting up the flags
2018-11-12 23:24:59 +00:00
flags := cluster.GetExternalFlags(false, false, false, "", filePath)
return SnapshotSaveEtcdHosts(context.Background(), rkeConfig, hosts.DialersOptions{}, flags, etcdSnapshotName)
2018-05-09 17:39:19 +00:00
}
2018-05-17 22:27:35 +00:00
func RestoreEtcdSnapshotFromCli(ctx *cli.Context) error {
2019-09-03 20:01:22 +00:00
logrus.Infof("Running RKE version: %v", ctx.App.Version)
2018-05-09 17:39:19 +00:00
clusterFile, filePath, err := resolveClusterFile(ctx)
if err != nil {
return fmt.Errorf("failed to resolve cluster file: %v", err)
2018-05-09 17:39:19 +00:00
}
rkeConfig, err := cluster.ParseConfig(clusterFile)
if err != nil {
return fmt.Errorf("failed to parse cluster file: %v", err)
2018-05-09 17:39:19 +00:00
}
rkeConfig, err = setOptionsFromCLI(ctx, rkeConfig)
if err != nil {
return err
}
2018-05-17 22:27:35 +00:00
etcdSnapshotName := ctx.String("name")
if etcdSnapshotName == "" {
return fmt.Errorf("you must specify the snapshot name to restore")
2018-05-17 22:27:35 +00:00
}
// setting up the flags
2018-11-12 23:24:59 +00:00
flags := cluster.GetExternalFlags(false, false, false, "", filePath)
_, _, _, _, _, err = RestoreEtcdSnapshot(context.Background(), rkeConfig, hosts.DialersOptions{}, flags, map[string]interface{}{}, etcdSnapshotName)
return err
2018-05-09 17:39:19 +00:00
}
2019-04-02 10:54:02 +00:00
// SnapshotRemoveFromEtcdHosts initializes a cluster object from rkeConfig and
// flags, sets up dialers and host tunnels, and then asks the cluster to
// remove the etcd snapshot named snapshotName. The first failing step aborts
// the operation and its error is returned unchanged.
func SnapshotRemoveFromEtcdHosts(
	ctx context.Context,
	rkeConfig *v3.RancherKubernetesEngineConfig,
	dialersOptions hosts.DialersOptions,
	flags cluster.ExternalFlags, snapshotName string) error {

	log.Infof(ctx, "Starting snapshot remove on etcd hosts")

	kubeCluster, err := cluster.InitClusterObject(ctx, rkeConfig, flags)
	if err != nil {
		return err
	}

	// Each step runs only if every previous step succeeded.
	err = kubeCluster.SetupDialers(ctx, dialersOptions)
	if err == nil {
		err = kubeCluster.TunnelHosts(ctx, flags)
	}
	if err == nil {
		err = kubeCluster.RemoveEtcdSnapshot(ctx, snapshotName)
	}
	if err != nil {
		return err
	}

	log.Infof(ctx, "Finished removing snapshot [%s] from all etcd hosts", snapshotName)
	return nil
}