2019-10-27 05:53:25 +00:00
|
|
|
package cluster
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
2021-02-12 15:35:57 +00:00
|
|
|
"net/url"
|
2021-06-04 22:05:47 +00:00
|
|
|
"runtime"
|
2019-11-11 22:18:26 +00:00
|
|
|
"strings"
|
2024-01-30 23:47:18 +00:00
|
|
|
"time"
|
2019-10-27 05:53:25 +00:00
|
|
|
|
2022-03-02 23:47:27 +00:00
|
|
|
"github.com/k3s-io/k3s/pkg/clientaccess"
|
|
|
|
"github.com/k3s-io/k3s/pkg/cluster/managed"
|
|
|
|
"github.com/k3s-io/k3s/pkg/daemons/config"
|
|
|
|
"github.com/k3s-io/k3s/pkg/etcd"
|
2020-11-30 23:45:22 +00:00
|
|
|
"github.com/k3s-io/kine/pkg/endpoint"
|
2019-12-16 18:44:13 +00:00
|
|
|
"github.com/pkg/errors"
|
2021-03-01 22:19:57 +00:00
|
|
|
"github.com/sirupsen/logrus"
|
2024-01-30 23:47:18 +00:00
|
|
|
"k8s.io/apimachinery/pkg/util/wait"
|
2023-09-21 13:39:05 +00:00
|
|
|
utilsnet "k8s.io/utils/net"
|
2019-10-27 05:53:25 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
type Cluster struct {
|
|
|
|
clientAccessInfo *clientaccess.Info
|
|
|
|
config *config.Control
|
2020-05-05 21:59:15 +00:00
|
|
|
managedDB managed.Driver
|
2019-11-11 22:18:26 +00:00
|
|
|
joining bool
|
2021-10-07 19:47:00 +00:00
|
|
|
storageStarted bool
|
2019-11-11 22:18:26 +00:00
|
|
|
saveBootstrap bool
|
2021-10-07 19:47:00 +00:00
|
|
|
shouldBootstrap bool
|
2023-08-01 00:51:46 +00:00
|
|
|
cnFilterFunc func(...string) []string
|
2019-10-27 05:53:25 +00:00
|
|
|
}
|
|
|
|
|
2020-09-24 06:29:25 +00:00
|
|
|
// Start creates the dynamic tls listener, http request handler,
|
|
|
|
// handles starting and writing/reading bootstrap data, and returns a channel
|
2021-03-11 20:07:40 +00:00
|
|
|
// that will be closed when datastore is ready. If embedded etcd is in use,
|
|
|
|
// a secondary call to Cluster.save is made.
|
2020-05-05 21:59:15 +00:00
|
|
|
func (c *Cluster) Start(ctx context.Context) (<-chan struct{}, error) {
|
2020-09-24 06:29:25 +00:00
|
|
|
// Set up the dynamiclistener and http request handlers
|
2020-05-05 21:59:15 +00:00
|
|
|
if err := c.initClusterAndHTTPS(ctx); err != nil {
|
2020-09-24 06:29:25 +00:00
|
|
|
return nil, errors.Wrap(err, "init cluster datastore and https")
|
2019-10-27 05:53:25 +00:00
|
|
|
}
|
|
|
|
|
2021-02-12 15:35:57 +00:00
|
|
|
if c.config.DisableETCD {
|
|
|
|
ready := make(chan struct{})
|
|
|
|
defer close(ready)
|
|
|
|
|
2024-04-08 18:04:27 +00:00
|
|
|
// try to get /db/info urls first, for a current list of etcd cluster member client URLs
|
2021-03-01 21:50:50 +00:00
|
|
|
clientURLs, _, err := etcd.ClientURLs(ctx, c.clientAccessInfo, c.config.PrivateIP)
|
2021-02-12 15:35:57 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2024-04-08 18:04:27 +00:00
|
|
|
// If we somehow got no error but also no client URLs, just use the address of the server we're joining
|
|
|
|
if len(clientURLs) == 0 {
|
2021-02-12 15:35:57 +00:00
|
|
|
clientURL, err := url.Parse(c.config.JoinURL)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
clientURL.Host = clientURL.Hostname() + ":2379"
|
|
|
|
clientURLs = append(clientURLs, clientURL.String())
|
2024-04-08 18:04:27 +00:00
|
|
|
logrus.Warnf("Got empty etcd ClientURL list; using server URL %s", clientURL)
|
2021-02-12 15:35:57 +00:00
|
|
|
}
|
2024-03-19 22:01:36 +00:00
|
|
|
etcdProxy, err := etcd.NewETCDProxy(ctx, c.config.SupervisorPort, c.config.DataDir, clientURLs[0], utilsnet.IsIPv6CIDR(c.config.ServiceIPRanges[0]))
|
2021-02-12 15:35:57 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2024-04-08 18:04:27 +00:00
|
|
|
// immediately update the load balancer with all etcd addresses
|
|
|
|
// client URLs are a full URI, but the proxy only wants host:port
|
|
|
|
for i, c := range clientURLs {
|
|
|
|
u, err := url.Parse(c)
|
|
|
|
if err != nil {
|
|
|
|
return nil, errors.Wrap(err, "failed to parse etcd ClientURL")
|
|
|
|
}
|
|
|
|
clientURLs[i] = u.Host
|
|
|
|
}
|
|
|
|
etcdProxy.Update(clientURLs)
|
|
|
|
|
|
|
|
// start periodic endpoint sync goroutine
|
2021-02-12 15:35:57 +00:00
|
|
|
c.setupEtcdProxy(ctx, etcdProxy)
|
2021-03-01 21:50:50 +00:00
|
|
|
|
|
|
|
// remove etcd member if it exists
|
|
|
|
if err := c.managedDB.RemoveSelf(ctx); err != nil {
|
2021-03-01 22:19:57 +00:00
|
|
|
logrus.Warnf("Failed to remove this node from etcd members")
|
2021-03-01 21:50:50 +00:00
|
|
|
}
|
|
|
|
|
2022-03-08 17:04:31 +00:00
|
|
|
c.config.Runtime.EtcdConfig.Endpoints = strings.Split(c.config.Datastore.Endpoint, ",")
|
|
|
|
c.config.Runtime.EtcdConfig.TLSConfig = c.config.Datastore.BackendTLSConfig
|
|
|
|
|
2021-02-12 15:35:57 +00:00
|
|
|
return ready, nil
|
|
|
|
}
|
|
|
|
|
2020-09-24 06:29:25 +00:00
|
|
|
// start managed database (if necessary)
|
2020-05-05 21:59:15 +00:00
|
|
|
if err := c.start(ctx); err != nil {
|
2020-09-24 06:29:25 +00:00
|
|
|
return nil, errors.Wrap(err, "start managed database")
|
2019-10-27 05:53:25 +00:00
|
|
|
}
|
|
|
|
|
2020-09-24 06:29:25 +00:00
|
|
|
// get the wait channel for testing managed database readiness
|
2020-05-05 21:59:15 +00:00
|
|
|
ready, err := c.testClusterDB(ctx)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
2019-10-27 05:53:25 +00:00
|
|
|
}
|
|
|
|
|
2024-02-22 22:37:32 +00:00
|
|
|
if err := c.startStorage(ctx, false); err != nil {
|
2021-11-10 12:33:42 +00:00
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2020-09-24 06:29:25 +00:00
|
|
|
// if necessary, store bootstrap data to datastore
|
2019-11-11 22:18:26 +00:00
|
|
|
if c.saveBootstrap {
|
2022-02-25 17:26:13 +00:00
|
|
|
if err := Save(ctx, c.config, false); err != nil {
|
2020-05-05 21:59:15 +00:00
|
|
|
return nil, err
|
2019-11-11 22:18:26 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-03-17 21:33:00 +00:00
|
|
|
// at this point, if etcd is in use, it's bootstrapping is complete
|
|
|
|
// so save the bootstrap data. We will need for etcd to be up. If
|
|
|
|
// the save call returns an error, we panic since subsequent etcd
|
|
|
|
// snapshots will be empty.
|
2021-03-11 20:07:40 +00:00
|
|
|
if c.managedDB != nil {
|
2021-03-17 21:33:00 +00:00
|
|
|
go func() {
|
2021-06-04 22:05:47 +00:00
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case <-ready:
|
2022-02-25 17:26:13 +00:00
|
|
|
if err := Save(ctx, c.config, false); err != nil {
|
2021-06-04 22:05:47 +00:00
|
|
|
panic(err)
|
|
|
|
}
|
|
|
|
|
2021-07-09 17:22:49 +00:00
|
|
|
if !c.config.EtcdDisableSnapshots {
|
2024-08-05 16:35:07 +00:00
|
|
|
_ = wait.PollUntilContextCancel(ctx, time.Second, true, func(ctx context.Context) (bool, error) {
|
2024-01-30 23:47:18 +00:00
|
|
|
err := c.managedDB.ReconcileSnapshotData(ctx)
|
|
|
|
if err != nil {
|
|
|
|
logrus.Errorf("Failed to record snapshots for cluster: %v", err)
|
|
|
|
}
|
|
|
|
return err == nil, nil
|
|
|
|
})
|
2021-06-04 22:05:47 +00:00
|
|
|
}
|
|
|
|
return
|
|
|
|
default:
|
|
|
|
runtime.Gosched()
|
2021-03-17 21:33:00 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}()
|
2021-03-11 20:07:40 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return ready, nil
|
2019-11-11 22:18:26 +00:00
|
|
|
}
|
|
|
|
|
2020-09-24 06:29:25 +00:00
|
|
|
// startStorage starts the kine listener and configures the endpoints, if necessary.
|
|
|
|
// This calls into the kine endpoint code, which sets up the database client
|
|
|
|
// and unix domain socket listener if using an external database. In the case of an etcd
|
|
|
|
// backend it just returns the user-provided etcd endpoints and tls config.
|
2024-02-22 22:37:32 +00:00
|
|
|
func (c *Cluster) startStorage(ctx context.Context, bootstrap bool) error {
|
|
|
|
if c.storageStarted && !c.config.KineTLS {
|
2019-11-11 22:18:26 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
c.storageStarted = true
|
|
|
|
|
2024-02-22 22:37:32 +00:00
|
|
|
if !bootstrap {
|
|
|
|
// set the tls config for the kine storage
|
|
|
|
c.config.Datastore.ServerTLSConfig.CAFile = c.config.Runtime.ETCDServerCA
|
|
|
|
c.config.Datastore.ServerTLSConfig.CertFile = c.config.Runtime.ServerETCDCert
|
|
|
|
c.config.Datastore.ServerTLSConfig.KeyFile = c.config.Runtime.ServerETCDKey
|
|
|
|
}
|
|
|
|
|
2020-09-24 06:29:25 +00:00
|
|
|
// start listening on the kine socket as an etcd endpoint, or return the external etcd endpoints
|
2019-11-16 00:12:27 +00:00
|
|
|
etcdConfig, err := endpoint.Listen(ctx, c.config.Datastore)
|
2019-11-11 22:18:26 +00:00
|
|
|
if err != nil {
|
2019-12-16 18:44:13 +00:00
|
|
|
return errors.Wrap(err, "creating storage endpoint")
|
2019-10-31 02:05:40 +00:00
|
|
|
}
|
|
|
|
|
2020-09-24 06:29:25 +00:00
|
|
|
// Persist the returned etcd configuration. We decide if we're doing leader election for embedded controllers
|
|
|
|
// based on what the kine wrapper tells us about the datastore. Single-node datastores like sqlite don't require
|
|
|
|
// leader election, while basically all others (etcd, external database, etc) do since they allow multiple servers.
|
2022-02-25 17:26:13 +00:00
|
|
|
c.config.Runtime.EtcdConfig = etcdConfig
|
2024-02-22 22:37:32 +00:00
|
|
|
|
|
|
|
// after the bootstrap we need to set the args for api-server with kine in unixs or just set the
|
|
|
|
// values if the datastoreTLS is not enabled
|
|
|
|
if !bootstrap || !c.config.KineTLS {
|
|
|
|
c.config.Datastore.BackendTLSConfig = etcdConfig.TLSConfig
|
|
|
|
c.config.Datastore.Endpoint = strings.Join(etcdConfig.Endpoints, ",")
|
|
|
|
c.config.NoLeaderElect = !etcdConfig.LeaderElect
|
|
|
|
}
|
|
|
|
|
2019-11-11 22:18:26 +00:00
|
|
|
return nil
|
2019-10-27 05:53:25 +00:00
|
|
|
}
|
|
|
|
|
2021-10-07 19:47:00 +00:00
|
|
|
// New creates an initial cluster using the provided configuration.
|
2019-10-27 05:53:25 +00:00
|
|
|
func New(config *config.Control) *Cluster {
|
|
|
|
return &Cluster{
|
2022-02-24 19:01:14 +00:00
|
|
|
config: config,
|
2019-10-27 05:53:25 +00:00
|
|
|
}
|
|
|
|
}
|