Skip to content

Commit

Permalink
Dynamically resolve reverse tunnel address
Browse files Browse the repository at this point in the history
The reverse tunnel address is currently a static string that is
retrieved from config and passed around for the duration of a
service's lifetime. When the `tunnel_public_address` is changed
on the proxy and the proxy is then restarted, all established
reverse tunnels over the old address will fail indefinitely.
As a means to get around this, #8102 introduced a mechanism
that would cause nodes to restart if their connection to the
auth server was down for a period of time. While this did
allow the nodes to pick up the new address after the nodes
restarted, it was meant to be a stopgap until a more robust
solution could be applied.

Instead of using a static address, the reverse tunnel address
is now resolved via a `reversetunnel.Resolver`. Anywhere that
previously relied on the static proxy address will now fetch
the actual reverse tunnel address via the webclient by using
the Resolver. In addition, this builds on the refactoring done
in #4290 to further simplify the reversetunnel package. Since
we no longer track multiple proxies, all the leftover bits
that did so have been removed to accommodate using a dynamic
reverse tunnel address.
  • Loading branch information
rosstimothy committed Jan 27, 2022
1 parent 85129ee commit b3625c0
Show file tree
Hide file tree
Showing 20 changed files with 528 additions and 534 deletions.
111 changes: 0 additions & 111 deletions integration/restart_test.go

This file was deleted.

25 changes: 18 additions & 7 deletions lib/reversetunnel/agent.go
Original file line number Diff line number Diff line change
Expand Up @@ -384,12 +384,19 @@ func (a *Agent) run() {
a.log.Warningf("Failed to create remote tunnel: %v, conn: %v.", err, conn)
return
}
defer conn.Close()

local := conn.LocalAddr().String()
remote := conn.RemoteAddr().String()
defer func() {
if err := conn.Close(); err != nil {
a.log.Warnf("Failed to close remote tunnel: %v, local addr: %s remote addr: %s", err, local, remote)
}
}()

// Successfully connected to remote cluster.
a.log.WithFields(log.Fields{
"addr": conn.LocalAddr().String(),
"remote-addr": conn.RemoteAddr().String(),
"addr": local,
"remote-addr": remote,
}).Info("Connected.")

// wrap up remaining business logic in closure for easy
Expand All @@ -414,14 +421,14 @@ func (a *Agent) run() {
// or permanent loss of a proxy.
err = a.processRequests(conn)
if err != nil {
a.log.Warnf("Unable to continue processesing requests: %v.", err)
a.log.Warnf("Unable to continue processioning requests: %v.", err)
return
}
}
// if Tracker was provided, then the agent shouldn't continue unless
// no other agents hold a claim.
if a.Tracker != nil {
if !a.Tracker.WithProxy(doWork, a.Lease, a.getPrincipalsList()...) {
if !a.Tracker.WithProxy(doWork, a.getPrincipalsList()...) {
a.log.Debugf("Proxy already held by other agent: %v, releasing.", a.getPrincipalsList())
}
} else {
Expand Down Expand Up @@ -518,15 +525,19 @@ func (a *Agent) processRequests(conn *ssh.Client) error {
}
}

// handleDisovery receives discovery requests from the reverse tunnel
// handleDiscovery receives discovery requests from the reverse tunnel
// server, that informs agent about proxies registered in the remote
// cluster and the reverse tunnels already established
//
// ch : SSH channel which received "teleport-transport" out-of-band request
// reqC : request payload
func (a *Agent) handleDiscovery(ch ssh.Channel, reqC <-chan *ssh.Request) {
a.log.Debugf("handleDiscovery requests channel.")
defer ch.Close()
defer func() {
if err := ch.Close(); err != nil {
a.log.Warnf("Failed to closed connection: %v", err)
}
}()

for {
var req *ssh.Request
Expand Down
80 changes: 37 additions & 43 deletions lib/reversetunnel/agentpool.go
Original file line number Diff line number Diff line change
Expand Up @@ -59,7 +59,7 @@ type AgentPool struct {
spawnLimiter utils.Retry

mu sync.Mutex
agents map[utils.NetAddr][]*Agent
agents []*Agent
}

// AgentPoolConfig holds configuration parameters for the agent pool
Expand Down Expand Up @@ -89,8 +89,8 @@ type AgentPoolConfig struct {
Component string
// ReverseTunnelServer holds all reverse tunnel connections.
ReverseTunnelServer Server
// ProxyAddr points to the address of the ssh proxy
ProxyAddr string
// Resolver retrieves the reverse tunnel address
Resolver Resolver
// Cluster is a cluster name of the proxy.
Cluster string
// FIPS indicates if Teleport was started in FIPS mode.
Expand Down Expand Up @@ -135,11 +135,6 @@ func NewAgentPool(ctx context.Context, cfg AgentPoolConfig) (*AgentPool, error)
return nil, trace.Wrap(err)
}

proxyAddr, err := utils.ParseAddr(cfg.ProxyAddr)
if err != nil {
return nil, trace.Wrap(err)
}

ctx, cancel := context.WithCancel(ctx)
tr, err := track.New(ctx, track.Config{ClusterName: cfg.Cluster})
if err != nil {
Expand All @@ -148,7 +143,7 @@ func NewAgentPool(ctx context.Context, cfg AgentPoolConfig) (*AgentPool, error)
}

pool := &AgentPool{
agents: make(map[utils.NetAddr][]*Agent),
agents: nil,
proxyTracker: tr,
cfg: cfg,
ctx: ctx,
Expand All @@ -161,7 +156,7 @@ func NewAgentPool(ctx context.Context, cfg AgentPoolConfig) (*AgentPool, error)
},
}),
}
pool.proxyTracker.Start(*proxyAddr)
pool.proxyTracker.Start()
return pool, nil
}

Expand Down Expand Up @@ -204,7 +199,6 @@ func (m *AgentPool) processSeekEvents() {
// The proxy tracker has given us permission to act on a given
// tunnel address
case lease := <-m.proxyTracker.Acquire():
m.log.Debugf("Seeking: %+v.", lease.Key())
m.withLock(func() {
// Note that ownership of the lease is transferred to agent
// pool for the lifetime of the connection
Expand Down Expand Up @@ -232,11 +226,11 @@ func (m *AgentPool) withLock(f func()) {
type matchAgentFn func(a *Agent) bool

func (m *AgentPool) closeAgents() {
for key, agents := range m.agents {
m.agents[key] = filterAndClose(agents, func(*Agent) bool { return true })
if len(m.agents[key]) == 0 {
delete(m.agents, key)
}
agents := filterAndClose(m.agents, func(*Agent) bool { return true })
if len(agents) <= 0 {
m.agents = nil
} else {
m.agents = agents
}
}

Expand All @@ -246,7 +240,9 @@ func filterAndClose(agents []*Agent, matchAgent matchAgentFn) []*Agent {
agent := agents[i]
if matchAgent(agent) {
agent.log.Debugf("Pool is closing agent.")
agent.Close()
if err := agent.Close(); err != nil {
agent.log.WithError(err).Warnf("Failed to close agent")
}
} else {
filtered = append(filtered, agent)
}
Expand All @@ -271,21 +267,24 @@ func (m *AgentPool) pollAndSyncAgents() {

// getReverseTunnelDetails gets the cached ReverseTunnelDetails obtained during the oldest cached agent.connect call.
// This function should be called under a lock.
func (m *AgentPool) getReverseTunnelDetails(addr utils.NetAddr) *reverseTunnelDetails {
agents, ok := m.agents[addr]
if !ok || len(agents) == 0 {
func (m *AgentPool) getReverseTunnelDetails() *reverseTunnelDetails {
if len(m.agents) <= 0 {
return nil
}
return agents[0].reverseTunnelDetails
return m.agents[0].reverseTunnelDetails
}

// addAgent adds a new agent to the pool. Note that ownership of the lease
// transfers into the AgentPool, and will be released when the AgentPool
// is done with it.
func (m *AgentPool) addAgent(lease track.Lease) error {
addr := lease.Key().(utils.NetAddr)
addr, err := m.cfg.Resolver()
if err != nil {
return trace.Wrap(err)
}

agent, err := NewAgent(AgentConfig{
Addr: addr,
Addr: *addr,
ClusterName: m.cfg.Cluster,
Username: m.cfg.HostUUID,
Signer: m.cfg.HostSigner,
Expand All @@ -300,7 +299,7 @@ func (m *AgentPool) addAgent(lease track.Lease) error {
Tracker: m.proxyTracker,
Lease: lease,
FIPS: m.cfg.FIPS,
reverseTunnelDetails: m.getReverseTunnelDetails(addr),
reverseTunnelDetails: m.getReverseTunnelDetails(),
})
if err != nil {
// ensure that lease has been released; OK to call multiple times.
Expand All @@ -311,21 +310,19 @@ func (m *AgentPool) addAgent(lease track.Lease) error {
// start the agent in a goroutine. no need to handle Start() errors: Start() will be
// retrying itself until the agent is closed
go agent.Start()
m.agents[addr] = append(m.agents[addr], agent)
m.agents = append(m.agents, agent)
return nil
}

// Counts returns a count of the number of proxies a outbound tunnel is
// Count returns a count of the number of proxies an outbound tunnel is
// connected to. Used in tests to determine if a proxy has been found and/or
// removed.
func (m *AgentPool) Count() int {
var out int
m.withLock(func() {
for _, agents := range m.agents {
for _, agent := range agents {
if agent.getState() == agentStateConnected {
out++
}
for _, agent := range m.agents {
if agent.getState() == agentStateConnected {
out++
}
}
})
Expand All @@ -336,18 +333,15 @@ func (m *AgentPool) Count() int {
// removeDisconnected removes disconnected agents from the list of agents.
// This function should be called under a lock.
func (m *AgentPool) removeDisconnected() {
for agentKey, agentSlice := range m.agents {
// Filter and close all disconnected agents.
validAgents := filterAndClose(agentSlice, func(agent *Agent) bool {
return agent.getState() == agentStateDisconnected
})

// Update (or delete) agent key with filter applied.
if len(validAgents) > 0 {
m.agents[agentKey] = validAgents
} else {
delete(m.agents, agentKey)
}
// Filter and close all disconnected agents.
agents := filterAndClose(m.agents, func(agent *Agent) bool {
return agent.getState() == agentStateDisconnected
})

if len(agents) <= 0 {
m.agents = nil
} else {
m.agents = agents
}
}

Expand Down
Loading

0 comments on commit b3625c0

Please sign in to comment.