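With long-running jobs like thrashing, ssh connections were timing
out. Pass keep_alive=True to connection.connect() wherever a remote
connection is opened (initial connect and reconnect) to avoid this.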
remote.ssh = connection.connect(
user_at_host=remote.name,
host_key=ctx.config['targets'][remote.name],
+ keep_alive=True,
)
except socket.timeout:
pass
log.debug('connecting to %s', t)
remotes.append(
remote.Remote(name=t,
- ssh=connection.connect(user_at_host=t, host_key=key)))
+ ssh=connection.connect(user_at_host=t,
+ host_key=key,
+ keep_alive=True)))
ctx.cluster = orchestra.cluster.Cluster()
if 'roles' in ctx.config:
for rem, roles in zip(remotes, ctx.config['roles']):