blob: ddd0d0aa8a3bfb145c7581f0824cdd9b53e5bc25 [file] [log] [blame]
Aviv Keshet07f16242013-10-10 07:54:19 -07001import os, time, socket, shutil, glob, logging, traceback, tempfile
Aviv Keshet53a216a2013-08-27 13:58:46 -07002from autotest_lib.client.common_lib import autotemp, error
jadmanski31c49b72008-10-27 20:44:48 +00003from autotest_lib.server import utils, autotest
mblighe8b93af2009-01-30 00:45:53 +00004from autotest_lib.server.hosts import remote
mblighefccc1b2010-01-11 19:08:42 +00005from autotest_lib.client.common_lib.global_config import global_config
jadmanskica7da372008-10-21 16:26:52 +00006
Aviv Keshet53a216a2013-08-27 13:58:46 -07007# pylint: disable-msg=C0111
jadmanskica7da372008-10-21 16:26:52 +00008
# Short alias for the global configuration lookup used throughout this module.
get_value = global_config.get_config_value

# When true, start_master_ssh() keeps one shared ("master") SSH connection
# per host; read from the AUTOSERV section and disabled unless configured.
enable_master_ssh = get_value(
    'AUTOSERV',
    'enable_master_ssh',
    type=bool,
    default=False,
)
mblighefccc1b2010-01-11 19:08:42 +000012
13
Fang Deng96667ca2013-08-01 17:46:18 -070014class AbstractSSHHost(remote.RemoteHost):
mblighbc9402b2009-12-29 01:15:34 +000015 """
16 This class represents a generic implementation of most of the
jadmanskica7da372008-10-21 16:26:52 +000017 framework necessary for controlling a host via ssh. It implements
18 almost all of the abstract Host methods, except for the core
mblighbc9402b2009-12-29 01:15:34 +000019 Host.run method.
20 """
jadmanskica7da372008-10-21 16:26:52 +000021
jadmanskif6562912008-10-21 17:59:01 +000022 def _initialize(self, hostname, user="root", port=22, password="",
23 *args, **dargs):
24 super(AbstractSSHHost, self)._initialize(hostname=hostname,
25 *args, **dargs)
Dan Shic07b8932014-12-11 15:22:30 -080026 # IP address is retrieved only on demand. Otherwise the host
27 # initialization will fail for host is not online.
28 self._ip = None
jadmanskica7da372008-10-21 16:26:52 +000029 self.user = user
30 self.port = port
31 self.password = password
showard6eafb492010-01-15 20:29:06 +000032 self._use_rsync = None
Fang Deng3af66202013-08-16 15:19:25 -070033 self.known_hosts_file = tempfile.mkstemp()[1]
jadmanskica7da372008-10-21 16:26:52 +000034
mblighefccc1b2010-01-11 19:08:42 +000035 """
36 Master SSH connection background job, socket temp directory and socket
37 control path option. If master-SSH is enabled, these fields will be
38 initialized by start_master_ssh when a new SSH connection is initiated.
39 """
40 self.master_ssh_job = None
41 self.master_ssh_tempdir = None
42 self.master_ssh_option = ''
43
showard6eafb492010-01-15 20:29:06 +000044
Dan Shic07b8932014-12-11 15:22:30 -080045 @property
46 def ip(self):
47 """@return IP address of the host.
48 """
49 if not self._ip:
50 self._ip = socket.getaddrinfo(self.hostname, None)[0][4][0]
51 return self._ip
52
53
Fang Deng96667ca2013-08-01 17:46:18 -070054 def make_ssh_command(self, user="root", port=22, opts='',
55 hosts_file='/dev/null',
56 connect_timeout=30, alive_interval=300):
57 base_command = ("/usr/bin/ssh -a -x %s -o StrictHostKeyChecking=no "
58 "-o UserKnownHostsFile=%s -o BatchMode=yes "
59 "-o ConnectTimeout=%d -o ServerAliveInterval=%d "
60 "-l %s -p %d")
61 assert isinstance(connect_timeout, (int, long))
62 assert connect_timeout > 0 # can't disable the timeout
63 return base_command % (opts, hosts_file, connect_timeout,
64 alive_interval, user, port)
65
66
showard6eafb492010-01-15 20:29:06 +000067 def use_rsync(self):
68 if self._use_rsync is not None:
69 return self._use_rsync
70
mblighc9892c02010-01-06 19:02:16 +000071 # Check if rsync is available on the remote host. If it's not,
72 # don't try to use it for any future file transfers.
showard6eafb492010-01-15 20:29:06 +000073 self._use_rsync = self._check_rsync()
74 if not self._use_rsync:
Ilja H. Friedel04be2bd2014-05-07 21:29:59 -070075 logging.warning("rsync not available on remote host %s -- disabled",
mblighc9892c02010-01-06 19:02:16 +000076 self.hostname)
Eric Lie0493a42010-11-15 13:05:43 -080077 return self._use_rsync
mblighc9892c02010-01-06 19:02:16 +000078
79
80 def _check_rsync(self):
81 """
82 Check if rsync is available on the remote host.
83 """
84 try:
85 self.run("rsync --version", stdout_tee=None, stderr_tee=None)
86 except error.AutoservRunError:
87 return False
88 return True
89
jadmanskica7da372008-10-21 16:26:52 +000090
showard56176ec2009-10-28 19:52:30 +000091 def _encode_remote_paths(self, paths, escape=True):
mblighbc9402b2009-12-29 01:15:34 +000092 """
93 Given a list of file paths, encodes it as a single remote path, in
94 the style used by rsync and scp.
95 """
showard56176ec2009-10-28 19:52:30 +000096 if escape:
97 paths = [utils.scp_remote_escape(path) for path in paths]
98 return '%s@%s:"%s"' % (self.user, self.hostname, " ".join(paths))
jadmanskica7da372008-10-21 16:26:52 +000099
jadmanskica7da372008-10-21 16:26:52 +0000100
mbligh45561782009-05-11 21:14:34 +0000101 def _make_rsync_cmd(self, sources, dest, delete_dest, preserve_symlinks):
mblighbc9402b2009-12-29 01:15:34 +0000102 """
103 Given a list of source paths and a destination path, produces the
jadmanskid7b79ed2009-01-07 17:19:48 +0000104 appropriate rsync command for copying them. Remote paths must be
mblighbc9402b2009-12-29 01:15:34 +0000105 pre-encoded.
106 """
Fang Deng96667ca2013-08-01 17:46:18 -0700107 ssh_cmd = self.make_ssh_command(user=self.user, port=self.port,
108 opts=self.master_ssh_option,
109 hosts_file=self.known_hosts_file)
jadmanskid7b79ed2009-01-07 17:19:48 +0000110 if delete_dest:
111 delete_flag = "--delete"
112 else:
113 delete_flag = ""
mbligh45561782009-05-11 21:14:34 +0000114 if preserve_symlinks:
115 symlink_flag = ""
116 else:
117 symlink_flag = "-L"
Dan Shi06d7fbf2014-02-12 12:34:41 -0800118 command = ("rsync %s %s --timeout=1800 --rsh='%s' -az --no-o --no-g "
David Hendricksb8904182014-06-02 15:22:49 -0700119 "%s \"%s\"")
mbligh45561782009-05-11 21:14:34 +0000120 return command % (symlink_flag, delete_flag, ssh_cmd,
David Hendricksb8904182014-06-02 15:22:49 -0700121 " ".join(['"%s"' % p for p in sources]), dest)
jadmanskid7b79ed2009-01-07 17:19:48 +0000122
123
Eric Li861b2d52011-02-04 14:50:35 -0800124 def _make_ssh_cmd(self, cmd):
125 """
126 Create a base ssh command string for the host which can be used
127 to run commands directly on the machine
128 """
Fang Deng96667ca2013-08-01 17:46:18 -0700129 base_cmd = self.make_ssh_command(user=self.user, port=self.port,
130 opts=self.master_ssh_option,
131 hosts_file=self.known_hosts_file)
Eric Li861b2d52011-02-04 14:50:35 -0800132
133 return '%s %s "%s"' % (base_cmd, self.hostname, utils.sh_escape(cmd))
134
jadmanskid7b79ed2009-01-07 17:19:48 +0000135 def _make_scp_cmd(self, sources, dest):
mblighbc9402b2009-12-29 01:15:34 +0000136 """
137 Given a list of source paths and a destination path, produces the
jadmanskid7b79ed2009-01-07 17:19:48 +0000138 appropriate scp command for encoding it. Remote paths must be
mblighbc9402b2009-12-29 01:15:34 +0000139 pre-encoded.
140 """
mblighc0649d62010-01-15 18:15:58 +0000141 command = ("scp -rq %s -o StrictHostKeyChecking=no "
lmraf676f32010-02-04 03:36:26 +0000142 "-o UserKnownHostsFile=%s -P %d %s '%s'")
Fang Deng3af66202013-08-16 15:19:25 -0700143 return command % (self.master_ssh_option, self.known_hosts_file,
mblighefccc1b2010-01-11 19:08:42 +0000144 self.port, " ".join(sources), dest)
jadmanskid7b79ed2009-01-07 17:19:48 +0000145
146
147 def _make_rsync_compatible_globs(self, path, is_local):
mblighbc9402b2009-12-29 01:15:34 +0000148 """
149 Given an rsync-style path, returns a list of globbed paths
jadmanskid7b79ed2009-01-07 17:19:48 +0000150 that will hopefully provide equivalent behaviour for scp. Does not
151 support the full range of rsync pattern matching behaviour, only that
152 exposed in the get/send_file interface (trailing slashes).
153
154 The is_local param is flag indicating if the paths should be
mblighbc9402b2009-12-29 01:15:34 +0000155 interpreted as local or remote paths.
156 """
jadmanskid7b79ed2009-01-07 17:19:48 +0000157
158 # non-trailing slash paths should just work
159 if len(path) == 0 or path[-1] != "/":
160 return [path]
161
162 # make a function to test if a pattern matches any files
163 if is_local:
showard56176ec2009-10-28 19:52:30 +0000164 def glob_matches_files(path, pattern):
165 return len(glob.glob(path + pattern)) > 0
jadmanskid7b79ed2009-01-07 17:19:48 +0000166 else:
showard56176ec2009-10-28 19:52:30 +0000167 def glob_matches_files(path, pattern):
168 result = self.run("ls \"%s\"%s" % (utils.sh_escape(path),
169 pattern),
170 stdout_tee=None, ignore_status=True)
jadmanskid7b79ed2009-01-07 17:19:48 +0000171 return result.exit_status == 0
172
173 # take a set of globs that cover all files, and see which are needed
174 patterns = ["*", ".[!.]*"]
showard56176ec2009-10-28 19:52:30 +0000175 patterns = [p for p in patterns if glob_matches_files(path, p)]
jadmanskid7b79ed2009-01-07 17:19:48 +0000176
177 # convert them into a set of paths suitable for the commandline
jadmanskid7b79ed2009-01-07 17:19:48 +0000178 if is_local:
showard56176ec2009-10-28 19:52:30 +0000179 return ["\"%s\"%s" % (utils.sh_escape(path), pattern)
180 for pattern in patterns]
jadmanskid7b79ed2009-01-07 17:19:48 +0000181 else:
showard56176ec2009-10-28 19:52:30 +0000182 return [utils.scp_remote_escape(path) + pattern
183 for pattern in patterns]
jadmanskid7b79ed2009-01-07 17:19:48 +0000184
185
186 def _make_rsync_compatible_source(self, source, is_local):
mblighbc9402b2009-12-29 01:15:34 +0000187 """
188 Applies the same logic as _make_rsync_compatible_globs, but
jadmanskid7b79ed2009-01-07 17:19:48 +0000189 applies it to an entire list of sources, producing a new list of
mblighbc9402b2009-12-29 01:15:34 +0000190 sources, properly quoted.
191 """
jadmanskid7b79ed2009-01-07 17:19:48 +0000192 return sum((self._make_rsync_compatible_globs(path, is_local)
193 for path in source), [])
jadmanskica7da372008-10-21 16:26:52 +0000194
195
mblighfeac0102009-04-28 18:31:12 +0000196 def _set_umask_perms(self, dest):
mblighbc9402b2009-12-29 01:15:34 +0000197 """
198 Given a destination file/dir (recursively) set the permissions on
199 all the files and directories to the max allowed by running umask.
200 """
mblighfeac0102009-04-28 18:31:12 +0000201
202 # now this looks strange but I haven't found a way in Python to _just_
203 # get the umask, apparently the only option is to try to set it
204 umask = os.umask(0)
205 os.umask(umask)
206
207 max_privs = 0777 & ~umask
208
209 def set_file_privs(filename):
Chris Masone567d0d92011-12-19 09:38:30 -0800210 """Sets mode of |filename|. Assumes |filename| exists."""
211 file_stat = os.stat(filename)
mblighfeac0102009-04-28 18:31:12 +0000212
213 file_privs = max_privs
214 # if the original file permissions do not have at least one
215 # executable bit then do not set it anywhere
216 if not file_stat.st_mode & 0111:
217 file_privs &= ~0111
218
219 os.chmod(filename, file_privs)
220
221 # try a bottom-up walk so changes on directory permissions won't cut
222 # our access to the files/directories inside it
223 for root, dirs, files in os.walk(dest, topdown=False):
224 # when setting the privileges we emulate the chmod "X" behaviour
225 # that sets to execute only if it is a directory or any of the
226 # owner/group/other already has execute right
227 for dirname in dirs:
228 os.chmod(os.path.join(root, dirname), max_privs)
229
Chris Masone567d0d92011-12-19 09:38:30 -0800230 # Filter out broken symlinks as we go.
231 for filename in filter(os.path.exists, files):
mblighfeac0102009-04-28 18:31:12 +0000232 set_file_privs(os.path.join(root, filename))
233
234
235 # now set privs for the dest itself
236 if os.path.isdir(dest):
237 os.chmod(dest, max_privs)
238 else:
239 set_file_privs(dest)
240
241
mbligh45561782009-05-11 21:14:34 +0000242 def get_file(self, source, dest, delete_dest=False, preserve_perm=True,
243 preserve_symlinks=False):
jadmanskica7da372008-10-21 16:26:52 +0000244 """
245 Copy files from the remote host to a local path.
246
247 Directories will be copied recursively.
248 If a source component is a directory with a trailing slash,
249 the content of the directory will be copied, otherwise, the
250 directory itself and its content will be copied. This
251 behavior is similar to that of the program 'rsync'.
252
253 Args:
254 source: either
255 1) a single file or directory, as a string
256 2) a list of one or more (possibly mixed)
257 files or directories
258 dest: a file or a directory (if source contains a
259 directory or more than one element, you must
260 supply a directory dest)
mbligh89e258d2008-10-24 13:58:08 +0000261 delete_dest: if this is true, the command will also clear
262 out any old files at dest that are not in the
263 source
mblighfeac0102009-04-28 18:31:12 +0000264 preserve_perm: tells get_file() to try to preserve the sources
265 permissions on files and dirs
mbligh45561782009-05-11 21:14:34 +0000266 preserve_symlinks: try to preserve symlinks instead of
267 transforming them into files/dirs on copy
jadmanskica7da372008-10-21 16:26:52 +0000268
269 Raises:
270 AutoservRunError: the scp command failed
271 """
Simran Basi882f15b2013-10-29 14:59:34 -0700272 logging.debug('get_file. source: %s, dest: %s, delete_dest: %s,'
273 'preserve_perm: %s, preserve_symlinks:%s', source, dest,
274 delete_dest, preserve_perm, preserve_symlinks)
mblighefccc1b2010-01-11 19:08:42 +0000275 # Start a master SSH connection if necessary.
276 self.start_master_ssh()
277
jadmanskica7da372008-10-21 16:26:52 +0000278 if isinstance(source, basestring):
279 source = [source]
jadmanskid7b79ed2009-01-07 17:19:48 +0000280 dest = os.path.abspath(dest)
jadmanskica7da372008-10-21 16:26:52 +0000281
mblighc9892c02010-01-06 19:02:16 +0000282 # If rsync is disabled or fails, try scp.
showard6eafb492010-01-15 20:29:06 +0000283 try_scp = True
284 if self.use_rsync():
Simran Basi882f15b2013-10-29 14:59:34 -0700285 logging.debug('Using Rsync.')
mblighc9892c02010-01-06 19:02:16 +0000286 try:
287 remote_source = self._encode_remote_paths(source)
288 local_dest = utils.sh_escape(dest)
289 rsync = self._make_rsync_cmd([remote_source], local_dest,
290 delete_dest, preserve_symlinks)
291 utils.run(rsync)
showard6eafb492010-01-15 20:29:06 +0000292 try_scp = False
mblighc9892c02010-01-06 19:02:16 +0000293 except error.CmdError, e:
Ilja H. Friedel04be2bd2014-05-07 21:29:59 -0700294 logging.warning("trying scp, rsync failed: %s", e)
mblighc9892c02010-01-06 19:02:16 +0000295
296 if try_scp:
Simran Basi882f15b2013-10-29 14:59:34 -0700297 logging.debug('Trying scp.')
jadmanskid7b79ed2009-01-07 17:19:48 +0000298 # scp has no equivalent to --delete, just drop the entire dest dir
299 if delete_dest and os.path.isdir(dest):
300 shutil.rmtree(dest)
301 os.mkdir(dest)
jadmanskica7da372008-10-21 16:26:52 +0000302
jadmanskid7b79ed2009-01-07 17:19:48 +0000303 remote_source = self._make_rsync_compatible_source(source, False)
304 if remote_source:
showard56176ec2009-10-28 19:52:30 +0000305 # _make_rsync_compatible_source() already did the escaping
306 remote_source = self._encode_remote_paths(remote_source,
307 escape=False)
jadmanskid7b79ed2009-01-07 17:19:48 +0000308 local_dest = utils.sh_escape(dest)
jadmanski2583a432009-02-10 23:59:11 +0000309 scp = self._make_scp_cmd([remote_source], local_dest)
jadmanskid7b79ed2009-01-07 17:19:48 +0000310 try:
311 utils.run(scp)
312 except error.CmdError, e:
Simran Basi882f15b2013-10-29 14:59:34 -0700313 logging.debug('scp failed: %s', e)
jadmanskid7b79ed2009-01-07 17:19:48 +0000314 raise error.AutoservRunError(e.args[0], e.args[1])
jadmanskica7da372008-10-21 16:26:52 +0000315
mblighfeac0102009-04-28 18:31:12 +0000316 if not preserve_perm:
317 # we have no way to tell scp to not try to preserve the
318 # permissions so set them after copy instead.
319 # for rsync we could use "--no-p --chmod=ugo=rwX" but those
320 # options are only in very recent rsync versions
321 self._set_umask_perms(dest)
322
jadmanskica7da372008-10-21 16:26:52 +0000323
mbligh45561782009-05-11 21:14:34 +0000324 def send_file(self, source, dest, delete_dest=False,
325 preserve_symlinks=False):
jadmanskica7da372008-10-21 16:26:52 +0000326 """
327 Copy files from a local path to the remote host.
328
329 Directories will be copied recursively.
330 If a source component is a directory with a trailing slash,
331 the content of the directory will be copied, otherwise, the
332 directory itself and its content will be copied. This
333 behavior is similar to that of the program 'rsync'.
334
335 Args:
336 source: either
337 1) a single file or directory, as a string
338 2) a list of one or more (possibly mixed)
339 files or directories
340 dest: a file or a directory (if source contains a
341 directory or more than one element, you must
342 supply a directory dest)
mbligh89e258d2008-10-24 13:58:08 +0000343 delete_dest: if this is true, the command will also clear
344 out any old files at dest that are not in the
345 source
mbligh45561782009-05-11 21:14:34 +0000346 preserve_symlinks: controls if symlinks on the source will be
347 copied as such on the destination or transformed into the
348 referenced file/directory
jadmanskica7da372008-10-21 16:26:52 +0000349
350 Raises:
351 AutoservRunError: the scp command failed
352 """
Simran Basi882f15b2013-10-29 14:59:34 -0700353 logging.debug('send_file. source: %s, dest: %s, delete_dest: %s,'
354 'preserve_symlinks:%s', source, dest,
355 delete_dest, preserve_symlinks)
mblighefccc1b2010-01-11 19:08:42 +0000356 # Start a master SSH connection if necessary.
357 self.start_master_ssh()
358
jadmanskica7da372008-10-21 16:26:52 +0000359 if isinstance(source, basestring):
360 source = [source]
jadmanski2583a432009-02-10 23:59:11 +0000361 remote_dest = self._encode_remote_paths([dest])
jadmanskica7da372008-10-21 16:26:52 +0000362
mblighc9892c02010-01-06 19:02:16 +0000363 # If rsync is disabled or fails, try scp.
showard6eafb492010-01-15 20:29:06 +0000364 try_scp = True
365 if self.use_rsync():
Simran Basi882f15b2013-10-29 14:59:34 -0700366 logging.debug('Using Rsync.')
mblighc9892c02010-01-06 19:02:16 +0000367 try:
368 local_sources = [utils.sh_escape(path) for path in source]
369 rsync = self._make_rsync_cmd(local_sources, remote_dest,
370 delete_dest, preserve_symlinks)
371 utils.run(rsync)
showard6eafb492010-01-15 20:29:06 +0000372 try_scp = False
mblighc9892c02010-01-06 19:02:16 +0000373 except error.CmdError, e:
Ilja H. Friedel04be2bd2014-05-07 21:29:59 -0700374 logging.warning("trying scp, rsync failed: %s", e)
mblighc9892c02010-01-06 19:02:16 +0000375
376 if try_scp:
Simran Basi882f15b2013-10-29 14:59:34 -0700377 logging.debug('Trying scp.')
jadmanskid7b79ed2009-01-07 17:19:48 +0000378 # scp has no equivalent to --delete, just drop the entire dest dir
379 if delete_dest:
showard27160152009-07-15 14:28:42 +0000380 is_dir = self.run("ls -d %s/" % dest,
jadmanskid7b79ed2009-01-07 17:19:48 +0000381 ignore_status=True).exit_status == 0
382 if is_dir:
383 cmd = "rm -rf %s && mkdir %s"
mbligh5a0ca532009-08-03 16:44:34 +0000384 cmd %= (dest, dest)
jadmanskid7b79ed2009-01-07 17:19:48 +0000385 self.run(cmd)
jadmanskica7da372008-10-21 16:26:52 +0000386
jadmanski2583a432009-02-10 23:59:11 +0000387 local_sources = self._make_rsync_compatible_source(source, True)
388 if local_sources:
389 scp = self._make_scp_cmd(local_sources, remote_dest)
jadmanskid7b79ed2009-01-07 17:19:48 +0000390 try:
391 utils.run(scp)
392 except error.CmdError, e:
Simran Basi882f15b2013-10-29 14:59:34 -0700393 logging.debug('scp failed: %s', e)
jadmanskid7b79ed2009-01-07 17:19:48 +0000394 raise error.AutoservRunError(e.args[0], e.args[1])
395
jadmanskica7da372008-10-21 16:26:52 +0000396
beeps46dadc92013-11-07 14:07:10 -0800397 def ssh_ping(self, timeout=60, base_cmd='true'):
beepsadd66d32013-03-04 17:21:51 -0800398 """
399 Pings remote host via ssh.
400
401 @param timeout: Time in seconds before giving up.
402 Defaults to 60 seconds.
beeps46dadc92013-11-07 14:07:10 -0800403 @param base_cmd: The base command to run with the ssh ping.
404 Defaults to true.
beepsadd66d32013-03-04 17:21:51 -0800405 @raise AutoservSSHTimeout: If the ssh ping times out.
406 @raise AutoservSshPermissionDeniedError: If ssh ping fails due to
407 permissions.
408 @raise AutoservSshPingHostError: For other AutoservRunErrors.
409 """
jadmanskica7da372008-10-21 16:26:52 +0000410 try:
beeps46dadc92013-11-07 14:07:10 -0800411 self.run(base_cmd, timeout=timeout, connect_timeout=timeout)
jadmanskica7da372008-10-21 16:26:52 +0000412 except error.AutoservSSHTimeout:
mblighd0e94982009-07-11 00:15:18 +0000413 msg = "Host (ssh) verify timed out (timeout = %d)" % timeout
jadmanskica7da372008-10-21 16:26:52 +0000414 raise error.AutoservSSHTimeout(msg)
mbligh9d738d62009-03-09 21:17:10 +0000415 except error.AutoservSshPermissionDeniedError:
416 #let AutoservSshPermissionDeniedError be visible to the callers
417 raise
jadmanskica7da372008-10-21 16:26:52 +0000418 except error.AutoservRunError, e:
mblighc971c5f2009-06-08 16:48:54 +0000419 # convert the generic AutoservRunError into something more
420 # specific for this context
421 raise error.AutoservSshPingHostError(e.description + '\n' +
422 repr(e.result_obj))
jadmanskica7da372008-10-21 16:26:52 +0000423
424
beeps46dadc92013-11-07 14:07:10 -0800425 def is_up(self, timeout=60, base_cmd='true'):
jadmanskica7da372008-10-21 16:26:52 +0000426 """
beeps46dadc92013-11-07 14:07:10 -0800427 Check if the remote host is up by ssh-ing and running a base command.
jadmanskica7da372008-10-21 16:26:52 +0000428
beepsadd66d32013-03-04 17:21:51 -0800429 @param timeout: timeout in seconds.
beeps46dadc92013-11-07 14:07:10 -0800430 @param base_cmd: a base command to run with ssh. The default is 'true'.
beepsadd66d32013-03-04 17:21:51 -0800431 @returns True if the remote host is up before the timeout expires,
432 False otherwise.
jadmanskica7da372008-10-21 16:26:52 +0000433 """
434 try:
beeps46dadc92013-11-07 14:07:10 -0800435 self.ssh_ping(timeout=timeout, base_cmd=base_cmd)
jadmanskica7da372008-10-21 16:26:52 +0000436 except error.AutoservError:
437 return False
438 else:
439 return True
440
441
442 def wait_up(self, timeout=None):
443 """
444 Wait until the remote host is up or the timeout expires.
445
446 In fact, it will wait until an ssh connection to the remote
447 host can be established, and getty is running.
448
jadmanskic0354912010-01-12 15:57:29 +0000449 @param timeout time limit in seconds before returning even
450 if the host is not up.
jadmanskica7da372008-10-21 16:26:52 +0000451
beepsadd66d32013-03-04 17:21:51 -0800452 @returns True if the host was found to be up before the timeout expires,
453 False otherwise
jadmanskica7da372008-10-21 16:26:52 +0000454 """
455 if timeout:
beeps46dadc92013-11-07 14:07:10 -0800456 current_time = int(time.time())
457 end_time = current_time + timeout
jadmanskica7da372008-10-21 16:26:52 +0000458
beepsadd66d32013-03-04 17:21:51 -0800459 while not timeout or current_time < end_time:
460 if self.is_up(timeout=end_time - current_time):
jadmanskica7da372008-10-21 16:26:52 +0000461 try:
462 if self.are_wait_up_processes_up():
jadmanski7ebac3d2010-06-17 16:06:31 +0000463 logging.debug('Host %s is now up', self.hostname)
jadmanskica7da372008-10-21 16:26:52 +0000464 return True
465 except error.AutoservError:
466 pass
467 time.sleep(1)
beeps46dadc92013-11-07 14:07:10 -0800468 current_time = int(time.time())
jadmanskica7da372008-10-21 16:26:52 +0000469
jadmanski7ebac3d2010-06-17 16:06:31 +0000470 logging.debug('Host %s is still down after waiting %d seconds',
471 self.hostname, int(timeout + time.time() - end_time))
jadmanskica7da372008-10-21 16:26:52 +0000472 return False
473
474
jadmanskic0354912010-01-12 15:57:29 +0000475 def wait_down(self, timeout=None, warning_timer=None, old_boot_id=None):
jadmanskica7da372008-10-21 16:26:52 +0000476 """
477 Wait until the remote host is down or the timeout expires.
478
jadmanskic0354912010-01-12 15:57:29 +0000479 If old_boot_id is provided, this will wait until either the machine
480 is unpingable or self.get_boot_id() returns a value different from
481 old_boot_id. If the boot_id value has changed then the function
482 returns true under the assumption that the machine has shut down
483 and has now already come back up.
jadmanskica7da372008-10-21 16:26:52 +0000484
jadmanskic0354912010-01-12 15:57:29 +0000485 If old_boot_id is None then until the machine becomes unreachable the
486 method assumes the machine has not yet shut down.
jadmanskica7da372008-10-21 16:26:52 +0000487
beepsadd66d32013-03-04 17:21:51 -0800488 Based on this definition, the 4 possible permutations of timeout
489 and old_boot_id are:
490 1. timeout and old_boot_id: wait timeout seconds for either the
491 host to become unpingable, or the boot id
492 to change. In the latter case we've rebooted
493 and in the former case we've only shutdown,
494 but both cases return True.
495 2. only timeout: wait timeout seconds for the host to become unpingable.
496 If the host remains pingable throughout timeout seconds
497 we return False.
498 3. only old_boot_id: wait forever until either the host becomes
499 unpingable or the boot_id changes. Return true
500 when either of those conditions are met.
501 4. not timeout, not old_boot_id: wait forever till the host becomes
502 unpingable.
503
jadmanskic0354912010-01-12 15:57:29 +0000504 @param timeout Time limit in seconds before returning even
505 if the host is still up.
506 @param warning_timer Time limit in seconds that will generate
507 a warning if the host is not down yet.
508 @param old_boot_id A string containing the result of self.get_boot_id()
509 prior to the host being told to shut down. Can be None if this is
510 not available.
511
512 @returns True if the host was found to be down, False otherwise
jadmanskica7da372008-10-21 16:26:52 +0000513 """
mblighe5e3cf22010-05-27 23:33:14 +0000514 #TODO: there is currently no way to distinguish between knowing
515 #TODO: boot_id was unsupported and not knowing the boot_id.
beeps46dadc92013-11-07 14:07:10 -0800516 current_time = int(time.time())
jadmanskica7da372008-10-21 16:26:52 +0000517 if timeout:
mbligh2ed998f2009-04-08 21:03:47 +0000518 end_time = current_time + timeout
jadmanskica7da372008-10-21 16:26:52 +0000519
mbligh2ed998f2009-04-08 21:03:47 +0000520 if warning_timer:
521 warn_time = current_time + warning_timer
522
jadmanskic0354912010-01-12 15:57:29 +0000523 if old_boot_id is not None:
524 logging.debug('Host %s pre-shutdown boot_id is %s',
525 self.hostname, old_boot_id)
526
beepsadd66d32013-03-04 17:21:51 -0800527 # Impose semi real-time deadline constraints, since some clients
528 # (eg: watchdog timer tests) expect strict checking of time elapsed.
529 # Each iteration of this loop is treated as though it atomically
530 # completes within current_time, this is needed because if we used
531 # inline time.time() calls instead then the following could happen:
532 #
533 # while not timeout or time.time() < end_time: [23 < 30]
534 # some code. [takes 10 secs]
535 # try:
536 # new_boot_id = self.get_boot_id(timeout=end_time - time.time())
537 # [30 - 33]
538 # The last step will lead to a return True, when in fact the machine
539 # went down at 32 seconds (>30). Hence we need to pass get_boot_id
540 # the same time that allowed us into that iteration of the loop.
mbligh2ed998f2009-04-08 21:03:47 +0000541 while not timeout or current_time < end_time:
jadmanskic0354912010-01-12 15:57:29 +0000542 try:
beeps46dadc92013-11-07 14:07:10 -0800543 new_boot_id = self.get_boot_id(timeout=end_time-current_time)
mblighdbc7e4a2010-01-15 20:34:20 +0000544 except error.AutoservError:
jadmanskic0354912010-01-12 15:57:29 +0000545 logging.debug('Host %s is now unreachable over ssh, is down',
546 self.hostname)
jadmanskica7da372008-10-21 16:26:52 +0000547 return True
jadmanskic0354912010-01-12 15:57:29 +0000548 else:
549 # if the machine is up but the boot_id value has changed from
550 # old boot id, then we can assume the machine has gone down
551 # and then already come back up
552 if old_boot_id is not None and old_boot_id != new_boot_id:
553 logging.debug('Host %s now has boot_id %s and so must '
554 'have rebooted', self.hostname, new_boot_id)
555 return True
mbligh2ed998f2009-04-08 21:03:47 +0000556
557 if warning_timer and current_time > warn_time:
Scott Zawalskic86fdeb2013-10-23 10:24:04 -0400558 self.record("INFO", None, "shutdown",
mbligh2ed998f2009-04-08 21:03:47 +0000559 "Shutdown took longer than %ds" % warning_timer)
560 # Print the warning only once.
561 warning_timer = None
mbligha4464402009-04-17 20:13:41 +0000562 # If a machine is stuck switching runlevels
563 # This may cause the machine to reboot.
564 self.run('kill -HUP 1', ignore_status=True)
mbligh2ed998f2009-04-08 21:03:47 +0000565
jadmanskica7da372008-10-21 16:26:52 +0000566 time.sleep(1)
beeps46dadc92013-11-07 14:07:10 -0800567 current_time = int(time.time())
jadmanskica7da372008-10-21 16:26:52 +0000568
569 return False
jadmanskif6562912008-10-21 17:59:01 +0000570
mbligha0a27592009-01-24 01:41:36 +0000571
jadmanskif6562912008-10-21 17:59:01 +0000572 # tunable constants for the verify & repair code
mblighb86bfa12010-02-12 20:22:21 +0000573 AUTOTEST_GB_DISKSPACE_REQUIRED = get_value("SERVER",
574 "gb_diskspace_required",
Fang Deng6b05f5b2013-03-20 13:42:11 -0700575 type=float,
576 default=20.0)
mbligha0a27592009-01-24 01:41:36 +0000577
jadmanskif6562912008-10-21 17:59:01 +0000578
showardca572982009-09-18 21:20:01 +0000579 def verify_connectivity(self):
580 super(AbstractSSHHost, self).verify_connectivity()
jadmanskif6562912008-10-21 17:59:01 +0000581
showardb18134f2009-03-20 20:52:18 +0000582 logging.info('Pinging host ' + self.hostname)
jadmanskif6562912008-10-21 17:59:01 +0000583 self.ssh_ping()
mbligh2ba7ab02009-08-24 22:09:26 +0000584 logging.info("Host (ssh) %s is alive", self.hostname)
jadmanskif6562912008-10-21 17:59:01 +0000585
jadmanski80deb752009-01-21 17:14:16 +0000586 if self.is_shutting_down():
mblighc971c5f2009-06-08 16:48:54 +0000587 raise error.AutoservHostIsShuttingDownError("Host is shutting down")
jadmanski80deb752009-01-21 17:14:16 +0000588
mblighb49b5232009-02-12 21:54:49 +0000589
showardca572982009-09-18 21:20:01 +0000590 def verify_software(self):
591 super(AbstractSSHHost, self).verify_software()
jadmanskif6562912008-10-21 17:59:01 +0000592 try:
showardad812bf2009-10-20 23:49:56 +0000593 self.check_diskspace(autotest.Autotest.get_install_dir(self),
594 self.AUTOTEST_GB_DISKSPACE_REQUIRED)
jadmanskif6562912008-10-21 17:59:01 +0000595 except error.AutoservHostError:
596 raise # only want to raise if it's a space issue
showardad812bf2009-10-20 23:49:56 +0000597 except autotest.AutodirNotFoundError:
showardca572982009-09-18 21:20:01 +0000598 # autotest dir may not exist, etc. ignore
599 logging.debug('autodir space check exception, this is probably '
600 'safe to ignore\n' + traceback.format_exc())
mblighefccc1b2010-01-11 19:08:42 +0000601
602
603 def close(self):
604 super(AbstractSSHHost, self).close()
605 self._cleanup_master_ssh()
Fang Deng3af66202013-08-16 15:19:25 -0700606 os.remove(self.known_hosts_file)
mblighefccc1b2010-01-11 19:08:42 +0000607
608
609 def _cleanup_master_ssh(self):
610 """
611 Release all resources (process, temporary directory) used by an active
612 master SSH connection.
613 """
614 # If a master SSH connection is running, kill it.
615 if self.master_ssh_job is not None:
Aviv Keshet46250752013-08-27 15:52:06 -0700616 logging.debug('Nuking master_ssh_job.')
mblighefccc1b2010-01-11 19:08:42 +0000617 utils.nuke_subprocess(self.master_ssh_job.sp)
618 self.master_ssh_job = None
619
620 # Remove the temporary directory for the master SSH socket.
621 if self.master_ssh_tempdir is not None:
Aviv Keshet46250752013-08-27 15:52:06 -0700622 logging.debug('Cleaning master_ssh_tempdir.')
mblighefccc1b2010-01-11 19:08:42 +0000623 self.master_ssh_tempdir.clean()
624 self.master_ssh_tempdir = None
625 self.master_ssh_option = ''
626
627
def start_master_ssh(self, timeout=5):
    """
    Ensure a master SSH connection is running, if that feature is enabled.

    Called whenever a slave SSH connection needs to be initiated (e.g., by
    run, rsync, scp). A master connection that is no longer usable (its
    socket file is missing or its process has exited, e.g. after a
    reboot) is cleaned up first; then, if no master connection is active,
    a new one is started in the background.

    @param timeout: Seconds (default 5) to wait for the master ssh
            connection's socket file to appear. If the timeout is
            reached, an info-level message is logged and no other action
            is taken.
    """
    if not enable_master_ssh:
        return

    # A previously started master that has gone away must be cleaned up
    # before a replacement can be started.
    job = self.master_ssh_job
    if job is not None:
        old_socket = os.path.join(self.master_ssh_tempdir.name, 'socket')
        master_is_down = (not os.path.exists(old_socket) or
                          job.sp.poll() is not None)
        if master_is_down:
            logging.info("Master ssh connection to %s is down.",
                         self.hostname)
            self._cleanup_master_ssh()

    # A live master is still around; nothing more to do.
    if self.master_ssh_job is not None:
        return

    # Put the shared control socket in a fresh temporary directory.
    self.master_ssh_tempdir = autotemp.tempdir(unique_id='ssh-master')
    self.master_ssh_option = ("-o ControlPath=%s/socket" %
                              self.master_ssh_tempdir.name)

    # Launch the master connection in the background.
    master_cmd = self.ssh_command(options="-N -o ControlMaster=yes")
    logging.info("Starting master ssh connection '%s'", master_cmd)
    self.master_ssh_job = utils.BgJob(master_cmd,
                                      nickname='master-ssh',
                                      no_pipes=True)

    # Avoid a race between the master connection starting up and its
    # first use: poll until the socket file exists or time runs out.
    new_socket = os.path.join(self.master_ssh_tempdir.name, 'socket')
    deadline = time.time() + timeout
    while time.time() < deadline:
        if os.path.exists(new_socket):
            return
        time.sleep(.2)
    logging.info('Timed out waiting for master-ssh connection '
                 'to be established.')
mbligh0a883702010-04-21 01:58:34 +0000679
680
def clear_known_hosts(self):
    """Clears out the temporary ssh known_hosts file.

    This is useful if the test SSHes to the machine, then reinstalls it,
    then SSHes to it again. It can be called after the reinstall to
    reduce the spam in the logs.
    """
    logging.info("Clearing known hosts for host '%s', file '%s'.",
                 self.hostname, self.known_hosts_file)
    # Opening the file for writing truncates it; the with block guarantees
    # the handle is closed again.
    with open(self.known_hosts_file, "w"):
        pass
Prashanth B98509c72014-04-04 16:01:34 -0700693
694
def collect_logs(self, remote_src_dir, local_dest_dir, ignore_errors=True):
    """Copy log directories from a host to a local directory.

    @param remote_src_dir: A source directory on the host.
    @param local_dest_dir: A path to a local destination directory.
        If it doesn't exist it will be created.
    @param ignore_errors: If True, ignore exceptions.

    @raises OSError: If there were problems creating the local_dest_dir and
        ignore_errors is False.
    @raises AutoservRunError, AutotestRunError, AutoservSSHTimeout: If
        something goes wrong while copying the directories and
        ignore_errors is False.
    """
    locally_created_dest = False
    # isdir() is already False for a path that does not exist, so one
    # check covers both "missing" and "exists but is not a directory".
    if not os.path.isdir(local_dest_dir):
        try:
            os.makedirs(local_dest_dir)
            locally_created_dest = True
        except OSError as e:
            logging.warning('Unable to collect logs from host '
                            '%s: %s', self.hostname, e)
            if not ignore_errors:
                raise
            return
    try:
        self.get_file(
                remote_src_dir, local_dest_dir, preserve_symlinks=True)
    except (error.AutotestRunError, error.AutoservRunError,
            error.AutoservSSHTimeout) as e:
        logging.warning('Collection of %s to local dir %s from host %s '
                        'failed: %s', remote_src_dir, local_dest_dir,
                        self.hostname, e)
        if locally_created_dest:
            # Only remove a directory this call created. Cleanup is
            # best-effort so that a failure here cannot replace the copy
            # error that is re-raised below.
            shutil.rmtree(local_dest_dir, ignore_errors=True)
        if not ignore_errors:
            raise