blob: 4854d9e36456a239c0faa6f2d88cf9f25a26b123 [file] [log] [blame]
Marc Herbert21eb6492015-11-13 15:48:53 -08001import os, time, socket, shutil, glob, logging, traceback, tempfile, re
Cheng-Yi Chianga155e7e2015-08-20 20:42:04 +08002import subprocess
3
Simran Basi3b858a22015-03-17 16:23:24 -07004from multiprocessing import Lock
Aviv Keshet53a216a2013-08-27 13:58:46 -07005from autotest_lib.client.common_lib import autotemp, error
jadmanski31c49b72008-10-27 20:44:48 +00006from autotest_lib.server import utils, autotest
mblighe8b93af2009-01-30 00:45:53 +00007from autotest_lib.server.hosts import remote
Roshan Pius58e5dd32015-10-16 15:16:42 -07008from autotest_lib.server.hosts import rpc_server_tracker
mblighefccc1b2010-01-11 19:08:42 +00009from autotest_lib.client.common_lib.global_config import global_config
jadmanskica7da372008-10-21 16:26:52 +000010
Aviv Keshet53a216a2013-08-27 13:58:46 -070011# pylint: disable-msg=C0111
jadmanskica7da372008-10-21 16:26:52 +000012
mblighb86bfa12010-02-12 20:22:21 +000013get_value = global_config.get_config_value
14enable_master_ssh = get_value('AUTOSERV', 'enable_master_ssh', type=bool,
15 default=False)
mblighefccc1b2010-01-11 19:08:42 +000016
17
Fang Deng96667ca2013-08-01 17:46:18 -070018class AbstractSSHHost(remote.RemoteHost):
mblighbc9402b2009-12-29 01:15:34 +000019 """
20 This class represents a generic implementation of most of the
jadmanskica7da372008-10-21 16:26:52 +000021 framework necessary for controlling a host via ssh. It implements
22 almost all of the abstract Host methods, except for the core
mblighbc9402b2009-12-29 01:15:34 +000023 Host.run method.
24 """
Simran Basi5ace6f22016-01-06 17:30:44 -080025 VERSION_PREFIX = ''
jadmanskica7da372008-10-21 16:26:52 +000026
jadmanskif6562912008-10-21 17:59:01 +000027 def _initialize(self, hostname, user="root", port=22, password="",
Simran Basi1bf60eb2015-12-01 16:39:29 -080028 is_client_install_supported=True, host_attributes={},
29 *args, **dargs):
jadmanskif6562912008-10-21 17:59:01 +000030 super(AbstractSSHHost, self)._initialize(hostname=hostname,
31 *args, **dargs)
Dan Shic07b8932014-12-11 15:22:30 -080032 # IP address is retrieved only on demand. Otherwise the host
33 # initialization will fail for host is not online.
34 self._ip = None
jadmanskica7da372008-10-21 16:26:52 +000035 self.user = user
36 self.port = port
37 self.password = password
Roshan Piusa58163a2015-10-14 13:36:29 -070038 self._is_client_install_supported = is_client_install_supported
showard6eafb492010-01-15 20:29:06 +000039 self._use_rsync = None
Fang Deng3af66202013-08-16 15:19:25 -070040 self.known_hosts_file = tempfile.mkstemp()[1]
Roshan Pius58e5dd32015-10-16 15:16:42 -070041 self._rpc_server_tracker = rpc_server_tracker.RpcServerTracker(self);
jadmanskica7da372008-10-21 16:26:52 +000042
mblighefccc1b2010-01-11 19:08:42 +000043 """
44 Master SSH connection background job, socket temp directory and socket
45 control path option. If master-SSH is enabled, these fields will be
46 initialized by start_master_ssh when a new SSH connection is initiated.
47 """
48 self.master_ssh_job = None
49 self.master_ssh_tempdir = None
50 self.master_ssh_option = ''
51
Simran Basi3b858a22015-03-17 16:23:24 -070052 # Create a Lock to protect against race conditions.
53 self._lock = Lock()
54
Simran Basi1bf60eb2015-12-01 16:39:29 -080055 self.host_attributes = host_attributes
56
showard6eafb492010-01-15 20:29:06 +000057
Dan Shic07b8932014-12-11 15:22:30 -080058 @property
59 def ip(self):
60 """@return IP address of the host.
61 """
62 if not self._ip:
63 self._ip = socket.getaddrinfo(self.hostname, None)[0][4][0]
64 return self._ip
65
66
Roshan Piusa58163a2015-10-14 13:36:29 -070067 @property
68 def is_client_install_supported(self):
69 """"
70 Returns True if the host supports autotest client installs, False
71 otherwise.
72 """
73 return self._is_client_install_supported
74
75
Roshan Pius58e5dd32015-10-16 15:16:42 -070076 @property
77 def rpc_server_tracker(self):
78 """"
79 @return The RPC server tracker associated with this host.
80 """
81 return self._rpc_server_tracker
82
83
Fang Deng96667ca2013-08-01 17:46:18 -070084 def make_ssh_command(self, user="root", port=22, opts='',
85 hosts_file='/dev/null',
86 connect_timeout=30, alive_interval=300):
87 base_command = ("/usr/bin/ssh -a -x %s -o StrictHostKeyChecking=no "
88 "-o UserKnownHostsFile=%s -o BatchMode=yes "
89 "-o ConnectTimeout=%d -o ServerAliveInterval=%d "
90 "-l %s -p %d")
91 assert isinstance(connect_timeout, (int, long))
92 assert connect_timeout > 0 # can't disable the timeout
93 return base_command % (opts, hosts_file, connect_timeout,
94 alive_interval, user, port)
95
96
showard6eafb492010-01-15 20:29:06 +000097 def use_rsync(self):
98 if self._use_rsync is not None:
99 return self._use_rsync
100
mblighc9892c02010-01-06 19:02:16 +0000101 # Check if rsync is available on the remote host. If it's not,
102 # don't try to use it for any future file transfers.
showard6eafb492010-01-15 20:29:06 +0000103 self._use_rsync = self._check_rsync()
104 if not self._use_rsync:
Ilja H. Friedel04be2bd2014-05-07 21:29:59 -0700105 logging.warning("rsync not available on remote host %s -- disabled",
mblighc9892c02010-01-06 19:02:16 +0000106 self.hostname)
Eric Lie0493a42010-11-15 13:05:43 -0800107 return self._use_rsync
mblighc9892c02010-01-06 19:02:16 +0000108
109
110 def _check_rsync(self):
111 """
112 Check if rsync is available on the remote host.
113 """
114 try:
115 self.run("rsync --version", stdout_tee=None, stderr_tee=None)
116 except error.AutoservRunError:
117 return False
118 return True
119
jadmanskica7da372008-10-21 16:26:52 +0000120
showard56176ec2009-10-28 19:52:30 +0000121 def _encode_remote_paths(self, paths, escape=True):
mblighbc9402b2009-12-29 01:15:34 +0000122 """
123 Given a list of file paths, encodes it as a single remote path, in
124 the style used by rsync and scp.
125 """
showard56176ec2009-10-28 19:52:30 +0000126 if escape:
127 paths = [utils.scp_remote_escape(path) for path in paths]
Marc Herbert21eb6492015-11-13 15:48:53 -0800128
129 remote = self.hostname
130
131 # rsync and scp require IPv6 brackets, even when there isn't any
132 # trailing port number (ssh doesn't support IPv6 brackets).
133 # In the Python >= 3.3 future, 'import ipaddress' will parse addresses.
134 if re.search(r':.*:', remote):
135 remote = '[%s]' % remote
136
137 return '%s@%s:"%s"' % (self.user, remote, " ".join(paths))
jadmanskica7da372008-10-21 16:26:52 +0000138
jadmanskica7da372008-10-21 16:26:52 +0000139
mbligh45561782009-05-11 21:14:34 +0000140 def _make_rsync_cmd(self, sources, dest, delete_dest, preserve_symlinks):
mblighbc9402b2009-12-29 01:15:34 +0000141 """
142 Given a list of source paths and a destination path, produces the
jadmanskid7b79ed2009-01-07 17:19:48 +0000143 appropriate rsync command for copying them. Remote paths must be
mblighbc9402b2009-12-29 01:15:34 +0000144 pre-encoded.
145 """
Fang Deng96667ca2013-08-01 17:46:18 -0700146 ssh_cmd = self.make_ssh_command(user=self.user, port=self.port,
147 opts=self.master_ssh_option,
148 hosts_file=self.known_hosts_file)
jadmanskid7b79ed2009-01-07 17:19:48 +0000149 if delete_dest:
150 delete_flag = "--delete"
151 else:
152 delete_flag = ""
mbligh45561782009-05-11 21:14:34 +0000153 if preserve_symlinks:
154 symlink_flag = ""
155 else:
156 symlink_flag = "-L"
Dan Shi06d7fbf2014-02-12 12:34:41 -0800157 command = ("rsync %s %s --timeout=1800 --rsh='%s' -az --no-o --no-g "
David Hendricksb8904182014-06-02 15:22:49 -0700158 "%s \"%s\"")
mbligh45561782009-05-11 21:14:34 +0000159 return command % (symlink_flag, delete_flag, ssh_cmd,
David Hendricksb8904182014-06-02 15:22:49 -0700160 " ".join(['"%s"' % p for p in sources]), dest)
jadmanskid7b79ed2009-01-07 17:19:48 +0000161
162
Eric Li861b2d52011-02-04 14:50:35 -0800163 def _make_ssh_cmd(self, cmd):
164 """
165 Create a base ssh command string for the host which can be used
166 to run commands directly on the machine
167 """
Fang Deng96667ca2013-08-01 17:46:18 -0700168 base_cmd = self.make_ssh_command(user=self.user, port=self.port,
169 opts=self.master_ssh_option,
170 hosts_file=self.known_hosts_file)
Eric Li861b2d52011-02-04 14:50:35 -0800171
172 return '%s %s "%s"' % (base_cmd, self.hostname, utils.sh_escape(cmd))
173
jadmanskid7b79ed2009-01-07 17:19:48 +0000174 def _make_scp_cmd(self, sources, dest):
mblighbc9402b2009-12-29 01:15:34 +0000175 """
176 Given a list of source paths and a destination path, produces the
jadmanskid7b79ed2009-01-07 17:19:48 +0000177 appropriate scp command for encoding it. Remote paths must be
mblighbc9402b2009-12-29 01:15:34 +0000178 pre-encoded.
179 """
mblighc0649d62010-01-15 18:15:58 +0000180 command = ("scp -rq %s -o StrictHostKeyChecking=no "
lmraf676f32010-02-04 03:36:26 +0000181 "-o UserKnownHostsFile=%s -P %d %s '%s'")
Fang Deng3af66202013-08-16 15:19:25 -0700182 return command % (self.master_ssh_option, self.known_hosts_file,
mblighefccc1b2010-01-11 19:08:42 +0000183 self.port, " ".join(sources), dest)
jadmanskid7b79ed2009-01-07 17:19:48 +0000184
185
186 def _make_rsync_compatible_globs(self, path, is_local):
mblighbc9402b2009-12-29 01:15:34 +0000187 """
188 Given an rsync-style path, returns a list of globbed paths
jadmanskid7b79ed2009-01-07 17:19:48 +0000189 that will hopefully provide equivalent behaviour for scp. Does not
190 support the full range of rsync pattern matching behaviour, only that
191 exposed in the get/send_file interface (trailing slashes).
192
193 The is_local param is flag indicating if the paths should be
mblighbc9402b2009-12-29 01:15:34 +0000194 interpreted as local or remote paths.
195 """
jadmanskid7b79ed2009-01-07 17:19:48 +0000196
197 # non-trailing slash paths should just work
198 if len(path) == 0 or path[-1] != "/":
199 return [path]
200
201 # make a function to test if a pattern matches any files
202 if is_local:
showard56176ec2009-10-28 19:52:30 +0000203 def glob_matches_files(path, pattern):
204 return len(glob.glob(path + pattern)) > 0
jadmanskid7b79ed2009-01-07 17:19:48 +0000205 else:
showard56176ec2009-10-28 19:52:30 +0000206 def glob_matches_files(path, pattern):
207 result = self.run("ls \"%s\"%s" % (utils.sh_escape(path),
208 pattern),
209 stdout_tee=None, ignore_status=True)
jadmanskid7b79ed2009-01-07 17:19:48 +0000210 return result.exit_status == 0
211
212 # take a set of globs that cover all files, and see which are needed
213 patterns = ["*", ".[!.]*"]
showard56176ec2009-10-28 19:52:30 +0000214 patterns = [p for p in patterns if glob_matches_files(path, p)]
jadmanskid7b79ed2009-01-07 17:19:48 +0000215
216 # convert them into a set of paths suitable for the commandline
jadmanskid7b79ed2009-01-07 17:19:48 +0000217 if is_local:
showard56176ec2009-10-28 19:52:30 +0000218 return ["\"%s\"%s" % (utils.sh_escape(path), pattern)
219 for pattern in patterns]
jadmanskid7b79ed2009-01-07 17:19:48 +0000220 else:
showard56176ec2009-10-28 19:52:30 +0000221 return [utils.scp_remote_escape(path) + pattern
222 for pattern in patterns]
jadmanskid7b79ed2009-01-07 17:19:48 +0000223
224
225 def _make_rsync_compatible_source(self, source, is_local):
mblighbc9402b2009-12-29 01:15:34 +0000226 """
227 Applies the same logic as _make_rsync_compatible_globs, but
jadmanskid7b79ed2009-01-07 17:19:48 +0000228 applies it to an entire list of sources, producing a new list of
mblighbc9402b2009-12-29 01:15:34 +0000229 sources, properly quoted.
230 """
jadmanskid7b79ed2009-01-07 17:19:48 +0000231 return sum((self._make_rsync_compatible_globs(path, is_local)
232 for path in source), [])
jadmanskica7da372008-10-21 16:26:52 +0000233
234
mblighfeac0102009-04-28 18:31:12 +0000235 def _set_umask_perms(self, dest):
mblighbc9402b2009-12-29 01:15:34 +0000236 """
237 Given a destination file/dir (recursively) set the permissions on
238 all the files and directories to the max allowed by running umask.
239 """
mblighfeac0102009-04-28 18:31:12 +0000240
241 # now this looks strange but I haven't found a way in Python to _just_
242 # get the umask, apparently the only option is to try to set it
243 umask = os.umask(0)
244 os.umask(umask)
245
246 max_privs = 0777 & ~umask
247
248 def set_file_privs(filename):
Chris Masone567d0d92011-12-19 09:38:30 -0800249 """Sets mode of |filename|. Assumes |filename| exists."""
250 file_stat = os.stat(filename)
mblighfeac0102009-04-28 18:31:12 +0000251
252 file_privs = max_privs
253 # if the original file permissions do not have at least one
254 # executable bit then do not set it anywhere
255 if not file_stat.st_mode & 0111:
256 file_privs &= ~0111
257
258 os.chmod(filename, file_privs)
259
260 # try a bottom-up walk so changes on directory permissions won't cut
261 # our access to the files/directories inside it
262 for root, dirs, files in os.walk(dest, topdown=False):
263 # when setting the privileges we emulate the chmod "X" behaviour
264 # that sets to execute only if it is a directory or any of the
265 # owner/group/other already has execute right
266 for dirname in dirs:
267 os.chmod(os.path.join(root, dirname), max_privs)
268
Chris Masone567d0d92011-12-19 09:38:30 -0800269 # Filter out broken symlinks as we go.
270 for filename in filter(os.path.exists, files):
mblighfeac0102009-04-28 18:31:12 +0000271 set_file_privs(os.path.join(root, filename))
272
273
274 # now set privs for the dest itself
275 if os.path.isdir(dest):
276 os.chmod(dest, max_privs)
277 else:
278 set_file_privs(dest)
279
280
mbligh45561782009-05-11 21:14:34 +0000281 def get_file(self, source, dest, delete_dest=False, preserve_perm=True,
282 preserve_symlinks=False):
jadmanskica7da372008-10-21 16:26:52 +0000283 """
284 Copy files from the remote host to a local path.
285
286 Directories will be copied recursively.
287 If a source component is a directory with a trailing slash,
288 the content of the directory will be copied, otherwise, the
289 directory itself and its content will be copied. This
290 behavior is similar to that of the program 'rsync'.
291
292 Args:
293 source: either
294 1) a single file or directory, as a string
295 2) a list of one or more (possibly mixed)
296 files or directories
297 dest: a file or a directory (if source contains a
298 directory or more than one element, you must
299 supply a directory dest)
mbligh89e258d2008-10-24 13:58:08 +0000300 delete_dest: if this is true, the command will also clear
301 out any old files at dest that are not in the
302 source
mblighfeac0102009-04-28 18:31:12 +0000303 preserve_perm: tells get_file() to try to preserve the sources
304 permissions on files and dirs
mbligh45561782009-05-11 21:14:34 +0000305 preserve_symlinks: try to preserve symlinks instead of
306 transforming them into files/dirs on copy
jadmanskica7da372008-10-21 16:26:52 +0000307
308 Raises:
309 AutoservRunError: the scp command failed
310 """
Simran Basi882f15b2013-10-29 14:59:34 -0700311 logging.debug('get_file. source: %s, dest: %s, delete_dest: %s,'
312 'preserve_perm: %s, preserve_symlinks:%s', source, dest,
313 delete_dest, preserve_perm, preserve_symlinks)
mblighefccc1b2010-01-11 19:08:42 +0000314 # Start a master SSH connection if necessary.
315 self.start_master_ssh()
316
jadmanskica7da372008-10-21 16:26:52 +0000317 if isinstance(source, basestring):
318 source = [source]
jadmanskid7b79ed2009-01-07 17:19:48 +0000319 dest = os.path.abspath(dest)
jadmanskica7da372008-10-21 16:26:52 +0000320
mblighc9892c02010-01-06 19:02:16 +0000321 # If rsync is disabled or fails, try scp.
showard6eafb492010-01-15 20:29:06 +0000322 try_scp = True
323 if self.use_rsync():
Simran Basi882f15b2013-10-29 14:59:34 -0700324 logging.debug('Using Rsync.')
mblighc9892c02010-01-06 19:02:16 +0000325 try:
326 remote_source = self._encode_remote_paths(source)
327 local_dest = utils.sh_escape(dest)
328 rsync = self._make_rsync_cmd([remote_source], local_dest,
329 delete_dest, preserve_symlinks)
330 utils.run(rsync)
showard6eafb492010-01-15 20:29:06 +0000331 try_scp = False
mblighc9892c02010-01-06 19:02:16 +0000332 except error.CmdError, e:
Ilja H. Friedel04be2bd2014-05-07 21:29:59 -0700333 logging.warning("trying scp, rsync failed: %s", e)
mblighc9892c02010-01-06 19:02:16 +0000334
335 if try_scp:
Simran Basi882f15b2013-10-29 14:59:34 -0700336 logging.debug('Trying scp.')
jadmanskid7b79ed2009-01-07 17:19:48 +0000337 # scp has no equivalent to --delete, just drop the entire dest dir
338 if delete_dest and os.path.isdir(dest):
339 shutil.rmtree(dest)
340 os.mkdir(dest)
jadmanskica7da372008-10-21 16:26:52 +0000341
jadmanskid7b79ed2009-01-07 17:19:48 +0000342 remote_source = self._make_rsync_compatible_source(source, False)
343 if remote_source:
showard56176ec2009-10-28 19:52:30 +0000344 # _make_rsync_compatible_source() already did the escaping
345 remote_source = self._encode_remote_paths(remote_source,
346 escape=False)
jadmanskid7b79ed2009-01-07 17:19:48 +0000347 local_dest = utils.sh_escape(dest)
jadmanski2583a432009-02-10 23:59:11 +0000348 scp = self._make_scp_cmd([remote_source], local_dest)
jadmanskid7b79ed2009-01-07 17:19:48 +0000349 try:
350 utils.run(scp)
351 except error.CmdError, e:
Simran Basi882f15b2013-10-29 14:59:34 -0700352 logging.debug('scp failed: %s', e)
jadmanskid7b79ed2009-01-07 17:19:48 +0000353 raise error.AutoservRunError(e.args[0], e.args[1])
jadmanskica7da372008-10-21 16:26:52 +0000354
mblighfeac0102009-04-28 18:31:12 +0000355 if not preserve_perm:
356 # we have no way to tell scp to not try to preserve the
357 # permissions so set them after copy instead.
358 # for rsync we could use "--no-p --chmod=ugo=rwX" but those
359 # options are only in very recent rsync versions
360 self._set_umask_perms(dest)
361
jadmanskica7da372008-10-21 16:26:52 +0000362
mbligh45561782009-05-11 21:14:34 +0000363 def send_file(self, source, dest, delete_dest=False,
364 preserve_symlinks=False):
jadmanskica7da372008-10-21 16:26:52 +0000365 """
366 Copy files from a local path to the remote host.
367
368 Directories will be copied recursively.
369 If a source component is a directory with a trailing slash,
370 the content of the directory will be copied, otherwise, the
371 directory itself and its content will be copied. This
372 behavior is similar to that of the program 'rsync'.
373
374 Args:
375 source: either
376 1) a single file or directory, as a string
377 2) a list of one or more (possibly mixed)
378 files or directories
379 dest: a file or a directory (if source contains a
380 directory or more than one element, you must
381 supply a directory dest)
mbligh89e258d2008-10-24 13:58:08 +0000382 delete_dest: if this is true, the command will also clear
383 out any old files at dest that are not in the
384 source
mbligh45561782009-05-11 21:14:34 +0000385 preserve_symlinks: controls if symlinks on the source will be
386 copied as such on the destination or transformed into the
387 referenced file/directory
jadmanskica7da372008-10-21 16:26:52 +0000388
389 Raises:
390 AutoservRunError: the scp command failed
391 """
Simran Basi882f15b2013-10-29 14:59:34 -0700392 logging.debug('send_file. source: %s, dest: %s, delete_dest: %s,'
393 'preserve_symlinks:%s', source, dest,
394 delete_dest, preserve_symlinks)
mblighefccc1b2010-01-11 19:08:42 +0000395 # Start a master SSH connection if necessary.
396 self.start_master_ssh()
397
jadmanskica7da372008-10-21 16:26:52 +0000398 if isinstance(source, basestring):
399 source = [source]
jadmanski2583a432009-02-10 23:59:11 +0000400 remote_dest = self._encode_remote_paths([dest])
jadmanskica7da372008-10-21 16:26:52 +0000401
mukesh agrawal0d3616c2015-07-17 15:47:36 -0700402 local_sources = [utils.sh_escape(path) for path in source]
403 if not local_sources:
404 raise error.TestError('source |%s| yielded an empty list' % (
405 source))
406 if any([local_source.find('\x00') != -1 for
407 local_source in local_sources]):
408 raise error.TestError('one or more sources include NUL char')
409
mblighc9892c02010-01-06 19:02:16 +0000410 # If rsync is disabled or fails, try scp.
showard6eafb492010-01-15 20:29:06 +0000411 try_scp = True
412 if self.use_rsync():
Simran Basi882f15b2013-10-29 14:59:34 -0700413 logging.debug('Using Rsync.')
mblighc9892c02010-01-06 19:02:16 +0000414 try:
mblighc9892c02010-01-06 19:02:16 +0000415 rsync = self._make_rsync_cmd(local_sources, remote_dest,
416 delete_dest, preserve_symlinks)
417 utils.run(rsync)
showard6eafb492010-01-15 20:29:06 +0000418 try_scp = False
mblighc9892c02010-01-06 19:02:16 +0000419 except error.CmdError, e:
Ilja H. Friedel04be2bd2014-05-07 21:29:59 -0700420 logging.warning("trying scp, rsync failed: %s", e)
mblighc9892c02010-01-06 19:02:16 +0000421
422 if try_scp:
Simran Basi882f15b2013-10-29 14:59:34 -0700423 logging.debug('Trying scp.')
jadmanskid7b79ed2009-01-07 17:19:48 +0000424 # scp has no equivalent to --delete, just drop the entire dest dir
425 if delete_dest:
showard27160152009-07-15 14:28:42 +0000426 is_dir = self.run("ls -d %s/" % dest,
jadmanskid7b79ed2009-01-07 17:19:48 +0000427 ignore_status=True).exit_status == 0
428 if is_dir:
429 cmd = "rm -rf %s && mkdir %s"
mbligh5a0ca532009-08-03 16:44:34 +0000430 cmd %= (dest, dest)
jadmanskid7b79ed2009-01-07 17:19:48 +0000431 self.run(cmd)
jadmanskica7da372008-10-21 16:26:52 +0000432
jadmanski2583a432009-02-10 23:59:11 +0000433 local_sources = self._make_rsync_compatible_source(source, True)
434 if local_sources:
435 scp = self._make_scp_cmd(local_sources, remote_dest)
jadmanskid7b79ed2009-01-07 17:19:48 +0000436 try:
437 utils.run(scp)
438 except error.CmdError, e:
Simran Basi882f15b2013-10-29 14:59:34 -0700439 logging.debug('scp failed: %s', e)
jadmanskid7b79ed2009-01-07 17:19:48 +0000440 raise error.AutoservRunError(e.args[0], e.args[1])
mukesh agrawal0d3616c2015-07-17 15:47:36 -0700441 else:
442 logging.debug('skipping scp for empty source list')
jadmanskid7b79ed2009-01-07 17:19:48 +0000443
jadmanskica7da372008-10-21 16:26:52 +0000444
Simran Basi1621c632015-10-14 12:22:23 -0700445 def verify_ssh_user_access(self):
446 """Verify ssh access to this host.
447
448 @returns False if ssh_ping fails due to Permissions error, True
449 otherwise.
450 """
451 try:
452 self.ssh_ping()
453 except (error.AutoservSshPermissionDeniedError,
454 error.AutoservSshPingHostError):
455 return False
456 return True
457
458
beeps46dadc92013-11-07 14:07:10 -0800459 def ssh_ping(self, timeout=60, base_cmd='true'):
beepsadd66d32013-03-04 17:21:51 -0800460 """
461 Pings remote host via ssh.
462
463 @param timeout: Time in seconds before giving up.
464 Defaults to 60 seconds.
beeps46dadc92013-11-07 14:07:10 -0800465 @param base_cmd: The base command to run with the ssh ping.
466 Defaults to true.
beepsadd66d32013-03-04 17:21:51 -0800467 @raise AutoservSSHTimeout: If the ssh ping times out.
468 @raise AutoservSshPermissionDeniedError: If ssh ping fails due to
469 permissions.
470 @raise AutoservSshPingHostError: For other AutoservRunErrors.
471 """
jadmanskica7da372008-10-21 16:26:52 +0000472 try:
beeps46dadc92013-11-07 14:07:10 -0800473 self.run(base_cmd, timeout=timeout, connect_timeout=timeout)
jadmanskica7da372008-10-21 16:26:52 +0000474 except error.AutoservSSHTimeout:
mblighd0e94982009-07-11 00:15:18 +0000475 msg = "Host (ssh) verify timed out (timeout = %d)" % timeout
jadmanskica7da372008-10-21 16:26:52 +0000476 raise error.AutoservSSHTimeout(msg)
mbligh9d738d62009-03-09 21:17:10 +0000477 except error.AutoservSshPermissionDeniedError:
478 #let AutoservSshPermissionDeniedError be visible to the callers
479 raise
jadmanskica7da372008-10-21 16:26:52 +0000480 except error.AutoservRunError, e:
mblighc971c5f2009-06-08 16:48:54 +0000481 # convert the generic AutoservRunError into something more
482 # specific for this context
483 raise error.AutoservSshPingHostError(e.description + '\n' +
484 repr(e.result_obj))
jadmanskica7da372008-10-21 16:26:52 +0000485
486
beeps46dadc92013-11-07 14:07:10 -0800487 def is_up(self, timeout=60, base_cmd='true'):
jadmanskica7da372008-10-21 16:26:52 +0000488 """
beeps46dadc92013-11-07 14:07:10 -0800489 Check if the remote host is up by ssh-ing and running a base command.
jadmanskica7da372008-10-21 16:26:52 +0000490
beepsadd66d32013-03-04 17:21:51 -0800491 @param timeout: timeout in seconds.
beeps46dadc92013-11-07 14:07:10 -0800492 @param base_cmd: a base command to run with ssh. The default is 'true'.
beepsadd66d32013-03-04 17:21:51 -0800493 @returns True if the remote host is up before the timeout expires,
494 False otherwise.
jadmanskica7da372008-10-21 16:26:52 +0000495 """
496 try:
beeps46dadc92013-11-07 14:07:10 -0800497 self.ssh_ping(timeout=timeout, base_cmd=base_cmd)
jadmanskica7da372008-10-21 16:26:52 +0000498 except error.AutoservError:
499 return False
500 else:
501 return True
502
503
504 def wait_up(self, timeout=None):
505 """
506 Wait until the remote host is up or the timeout expires.
507
508 In fact, it will wait until an ssh connection to the remote
509 host can be established, and getty is running.
510
jadmanskic0354912010-01-12 15:57:29 +0000511 @param timeout time limit in seconds before returning even
512 if the host is not up.
jadmanskica7da372008-10-21 16:26:52 +0000513
beepsadd66d32013-03-04 17:21:51 -0800514 @returns True if the host was found to be up before the timeout expires,
515 False otherwise
jadmanskica7da372008-10-21 16:26:52 +0000516 """
517 if timeout:
beeps46dadc92013-11-07 14:07:10 -0800518 current_time = int(time.time())
519 end_time = current_time + timeout
jadmanskica7da372008-10-21 16:26:52 +0000520
beepsadd66d32013-03-04 17:21:51 -0800521 while not timeout or current_time < end_time:
522 if self.is_up(timeout=end_time - current_time):
jadmanskica7da372008-10-21 16:26:52 +0000523 try:
524 if self.are_wait_up_processes_up():
jadmanski7ebac3d2010-06-17 16:06:31 +0000525 logging.debug('Host %s is now up', self.hostname)
jadmanskica7da372008-10-21 16:26:52 +0000526 return True
527 except error.AutoservError:
528 pass
529 time.sleep(1)
beeps46dadc92013-11-07 14:07:10 -0800530 current_time = int(time.time())
jadmanskica7da372008-10-21 16:26:52 +0000531
jadmanski7ebac3d2010-06-17 16:06:31 +0000532 logging.debug('Host %s is still down after waiting %d seconds',
533 self.hostname, int(timeout + time.time() - end_time))
jadmanskica7da372008-10-21 16:26:52 +0000534 return False
535
536
jadmanskic0354912010-01-12 15:57:29 +0000537 def wait_down(self, timeout=None, warning_timer=None, old_boot_id=None):
jadmanskica7da372008-10-21 16:26:52 +0000538 """
539 Wait until the remote host is down or the timeout expires.
540
jadmanskic0354912010-01-12 15:57:29 +0000541 If old_boot_id is provided, this will wait until either the machine
542 is unpingable or self.get_boot_id() returns a value different from
543 old_boot_id. If the boot_id value has changed then the function
544 returns true under the assumption that the machine has shut down
545 and has now already come back up.
jadmanskica7da372008-10-21 16:26:52 +0000546
jadmanskic0354912010-01-12 15:57:29 +0000547 If old_boot_id is None then until the machine becomes unreachable the
548 method assumes the machine has not yet shut down.
jadmanskica7da372008-10-21 16:26:52 +0000549
beepsadd66d32013-03-04 17:21:51 -0800550 Based on this definition, the 4 possible permutations of timeout
551 and old_boot_id are:
552 1. timeout and old_boot_id: wait timeout seconds for either the
553 host to become unpingable, or the boot id
554 to change. In the latter case we've rebooted
555 and in the former case we've only shutdown,
556 but both cases return True.
557 2. only timeout: wait timeout seconds for the host to become unpingable.
558 If the host remains pingable throughout timeout seconds
559 we return False.
560 3. only old_boot_id: wait forever until either the host becomes
561 unpingable or the boot_id changes. Return true
562 when either of those conditions are met.
563 4. not timeout, not old_boot_id: wait forever till the host becomes
564 unpingable.
565
jadmanskic0354912010-01-12 15:57:29 +0000566 @param timeout Time limit in seconds before returning even
567 if the host is still up.
568 @param warning_timer Time limit in seconds that will generate
569 a warning if the host is not down yet.
570 @param old_boot_id A string containing the result of self.get_boot_id()
571 prior to the host being told to shut down. Can be None if this is
572 not available.
573
574 @returns True if the host was found to be down, False otherwise
jadmanskica7da372008-10-21 16:26:52 +0000575 """
mblighe5e3cf22010-05-27 23:33:14 +0000576 #TODO: there is currently no way to distinguish between knowing
577 #TODO: boot_id was unsupported and not knowing the boot_id.
beeps46dadc92013-11-07 14:07:10 -0800578 current_time = int(time.time())
jadmanskica7da372008-10-21 16:26:52 +0000579 if timeout:
mbligh2ed998f2009-04-08 21:03:47 +0000580 end_time = current_time + timeout
jadmanskica7da372008-10-21 16:26:52 +0000581
mbligh2ed998f2009-04-08 21:03:47 +0000582 if warning_timer:
583 warn_time = current_time + warning_timer
584
jadmanskic0354912010-01-12 15:57:29 +0000585 if old_boot_id is not None:
586 logging.debug('Host %s pre-shutdown boot_id is %s',
587 self.hostname, old_boot_id)
588
beepsadd66d32013-03-04 17:21:51 -0800589 # Impose semi real-time deadline constraints, since some clients
590 # (eg: watchdog timer tests) expect strict checking of time elapsed.
591 # Each iteration of this loop is treated as though it atomically
592 # completes within current_time, this is needed because if we used
593 # inline time.time() calls instead then the following could happen:
594 #
595 # while not timeout or time.time() < end_time: [23 < 30]
596 # some code. [takes 10 secs]
597 # try:
598 # new_boot_id = self.get_boot_id(timeout=end_time - time.time())
599 # [30 - 33]
600 # The last step will lead to a return True, when in fact the machine
601 # went down at 32 seconds (>30). Hence we need to pass get_boot_id
602 # the same time that allowed us into that iteration of the loop.
mbligh2ed998f2009-04-08 21:03:47 +0000603 while not timeout or current_time < end_time:
jadmanskic0354912010-01-12 15:57:29 +0000604 try:
beeps46dadc92013-11-07 14:07:10 -0800605 new_boot_id = self.get_boot_id(timeout=end_time-current_time)
mblighdbc7e4a2010-01-15 20:34:20 +0000606 except error.AutoservError:
jadmanskic0354912010-01-12 15:57:29 +0000607 logging.debug('Host %s is now unreachable over ssh, is down',
608 self.hostname)
jadmanskica7da372008-10-21 16:26:52 +0000609 return True
jadmanskic0354912010-01-12 15:57:29 +0000610 else:
611 # if the machine is up but the boot_id value has changed from
612 # old boot id, then we can assume the machine has gone down
613 # and then already come back up
614 if old_boot_id is not None and old_boot_id != new_boot_id:
615 logging.debug('Host %s now has boot_id %s and so must '
616 'have rebooted', self.hostname, new_boot_id)
617 return True
mbligh2ed998f2009-04-08 21:03:47 +0000618
619 if warning_timer and current_time > warn_time:
Scott Zawalskic86fdeb2013-10-23 10:24:04 -0400620 self.record("INFO", None, "shutdown",
mbligh2ed998f2009-04-08 21:03:47 +0000621 "Shutdown took longer than %ds" % warning_timer)
622 # Print the warning only once.
623 warning_timer = None
mbligha4464402009-04-17 20:13:41 +0000624 # If a machine is stuck switching runlevels
625 # This may cause the machine to reboot.
626 self.run('kill -HUP 1', ignore_status=True)
mbligh2ed998f2009-04-08 21:03:47 +0000627
jadmanskica7da372008-10-21 16:26:52 +0000628 time.sleep(1)
beeps46dadc92013-11-07 14:07:10 -0800629 current_time = int(time.time())
jadmanskica7da372008-10-21 16:26:52 +0000630
631 return False
jadmanskif6562912008-10-21 17:59:01 +0000632
mbligha0a27592009-01-24 01:41:36 +0000633
jadmanskif6562912008-10-21 17:59:01 +0000634 # tunable constants for the verify & repair code
mblighb86bfa12010-02-12 20:22:21 +0000635 AUTOTEST_GB_DISKSPACE_REQUIRED = get_value("SERVER",
636 "gb_diskspace_required",
Fang Deng6b05f5b2013-03-20 13:42:11 -0700637 type=float,
638 default=20.0)
mbligha0a27592009-01-24 01:41:36 +0000639
jadmanskif6562912008-10-21 17:59:01 +0000640
showardca572982009-09-18 21:20:01 +0000641 def verify_connectivity(self):
642 super(AbstractSSHHost, self).verify_connectivity()
jadmanskif6562912008-10-21 17:59:01 +0000643
showardb18134f2009-03-20 20:52:18 +0000644 logging.info('Pinging host ' + self.hostname)
jadmanskif6562912008-10-21 17:59:01 +0000645 self.ssh_ping()
mbligh2ba7ab02009-08-24 22:09:26 +0000646 logging.info("Host (ssh) %s is alive", self.hostname)
jadmanskif6562912008-10-21 17:59:01 +0000647
jadmanski80deb752009-01-21 17:14:16 +0000648 if self.is_shutting_down():
mblighc971c5f2009-06-08 16:48:54 +0000649 raise error.AutoservHostIsShuttingDownError("Host is shutting down")
jadmanski80deb752009-01-21 17:14:16 +0000650
mblighb49b5232009-02-12 21:54:49 +0000651
showardca572982009-09-18 21:20:01 +0000652 def verify_software(self):
653 super(AbstractSSHHost, self).verify_software()
jadmanskif6562912008-10-21 17:59:01 +0000654 try:
showardad812bf2009-10-20 23:49:56 +0000655 self.check_diskspace(autotest.Autotest.get_install_dir(self),
656 self.AUTOTEST_GB_DISKSPACE_REQUIRED)
jadmanskif6562912008-10-21 17:59:01 +0000657 except error.AutoservHostError:
658 raise # only want to raise if it's a space issue
showardad812bf2009-10-20 23:49:56 +0000659 except autotest.AutodirNotFoundError:
showardca572982009-09-18 21:20:01 +0000660 # autotest dir may not exist, etc. ignore
661 logging.debug('autodir space check exception, this is probably '
662 'safe to ignore\n' + traceback.format_exc())
mblighefccc1b2010-01-11 19:08:42 +0000663
664
665 def close(self):
666 super(AbstractSSHHost, self).close()
667 self._cleanup_master_ssh()
Fang Deng3af66202013-08-16 15:19:25 -0700668 os.remove(self.known_hosts_file)
Roshan Pius58e5dd32015-10-16 15:16:42 -0700669 self.rpc_server_tracker.disconnect_all()
mblighefccc1b2010-01-11 19:08:42 +0000670
671
672 def _cleanup_master_ssh(self):
673 """
674 Release all resources (process, temporary directory) used by an active
675 master SSH connection.
676 """
677 # If a master SSH connection is running, kill it.
678 if self.master_ssh_job is not None:
Aviv Keshet46250752013-08-27 15:52:06 -0700679 logging.debug('Nuking master_ssh_job.')
mblighefccc1b2010-01-11 19:08:42 +0000680 utils.nuke_subprocess(self.master_ssh_job.sp)
681 self.master_ssh_job = None
682
683 # Remove the temporary directory for the master SSH socket.
684 if self.master_ssh_tempdir is not None:
Aviv Keshet46250752013-08-27 15:52:06 -0700685 logging.debug('Cleaning master_ssh_tempdir.')
mblighefccc1b2010-01-11 19:08:42 +0000686 self.master_ssh_tempdir.clean()
687 self.master_ssh_tempdir = None
688 self.master_ssh_option = ''
689
690
Aviv Keshet0749a822013-10-17 09:53:26 -0700691 def start_master_ssh(self, timeout=5):
mblighefccc1b2010-01-11 19:08:42 +0000692 """
693 Called whenever a slave SSH connection needs to be initiated (e.g., by
694 run, rsync, scp). If master SSH support is enabled and a master SSH
695 connection is not active already, start a new one in the background.
696 Also, cleanup any zombie master SSH connections (e.g., dead due to
697 reboot).
Aviv Keshet0749a822013-10-17 09:53:26 -0700698
699 timeout: timeout in seconds (default 5) to wait for master ssh
700 connection to be established. If timeout is reached, a
701 warning message is logged, but no other action is taken.
mblighefccc1b2010-01-11 19:08:42 +0000702 """
703 if not enable_master_ssh:
704 return
705
Simran Basi3b858a22015-03-17 16:23:24 -0700706 # Multiple processes might try in parallel to clean up the old master
707 # ssh connection and create a new one, therefore use a lock to protect
708 # against race conditions.
709 with self._lock:
710 # If a previously started master SSH connection is not running
711 # anymore, it needs to be cleaned up and then restarted.
712 if self.master_ssh_job is not None:
713 socket_path = os.path.join(self.master_ssh_tempdir.name,
714 'socket')
715 if (not os.path.exists(socket_path) or
716 self.master_ssh_job.sp.poll() is not None):
717 logging.info("Master ssh connection to %s is down.",
718 self.hostname)
719 self._cleanup_master_ssh()
mblighefccc1b2010-01-11 19:08:42 +0000720
Simran Basi3b858a22015-03-17 16:23:24 -0700721 # Start a new master SSH connection.
722 if self.master_ssh_job is None:
723 # Create a shared socket in a temp location.
724 self.master_ssh_tempdir = autotemp.tempdir(
725 unique_id='ssh-master')
726 self.master_ssh_option = ("-o ControlPath=%s/socket" %
727 self.master_ssh_tempdir.name)
mblighefccc1b2010-01-11 19:08:42 +0000728
Simran Basi3b858a22015-03-17 16:23:24 -0700729 # Start the master SSH connection in the background.
730 master_cmd = self.ssh_command(
731 options="-N -o ControlMaster=yes")
732 logging.info("Starting master ssh connection '%s'", master_cmd)
733 self.master_ssh_job = utils.BgJob(master_cmd,
734 nickname='master-ssh',
735 no_pipes=True)
736 # To prevent a race between the the master ssh connection
737 # startup and its first attempted use, wait for socket file to
738 # exist before returning.
739 end_time = time.time() + timeout
740 socket_file_path = os.path.join(self.master_ssh_tempdir.name,
741 'socket')
742 while time.time() < end_time:
743 if os.path.exists(socket_file_path):
744 break
745 time.sleep(.2)
746 else:
747 logging.info('Timed out waiting for master-ssh connection '
748 'to be established.')
mbligh0a883702010-04-21 01:58:34 +0000749
750
751 def clear_known_hosts(self):
752 """Clears out the temporary ssh known_hosts file.
753
754 This is useful if the test SSHes to the machine, then reinstalls it,
755 then SSHes to it again. It can be called after the reinstall to
756 reduce the spam in the logs.
757 """
758 logging.info("Clearing known hosts for host '%s', file '%s'.",
Fang Deng3af66202013-08-16 15:19:25 -0700759 self.hostname, self.known_hosts_file)
mbligh0a883702010-04-21 01:58:34 +0000760 # Clear out the file by opening it for writing and then closing.
Fang Deng3af66202013-08-16 15:19:25 -0700761 fh = open(self.known_hosts_file, "w")
mbligh0a883702010-04-21 01:58:34 +0000762 fh.close()
Prashanth B98509c72014-04-04 16:01:34 -0700763
764
765 def collect_logs(self, remote_src_dir, local_dest_dir, ignore_errors=True):
766 """Copy log directories from a host to a local directory.
767
768 @param remote_src_dir: A destination directory on the host.
769 @param local_dest_dir: A path to a local destination directory.
770 If it doesn't exist it will be created.
771 @param ignore_errors: If True, ignore exceptions.
772
773 @raises OSError: If there were problems creating the local_dest_dir and
774 ignore_errors is False.
775 @raises AutoservRunError, AutotestRunError: If something goes wrong
776 while copying the directories and ignore_errors is False.
777 """
778 locally_created_dest = False
779 if (not os.path.exists(local_dest_dir)
780 or not os.path.isdir(local_dest_dir)):
781 try:
782 os.makedirs(local_dest_dir)
783 locally_created_dest = True
784 except OSError as e:
785 logging.warning('Unable to collect logs from host '
786 '%s: %s', self.hostname, e)
787 if not ignore_errors:
788 raise
789 return
790 try:
791 self.get_file(
792 remote_src_dir, local_dest_dir, preserve_symlinks=True)
793 except (error.AutotestRunError, error.AutoservRunError,
794 error.AutoservSSHTimeout) as e:
795 logging.warning('Collection of %s to local dir %s from host %s '
796 'failed: %s', remote_src_dir, local_dest_dir,
797 self.hostname, e)
798 if locally_created_dest:
799 shutil.rmtree(local_dest_dir, ignore_errors=ignore_errors)
800 if not ignore_errors:
801 raise
Cheng-Yi Chianga155e7e2015-08-20 20:42:04 +0800802
803
804 def _create_ssh_tunnel(self, port, local_port):
805 """Create an ssh tunnel from local_port to port.
806
807 @param port: remote port on the host.
808 @param local_port: local forwarding port.
809
810 @return: the tunnel process.
811 """
812 tunnel_options = '-n -N -q -L %d:localhost:%d' % (local_port, port)
813 ssh_cmd = self.make_ssh_command(opts=tunnel_options)
814 tunnel_cmd = '%s %s' % (ssh_cmd, self.hostname)
815 logging.debug('Full tunnel command: %s', tunnel_cmd)
816 tunnel_proc = subprocess.Popen(tunnel_cmd, shell=True, close_fds=True)
817 logging.debug('Started ssh tunnel, local = %d'
818 ' remote = %d, pid = %d',
819 local_port, port, tunnel_proc.pid)
820 return tunnel_proc
Gilad Arnolda76bef02015-09-29 13:55:15 -0700821
822
Roshan Pius58e5dd32015-10-16 15:16:42 -0700823 def rpc_port_forward(self, port, local_port):
824 """
825 Forwards a port securely through a tunnel process from the server
826 to the DUT for RPC server connection.
827
828 @param port: remote port on the DUT.
829 @param local_port: local forwarding port.
830
831 @return: the tunnel process.
832 """
833 return self._create_ssh_tunnel(port, local_port)
834
835
836 def rpc_port_disconnect(self, tunnel_proc, port):
837 """
838 Disconnects a previously forwarded port from the server to the DUT for
839 RPC server connection.
840
841 @param tunnel_proc: the original tunnel process returned from
842 |rpc_port_forward|.
843 @param port: remote port on the DUT.
844
845 """
846 if tunnel_proc.poll() is None:
847 tunnel_proc.terminate()
848 logging.debug('Terminated tunnel, pid %d', tunnel_proc.pid)
849 else:
850 logging.debug('Tunnel pid %d terminated early, status %d',
851 tunnel_proc.pid, tunnel_proc.returncode)
852
853
Gilad Arnolda76bef02015-09-29 13:55:15 -0700854 def get_os_type(self):
855 """Returns the host OS descriptor (to be implemented in subclasses).
856
857 @return A string describing the OS type.
858 """
Simran Basi5ace6f22016-01-06 17:30:44 -0800859 raise NotImplementedError