Chris Sosa | 76e44b9 | 2013-01-31 12:11:38 -0800 | [diff] [blame] | 1 | # Copyright (c) 2013 The Chromium OS Authors. All rights reserved. |
Frank Farzan | 37761d1 | 2011-12-01 14:29:08 -0800 | [diff] [blame] | 2 | # Use of this source code is governed by a BSD-style license that can be |
| 3 | # found in the LICENSE file. |
| 4 | |
Prashanth B | a06d2d2 | 2014-03-07 15:35:19 -0800 | [diff] [blame] | 5 | import collections |
Chris Sosa | 9164ca3 | 2012-03-28 11:04:50 -0700 | [diff] [blame] | 6 | import os |
Gilad Arnold | 0b8c3f3 | 2012-09-19 14:35:44 -0700 | [diff] [blame] | 7 | import threading |
Prashanth B | a06d2d2 | 2014-03-07 15:35:19 -0800 | [diff] [blame] | 8 | from datetime import datetime |
Frank Farzan | 37761d1 | 2011-12-01 14:29:08 -0800 | [diff] [blame] | 9 | |
Chris Sosa | 76e44b9 | 2013-01-31 12:11:38 -0800 | [diff] [blame] | 10 | import build_artifact |
Gilad Arnold | c65330c | 2012-09-20 15:17:48 -0700 | [diff] [blame] | 11 | import common_util |
| 12 | import log_util |
Frank Farzan | 37761d1 | 2011-12-01 14:29:08 -0800 | [diff] [blame] | 13 | |
| 14 | |
class DownloaderException(Exception):
  """Aggregate of all exceptions raised during an asynchronous download.

  Exceptions may be raised in an artifact's Process method and saved to files.
  When a caller polls IsStaged to check download progress, the persisted
  exceptions are collected, wrapped in a DownloaderException and raised.

  Attributes:
    exceptions: The exceptions that were raised when downloading artifacts.
  """

  def __init__(self, exceptions):
    """Initializes the instance with the exceptions to aggregate.

    Args:
      exceptions: Exceptions raised when downloading artifacts.
    """
    super(DownloaderException, self).__init__(
        'Exceptions were raised when downloading artifacts.')
    self.exceptions = exceptions

  def __str__(self):
    """Returns the messages of all wrapped exceptions merged into one string."""
    separator = '--------\n'
    return separator.join(str(error) for error in self.exceptions)

  def __repr__(self):
    # The repr is deliberately the same merged message as str().
    return str(self)
| 38 | |
class Downloader(log_util.Loggable):
  """Downloader of images to the devserver.

  Given a URL to a build on the archive server:
    - Caches that build and the given artifacts onto the devserver.
    - May also initiate caching of related artifacts in the background.

  Private class members:
    archive_url: a URL where to download build artifacts from.
    static_dir: local filesystem directory to store all artifacts.
    build_dir: the local filesystem directory to store artifacts for the given
      build defined by the archive_url.
  """

  # This filename must be kept in sync with clean_staged_images.py
  _TIMESTAMP_FILENAME = 'staged.timestamp'

  def __init__(self, static_dir, archive_url):
    """Initializes the downloader for one build.

    Args:
      static_dir: The base static dir under which builds are staged.
      archive_url: a URL at which the build's artifacts are archived.
    """
    super(Downloader, self).__init__()
    self._archive_url = archive_url
    self._static_dir = static_dir
    self._build_dir = Downloader.GetBuildDir(static_dir, archive_url)

  @staticmethod
  def ParseUrl(archive_url):
    """Parses archive_url into rel_path and build.

    Parses archive_url into rel_path and build e.g.
    gs://chromeos-image-archive/{rel_path}/{build}.

    Args:
      archive_url: a URL at which build artifacts are archived.

    Returns:
      A tuple of (build relative path, short build name)
    """
    # The archive_url is of the form gs://server/[some_path/target]/...]/build
    # This function discards 'gs://server/' and extracts the [some_path/target]
    # as rel_path and the build as build.
    # Trailing slashes are dropped first; otherwise the last path component
    # would be empty and the build name would come back as ''.
    sub_url = archive_url.partition('://')[2].rstrip('/')
    split_sub_url = sub_url.split('/')
    rel_path = '/'.join(split_sub_url[1:-1])
    build = split_sub_url[-1]
    return rel_path, build

  @staticmethod
  def GetBuildDir(static_dir, archive_url):
    """Returns the path to where the artifacts will be staged.

    Args:
      static_dir: The base static dir that will be used.
      archive_url: The gs path to the archive url.

    Returns:
      static_dir joined with the rel_path and build parsed from archive_url.
    """
    # Parse archive_url into rel_path (contains the build target) and
    # build e.g. gs://chromeos-image-archive/{rel_path}/{build}.
    rel_path, build = Downloader.ParseUrl(archive_url)
    return os.path.join(static_dir, rel_path, build)

  @staticmethod
  def TouchTimestampForStaged(directory_path):
    """Creates or refreshes the timestamp file inside directory_path.

    Args:
      directory_path: directory used to stage the image.
    """
    file_name = os.path.join(directory_path, Downloader._TIMESTAMP_FILENAME)
    # Easiest python version of |touch file_name|. open() is used rather than
    # the file() builtin because file() only exists on Python 2.
    with open(file_name, 'a'):
      os.utime(file_name, None)

  @staticmethod
  def _TryRemoveStageDir(directory_path):
    """If download failed, try to remove the stage dir.

    If the download attempt failed (ArtifactDownloadError) and
    staged.timestamp is the only file in that directory, the build could be
    non-existing, so the timestamp file and the directory are removed.

    Args:
      directory_path: directory used to stage the image.
    """
    file_name = os.path.join(directory_path, Downloader._TIMESTAMP_FILENAME)
    if os.path.exists(file_name) and len(os.listdir(directory_path)) == 1:
      os.remove(file_name)
      os.rmdir(directory_path)

  def ListBuildDir(self):
    """List the files in the build directory.

    Only lists files a single level into the build directory. Includes
    timestamp information in the listing.

    Returns:
      A string with information about the files in the build directory.
      None if the build directory doesn't exist.

    Raises:
      build_artifact.ArtifactDownloadError: If the build_dir path exists
        but is not a directory.
    """
    if not os.path.exists(self._build_dir):
      return None
    if not os.path.isdir(self._build_dir):
      raise build_artifact.ArtifactDownloadError(
          'Artifacts %s improperly staged to build_dir path %s. The path is '
          'not a directory.' % (self._archive_url, self._build_dir))

    output_format = ('Name: %(name)s Accessed: %(accessed)s '
                     'Modified: %(modified)s Size: %(size)s bytes.\n')

    # Collect the header and one line per entry, then join once instead of
    # growing a string with += on every iteration.
    listing = ['Listing contents of :%s \n' % self._build_dir]
    for file_name in os.listdir(self._build_dir):
      file_path = os.path.join(self._build_dir, file_name)
      file_info = os.stat(file_path)
      listing.append(output_format % {
          'name': file_path,
          'accessed': datetime.fromtimestamp(file_info.st_atime),
          'modified': datetime.fromtimestamp(file_info.st_mtime),
          'size': file_info.st_size,
      })
    return ''.join(listing)

  def Download(self, artifacts, files, is_async=False, **kwargs):
    """Downloads and caches the |artifacts|.

    Downloads and caches the |artifacts|. Returns once these
    are present on the devserver. A call to this will attempt to cache
    non-specified artifacts in the background following the principle of
    spatial locality.

    Args:
      artifacts: A list of artifact names that correspond to
        artifacts defined in artifact_info.py to stage.
      files: A list of filenames to stage from an archive_url.
      is_async: If True, return without waiting for download to complete.
      **kwargs: Only the legacy keyword 'async' is accepted, as an alias of
        is_async. 'async' is a reserved word from Python 3.7 on and can no
        longer be a parameter name, so it is taken through **kwargs to keep
        existing keyword callers working.

    Raises:
      build_artifact.ArtifactDownloadError: If failed to download the artifact.
      TypeError: If an unexpected keyword argument is passed.
    """
    is_async = kwargs.pop('async', is_async)
    if kwargs:
      raise TypeError('Download() got unexpected keyword argument(s): %s' %
                      ', '.join(sorted(kwargs)))

    common_util.MkDirP(self._build_dir)

    # We are doing some work on this build -- let's touch it to indicate that
    # we shouldn't be cleaning it up anytime soon.
    Downloader.TouchTimestampForStaged(self._build_dir)

    # Create factory to create build_artifacts from artifact names.
    build = self.ParseUrl(self._archive_url)[1]
    factory = build_artifact.ArtifactFactory(
        self._build_dir, self._archive_url, artifacts, files,
        build)
    background_artifacts = factory.OptionalArtifacts()
    if background_artifacts:
      self._DownloadArtifactsInBackground(background_artifacts)

    required_artifacts = factory.RequiredArtifacts()
    str_repr = [str(a) for a in required_artifacts]
    self._Log('Downloading artifacts %s.', ' '.join(str_repr))

    if is_async:
      self._DownloadArtifactsInBackground(required_artifacts)
    else:
      # The synchronous path does not block waiting for a missing artifact.
      self._DownloadArtifactsSerially(required_artifacts, no_wait=True)

  def IsStaged(self, artifacts, files):
    """Check if all artifacts have been downloaded.

    Args:
      artifacts: A list of artifact names that correspond to
        artifacts defined in artifact_info.py to stage.
      files: A list of filenames to stage from an archive_url.

    Returns:
      True if all artifacts are staged.

    Raises:
      DownloaderException: Wrapping every exception reported by a required
        artifact's GetException().
    """
    # Create factory to create build_artifacts from artifact names.
    build = self.ParseUrl(self._archive_url)[1]
    factory = build_artifact.ArtifactFactory(
        self._build_dir, self._archive_url, artifacts, files, build)
    required_artifacts = factory.RequiredArtifacts()

    # Query each artifact once, so the value that is tested is the same value
    # that is collected.
    exceptions = []
    for artifact in required_artifacts:
      exception = artifact.GetException()
      if exception:
        exceptions.append(exception)
    if exceptions:
      raise DownloaderException(exceptions)

    return all([artifact.ArtifactStaged() for artifact in required_artifacts])

  def _DownloadArtifactsSerially(self, artifacts, no_wait):
    """Simple function to download all the given artifacts serially.

    Args:
      artifacts: A list of build_artifact.BuildArtifact instances to
        download.
      no_wait: If True, don't block waiting for artifact to exist if we
        fail to immediately find it.

    Raises:
      build_artifact.ArtifactDownloadError: If we failed to download the
        artifact.
    """
    try:
      for artifact in artifacts:
        artifact.Process(no_wait)
    except build_artifact.ArtifactDownloadError:
      # Remove the stage dir if it holds nothing but the timestamp file, then
      # let the caller see the original error.
      Downloader._TryRemoveStageDir(self._build_dir)
      raise

  def _DownloadArtifactsInBackground(self, artifacts):
    """Downloads |artifacts| in the background.

    Downloads |artifacts| in the background. As these are backgrounded
    artifacts, they are done best effort and may not exist.

    Args:
      artifacts: List of build_artifact.BuildArtifact instances to download.
    """
    self._Log('Invoking background download of artifacts for %r', artifacts)
    # The background thread runs the serial downloader with no_wait=False.
    thread = threading.Thread(target=self._DownloadArtifactsSerially,
                              args=(artifacts, False))
    thread.start()