diff options
Diffstat (limited to 'hooks.py')
| -rw-r--r-- | hooks.py | 431 |
1 files changed, 431 insertions, 0 deletions
diff --git a/hooks.py b/hooks.py new file mode 100644 index 00000000..177bc88b --- /dev/null +++ b/hooks.py | |||
| @@ -0,0 +1,431 @@ | |||
| 1 | # -*- coding:utf-8 -*- | ||
| 2 | # | ||
| 3 | # Copyright (C) 2008 The Android Open Source Project | ||
| 4 | # | ||
| 5 | # Licensed under the Apache License, Version 2.0 (the "License"); | ||
| 6 | # you may not use this file except in compliance with the License. | ||
| 7 | # You may obtain a copy of the License at | ||
| 8 | # | ||
| 9 | # http://www.apache.org/licenses/LICENSE-2.0 | ||
| 10 | # | ||
| 11 | # Unless required by applicable law or agreed to in writing, software | ||
| 12 | # distributed under the License is distributed on an "AS IS" BASIS, | ||
| 13 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
| 14 | # See the License for the specific language governing permissions and | ||
| 15 | # limitations under the License. | ||
| 16 | |||
| 17 | import json | ||
| 18 | import os | ||
| 19 | import re | ||
| 20 | import sys | ||
| 21 | import traceback | ||
| 22 | |||
| 23 | from error import HookError | ||
| 24 | from git_refs import HEAD | ||
| 25 | |||
| 26 | from pyversion import is_python3 | ||
| 27 | if is_python3(): | ||
| 28 | import urllib.parse | ||
| 29 | else: | ||
| 30 | import imp | ||
| 31 | import urlparse | ||
| 32 | urllib = imp.new_module('urllib') | ||
| 33 | urllib.parse = urlparse | ||
| 34 | input = raw_input # noqa: F821 | ||
| 35 | |||
| 36 | class RepoHook(object): | ||
| 37 | """A RepoHook contains information about a script to run as a hook. | ||
| 38 | |||
| 39 | Hooks are used to run a python script before running an upload (for instance, | ||
| 40 | to run presubmit checks). Eventually, we may have hooks for other actions. | ||
| 41 | |||
| 42 | This shouldn't be confused with files in the 'repo/hooks' directory. Those | ||
| 43 | files are copied into each '.git/hooks' folder for each project. Repo-level | ||
| 44 | hooks are associated instead with repo actions. | ||
| 45 | |||
| 46 | Hooks are always python. When a hook is run, we will load the hook into the | ||
| 47 | interpreter and execute its main() function. | ||
| 48 | """ | ||
| 49 | |||
| 50 | def __init__(self, | ||
| 51 | hook_type, | ||
| 52 | hooks_project, | ||
| 53 | topdir, | ||
| 54 | manifest_url, | ||
| 55 | abort_if_user_denies=False): | ||
| 56 | """RepoHook constructor. | ||
| 57 | |||
| 58 | Params: | ||
| 59 | hook_type: A string representing the type of hook. This is also used | ||
| 60 | to figure out the name of the file containing the hook. For | ||
| 61 | example: 'pre-upload'. | ||
| 62 | hooks_project: The project containing the repo hooks. If you have a | ||
| 63 | manifest, this is manifest.repo_hooks_project. OK if this is None, | ||
| 64 | which will make the hook a no-op. | ||
| 65 | topdir: Repo's top directory (the one containing the .repo directory). | ||
| 66 | Scripts will run with CWD as this directory. If you have a manifest, | ||
| 67 | this is manifest.topdir | ||
| 68 | manifest_url: The URL to the manifest git repo. | ||
| 69 | abort_if_user_denies: If True, we'll throw a HookError() if the user | ||
| 70 | doesn't allow us to run the hook. | ||
| 71 | """ | ||
| 72 | self._hook_type = hook_type | ||
| 73 | self._hooks_project = hooks_project | ||
| 74 | self._manifest_url = manifest_url | ||
| 75 | self._topdir = topdir | ||
| 76 | self._abort_if_user_denies = abort_if_user_denies | ||
| 77 | |||
| 78 | # Store the full path to the script for convenience. | ||
| 79 | if self._hooks_project: | ||
| 80 | self._script_fullpath = os.path.join(self._hooks_project.worktree, | ||
| 81 | self._hook_type + '.py') | ||
| 82 | else: | ||
| 83 | self._script_fullpath = None | ||
| 84 | |||
| 85 | def _GetHash(self): | ||
| 86 | """Return a hash of the contents of the hooks directory. | ||
| 87 | |||
| 88 | We'll just use git to do this. This hash has the property that if anything | ||
| 89 | changes in the directory we will return a different has. | ||
| 90 | |||
| 91 | SECURITY CONSIDERATION: | ||
| 92 | This hash only represents the contents of files in the hook directory, not | ||
| 93 | any other files imported or called by hooks. Changes to imported files | ||
| 94 | can change the script behavior without affecting the hash. | ||
| 95 | |||
| 96 | Returns: | ||
| 97 | A string representing the hash. This will always be ASCII so that it can | ||
| 98 | be printed to the user easily. | ||
| 99 | """ | ||
| 100 | assert self._hooks_project, "Must have hooks to calculate their hash." | ||
| 101 | |||
| 102 | # We will use the work_git object rather than just calling GetRevisionId(). | ||
| 103 | # That gives us a hash of the latest checked in version of the files that | ||
| 104 | # the user will actually be executing. Specifically, GetRevisionId() | ||
| 105 | # doesn't appear to change even if a user checks out a different version | ||
| 106 | # of the hooks repo (via git checkout) nor if a user commits their own revs. | ||
| 107 | # | ||
| 108 | # NOTE: Local (non-committed) changes will not be factored into this hash. | ||
| 109 | # I think this is OK, since we're really only worried about warning the user | ||
| 110 | # about upstream changes. | ||
| 111 | return self._hooks_project.work_git.rev_parse('HEAD') | ||
| 112 | |||
| 113 | def _GetMustVerb(self): | ||
| 114 | """Return 'must' if the hook is required; 'should' if not.""" | ||
| 115 | if self._abort_if_user_denies: | ||
| 116 | return 'must' | ||
| 117 | else: | ||
| 118 | return 'should' | ||
| 119 | |||
| 120 | def _CheckForHookApproval(self): | ||
| 121 | """Check to see whether this hook has been approved. | ||
| 122 | |||
| 123 | We'll accept approval of manifest URLs if they're using secure transports. | ||
| 124 | This way the user can say they trust the manifest hoster. For insecure | ||
| 125 | hosts, we fall back to checking the hash of the hooks repo. | ||
| 126 | |||
| 127 | Note that we ask permission for each individual hook even though we use | ||
| 128 | the hash of all hooks when detecting changes. We'd like the user to be | ||
| 129 | able to approve / deny each hook individually. We only use the hash of all | ||
| 130 | hooks because there is no other easy way to detect changes to local imports. | ||
| 131 | |||
| 132 | Returns: | ||
| 133 | True if this hook is approved to run; False otherwise. | ||
| 134 | |||
| 135 | Raises: | ||
| 136 | HookError: Raised if the user doesn't approve and abort_if_user_denies | ||
| 137 | was passed to the consturctor. | ||
| 138 | """ | ||
| 139 | if self._ManifestUrlHasSecureScheme(): | ||
| 140 | return self._CheckForHookApprovalManifest() | ||
| 141 | else: | ||
| 142 | return self._CheckForHookApprovalHash() | ||
| 143 | |||
| 144 | def _CheckForHookApprovalHelper(self, subkey, new_val, main_prompt, | ||
| 145 | changed_prompt): | ||
| 146 | """Check for approval for a particular attribute and hook. | ||
| 147 | |||
| 148 | Args: | ||
| 149 | subkey: The git config key under [repo.hooks.<hook_type>] to store the | ||
| 150 | last approved string. | ||
| 151 | new_val: The new value to compare against the last approved one. | ||
| 152 | main_prompt: Message to display to the user to ask for approval. | ||
| 153 | changed_prompt: Message explaining why we're re-asking for approval. | ||
| 154 | |||
| 155 | Returns: | ||
| 156 | True if this hook is approved to run; False otherwise. | ||
| 157 | |||
| 158 | Raises: | ||
| 159 | HookError: Raised if the user doesn't approve and abort_if_user_denies | ||
| 160 | was passed to the consturctor. | ||
| 161 | """ | ||
| 162 | hooks_config = self._hooks_project.config | ||
| 163 | git_approval_key = 'repo.hooks.%s.%s' % (self._hook_type, subkey) | ||
| 164 | |||
| 165 | # Get the last value that the user approved for this hook; may be None. | ||
| 166 | old_val = hooks_config.GetString(git_approval_key) | ||
| 167 | |||
| 168 | if old_val is not None: | ||
| 169 | # User previously approved hook and asked not to be prompted again. | ||
| 170 | if new_val == old_val: | ||
| 171 | # Approval matched. We're done. | ||
| 172 | return True | ||
| 173 | else: | ||
| 174 | # Give the user a reason why we're prompting, since they last told | ||
| 175 | # us to "never ask again". | ||
| 176 | prompt = 'WARNING: %s\n\n' % (changed_prompt,) | ||
| 177 | else: | ||
| 178 | prompt = '' | ||
| 179 | |||
| 180 | # Prompt the user if we're not on a tty; on a tty we'll assume "no". | ||
| 181 | if sys.stdout.isatty(): | ||
| 182 | prompt += main_prompt + ' (yes/always/NO)? ' | ||
| 183 | response = input(prompt).lower() | ||
| 184 | print() | ||
| 185 | |||
| 186 | # User is doing a one-time approval. | ||
| 187 | if response in ('y', 'yes'): | ||
| 188 | return True | ||
| 189 | elif response == 'always': | ||
| 190 | hooks_config.SetString(git_approval_key, new_val) | ||
| 191 | return True | ||
| 192 | |||
| 193 | # For anything else, we'll assume no approval. | ||
| 194 | if self._abort_if_user_denies: | ||
| 195 | raise HookError('You must allow the %s hook or use --no-verify.' % | ||
| 196 | self._hook_type) | ||
| 197 | |||
| 198 | return False | ||
| 199 | |||
| 200 | def _ManifestUrlHasSecureScheme(self): | ||
| 201 | """Check if the URI for the manifest is a secure transport.""" | ||
| 202 | secure_schemes = ('file', 'https', 'ssh', 'persistent-https', 'sso', 'rpc') | ||
| 203 | parse_results = urllib.parse.urlparse(self._manifest_url) | ||
| 204 | return parse_results.scheme in secure_schemes | ||
| 205 | |||
| 206 | def _CheckForHookApprovalManifest(self): | ||
| 207 | """Check whether the user has approved this manifest host. | ||
| 208 | |||
| 209 | Returns: | ||
| 210 | True if this hook is approved to run; False otherwise. | ||
| 211 | """ | ||
| 212 | return self._CheckForHookApprovalHelper( | ||
| 213 | 'approvedmanifest', | ||
| 214 | self._manifest_url, | ||
| 215 | 'Run hook scripts from %s' % (self._manifest_url,), | ||
| 216 | 'Manifest URL has changed since %s was allowed.' % (self._hook_type,)) | ||
| 217 | |||
| 218 | def _CheckForHookApprovalHash(self): | ||
| 219 | """Check whether the user has approved the hooks repo. | ||
| 220 | |||
| 221 | Returns: | ||
| 222 | True if this hook is approved to run; False otherwise. | ||
| 223 | """ | ||
| 224 | prompt = ('Repo %s run the script:\n' | ||
| 225 | ' %s\n' | ||
| 226 | '\n' | ||
| 227 | 'Do you want to allow this script to run') | ||
| 228 | return self._CheckForHookApprovalHelper( | ||
| 229 | 'approvedhash', | ||
| 230 | self._GetHash(), | ||
| 231 | prompt % (self._GetMustVerb(), self._script_fullpath), | ||
| 232 | 'Scripts have changed since %s was allowed.' % (self._hook_type,)) | ||
| 233 | |||
| 234 | @staticmethod | ||
| 235 | def _ExtractInterpFromShebang(data): | ||
| 236 | """Extract the interpreter used in the shebang. | ||
| 237 | |||
| 238 | Try to locate the interpreter the script is using (ignoring `env`). | ||
| 239 | |||
| 240 | Args: | ||
| 241 | data: The file content of the script. | ||
| 242 | |||
| 243 | Returns: | ||
| 244 | The basename of the main script interpreter, or None if a shebang is not | ||
| 245 | used or could not be parsed out. | ||
| 246 | """ | ||
| 247 | firstline = data.splitlines()[:1] | ||
| 248 | if not firstline: | ||
| 249 | return None | ||
| 250 | |||
| 251 | # The format here can be tricky. | ||
| 252 | shebang = firstline[0].strip() | ||
| 253 | m = re.match(r'^#!\s*([^\s]+)(?:\s+([^\s]+))?', shebang) | ||
| 254 | if not m: | ||
| 255 | return None | ||
| 256 | |||
| 257 | # If the using `env`, find the target program. | ||
| 258 | interp = m.group(1) | ||
| 259 | if os.path.basename(interp) == 'env': | ||
| 260 | interp = m.group(2) | ||
| 261 | |||
| 262 | return interp | ||
| 263 | |||
| 264 | def _ExecuteHookViaReexec(self, interp, context, **kwargs): | ||
| 265 | """Execute the hook script through |interp|. | ||
| 266 | |||
| 267 | Note: Support for this feature should be dropped ~Jun 2021. | ||
| 268 | |||
| 269 | Args: | ||
| 270 | interp: The Python program to run. | ||
| 271 | context: Basic Python context to execute the hook inside. | ||
| 272 | kwargs: Arbitrary arguments to pass to the hook script. | ||
| 273 | |||
| 274 | Raises: | ||
| 275 | HookError: When the hooks failed for any reason. | ||
| 276 | """ | ||
| 277 | # This logic needs to be kept in sync with _ExecuteHookViaImport below. | ||
| 278 | script = """ | ||
| 279 | import json, os, sys | ||
| 280 | path = '''%(path)s''' | ||
| 281 | kwargs = json.loads('''%(kwargs)s''') | ||
| 282 | context = json.loads('''%(context)s''') | ||
| 283 | sys.path.insert(0, os.path.dirname(path)) | ||
| 284 | data = open(path).read() | ||
| 285 | exec(compile(data, path, 'exec'), context) | ||
| 286 | context['main'](**kwargs) | ||
| 287 | """ % { | ||
| 288 | 'path': self._script_fullpath, | ||
| 289 | 'kwargs': json.dumps(kwargs), | ||
| 290 | 'context': json.dumps(context), | ||
| 291 | } | ||
| 292 | |||
| 293 | # We pass the script via stdin to avoid OS argv limits. It also makes | ||
| 294 | # unhandled exception tracebacks less verbose/confusing for users. | ||
| 295 | cmd = [interp, '-c', 'import sys; exec(sys.stdin.read())'] | ||
| 296 | proc = subprocess.Popen(cmd, stdin=subprocess.PIPE) | ||
| 297 | proc.communicate(input=script.encode('utf-8')) | ||
| 298 | if proc.returncode: | ||
| 299 | raise HookError('Failed to run %s hook.' % (self._hook_type,)) | ||
| 300 | |||
| 301 | def _ExecuteHookViaImport(self, data, context, **kwargs): | ||
| 302 | """Execute the hook code in |data| directly. | ||
| 303 | |||
| 304 | Args: | ||
| 305 | data: The code of the hook to execute. | ||
| 306 | context: Basic Python context to execute the hook inside. | ||
| 307 | kwargs: Arbitrary arguments to pass to the hook script. | ||
| 308 | |||
| 309 | Raises: | ||
| 310 | HookError: When the hooks failed for any reason. | ||
| 311 | """ | ||
| 312 | # Exec, storing global context in the context dict. We catch exceptions | ||
| 313 | # and convert to a HookError w/ just the failing traceback. | ||
| 314 | try: | ||
| 315 | exec(compile(data, self._script_fullpath, 'exec'), context) | ||
| 316 | except Exception: | ||
| 317 | raise HookError('%s\nFailed to import %s hook; see traceback above.' % | ||
| 318 | (traceback.format_exc(), self._hook_type)) | ||
| 319 | |||
| 320 | # Running the script should have defined a main() function. | ||
| 321 | if 'main' not in context: | ||
| 322 | raise HookError('Missing main() in: "%s"' % self._script_fullpath) | ||
| 323 | |||
| 324 | # Call the main function in the hook. If the hook should cause the | ||
| 325 | # build to fail, it will raise an Exception. We'll catch that convert | ||
| 326 | # to a HookError w/ just the failing traceback. | ||
| 327 | try: | ||
| 328 | context['main'](**kwargs) | ||
| 329 | except Exception: | ||
| 330 | raise HookError('%s\nFailed to run main() for %s hook; see traceback ' | ||
| 331 | 'above.' % (traceback.format_exc(), self._hook_type)) | ||
| 332 | |||
| 333 | def _ExecuteHook(self, **kwargs): | ||
| 334 | """Actually execute the given hook. | ||
| 335 | |||
| 336 | This will run the hook's 'main' function in our python interpreter. | ||
| 337 | |||
| 338 | Args: | ||
| 339 | kwargs: Keyword arguments to pass to the hook. These are often specific | ||
| 340 | to the hook type. For instance, pre-upload hooks will contain | ||
| 341 | a project_list. | ||
| 342 | """ | ||
| 343 | # Keep sys.path and CWD stashed away so that we can always restore them | ||
| 344 | # upon function exit. | ||
| 345 | orig_path = os.getcwd() | ||
| 346 | orig_syspath = sys.path | ||
| 347 | |||
| 348 | try: | ||
| 349 | # Always run hooks with CWD as topdir. | ||
| 350 | os.chdir(self._topdir) | ||
| 351 | |||
| 352 | # Put the hook dir as the first item of sys.path so hooks can do | ||
| 353 | # relative imports. We want to replace the repo dir as [0] so | ||
| 354 | # hooks can't import repo files. | ||
| 355 | sys.path = [os.path.dirname(self._script_fullpath)] + sys.path[1:] | ||
| 356 | |||
| 357 | # Initial global context for the hook to run within. | ||
| 358 | context = {'__file__': self._script_fullpath} | ||
| 359 | |||
| 360 | # Add 'hook_should_take_kwargs' to the arguments to be passed to main. | ||
| 361 | # We don't actually want hooks to define their main with this argument-- | ||
| 362 | # it's there to remind them that their hook should always take **kwargs. | ||
| 363 | # For instance, a pre-upload hook should be defined like: | ||
| 364 | # def main(project_list, **kwargs): | ||
| 365 | # | ||
| 366 | # This allows us to later expand the API without breaking old hooks. | ||
| 367 | kwargs = kwargs.copy() | ||
| 368 | kwargs['hook_should_take_kwargs'] = True | ||
| 369 | |||
| 370 | # See what version of python the hook has been written against. | ||
| 371 | data = open(self._script_fullpath).read() | ||
| 372 | interp = self._ExtractInterpFromShebang(data) | ||
| 373 | reexec = False | ||
| 374 | if interp: | ||
| 375 | prog = os.path.basename(interp) | ||
| 376 | if prog.startswith('python2') and sys.version_info.major != 2: | ||
| 377 | reexec = True | ||
| 378 | elif prog.startswith('python3') and sys.version_info.major == 2: | ||
| 379 | reexec = True | ||
| 380 | |||
| 381 | # Attempt to execute the hooks through the requested version of Python. | ||
| 382 | if reexec: | ||
| 383 | try: | ||
| 384 | self._ExecuteHookViaReexec(interp, context, **kwargs) | ||
| 385 | except OSError as e: | ||
| 386 | if e.errno == errno.ENOENT: | ||
| 387 | # We couldn't find the interpreter, so fallback to importing. | ||
| 388 | reexec = False | ||
| 389 | else: | ||
| 390 | raise | ||
| 391 | |||
| 392 | # Run the hook by importing directly. | ||
| 393 | if not reexec: | ||
| 394 | self._ExecuteHookViaImport(data, context, **kwargs) | ||
| 395 | finally: | ||
| 396 | # Restore sys.path and CWD. | ||
| 397 | sys.path = orig_syspath | ||
| 398 | os.chdir(orig_path) | ||
| 399 | |||
| 400 | def Run(self, user_allows_all_hooks, **kwargs): | ||
| 401 | """Run the hook. | ||
| 402 | |||
| 403 | If the hook doesn't exist (because there is no hooks project or because | ||
| 404 | this particular hook is not enabled), this is a no-op. | ||
| 405 | |||
| 406 | Args: | ||
| 407 | user_allows_all_hooks: If True, we will never prompt about running the | ||
| 408 | hook--we'll just assume it's OK to run it. | ||
| 409 | kwargs: Keyword arguments to pass to the hook. These are often specific | ||
| 410 | to the hook type. For instance, pre-upload hooks will contain | ||
| 411 | a project_list. | ||
| 412 | |||
| 413 | Raises: | ||
| 414 | HookError: If there was a problem finding the hook or the user declined | ||
| 415 | to run a required hook (from _CheckForHookApproval). | ||
| 416 | """ | ||
| 417 | # No-op if there is no hooks project or if hook is disabled. | ||
| 418 | if ((not self._hooks_project) or (self._hook_type not in | ||
| 419 | self._hooks_project.enabled_repo_hooks)): | ||
| 420 | return | ||
| 421 | |||
| 422 | # Bail with a nice error if we can't find the hook. | ||
| 423 | if not os.path.isfile(self._script_fullpath): | ||
| 424 | raise HookError('Couldn\'t find repo hook: "%s"' % self._script_fullpath) | ||
| 425 | |||
| 426 | # Make sure the user is OK with running the hook. | ||
| 427 | if (not user_allows_all_hooks) and (not self._CheckForHookApproval()): | ||
| 428 | return | ||
| 429 | |||
| 430 | # Run the hook with the same version of python we're using. | ||
| 431 | self._ExecuteHook(**kwargs) | ||
