Merge pull request #3204 from quay/joseph.schorr/QUAY-1030/registry-interface
Start on a basic registry_model interface
This commit is contained in:
		
						commit
						6414e580f6
					
				
					 7 changed files with 150 additions and 56 deletions
				
			
		|  | @ -5,6 +5,8 @@ from app import app | ||||||
| from cachetools import lru_cache | from cachetools import lru_cache | ||||||
| from notifications import spawn_notification | from notifications import spawn_notification | ||||||
| from data import model | from data import model | ||||||
|  | from data.registry_model import registry_model | ||||||
|  | from data.registry_model.datatypes import RepositoryReference | ||||||
| from data.database import UseThenDisconnect | from data.database import UseThenDisconnect | ||||||
| from util.imagetree import ImageTree | from util.imagetree import ImageTree | ||||||
| from util.morecollections import AttrDict | from util.morecollections import AttrDict | ||||||
|  | @ -95,70 +97,24 @@ class BuildJob(object): | ||||||
| 
 | 
 | ||||||
|   def determine_cached_tag(self, base_image_id=None, cache_comments=None): |   def determine_cached_tag(self, base_image_id=None, cache_comments=None): | ||||||
|     """ Returns the tag to pull to prime the cache or None if none. """ |     """ Returns the tag to pull to prime the cache or None if none. """ | ||||||
|     cached_tag = None |  | ||||||
|     if base_image_id and cache_comments: |  | ||||||
|       cached_tag = self._determine_cached_tag_by_comments(base_image_id, cache_comments) |  | ||||||
| 
 |  | ||||||
|     if not cached_tag: |  | ||||||
|     cached_tag = self._determine_cached_tag_by_tag() |     cached_tag = self._determine_cached_tag_by_tag() | ||||||
| 
 |  | ||||||
|     logger.debug('Determined cached tag %s for %s: %s', cached_tag, base_image_id, cache_comments) |     logger.debug('Determined cached tag %s for %s: %s', cached_tag, base_image_id, cache_comments) | ||||||
| 
 |  | ||||||
|     return cached_tag |     return cached_tag | ||||||
| 
 | 
 | ||||||
|   def _determine_cached_tag_by_comments(self, base_image_id, cache_commands): |  | ||||||
|     """ Determines the tag to use for priming the cache for this build job, by matching commands |  | ||||||
|         starting at the given base_image_id. This mimics the Docker cache checking, so it should, |  | ||||||
|         in theory, provide "perfect" caching. |  | ||||||
|     """ |  | ||||||
|     with UseThenDisconnect(app.config): |  | ||||||
|       # Lookup the base image in the repository. If it doesn't exist, nothing more to do. |  | ||||||
|       repo_build = self.repo_build |  | ||||||
|       repo_namespace = repo_build.repository.namespace_user.username |  | ||||||
|       repo_name = repo_build.repository.name |  | ||||||
| 
 |  | ||||||
|       base_image = model.image.get_image(repo_build.repository, base_image_id) |  | ||||||
|       if base_image is None: |  | ||||||
|         return None |  | ||||||
| 
 |  | ||||||
|       # Build an in-memory tree of the full heirarchy of images in the repository. |  | ||||||
|       all_images = model.image.get_repository_images_without_placements(repo_build.repository, |  | ||||||
|                                                                         with_ancestor=base_image) |  | ||||||
| 
 |  | ||||||
|       all_tags = model.tag.list_repository_tags(repo_namespace, repo_name) |  | ||||||
|       tree = ImageTree(all_images, all_tags, base_filter=base_image.id) |  | ||||||
| 
 |  | ||||||
|       # Find a path in the tree, starting at the base image, that matches the cache comments |  | ||||||
|       # or some subset thereof. |  | ||||||
|       def checker(step, image): |  | ||||||
|         if step >= len(cache_commands): |  | ||||||
|           return False |  | ||||||
| 
 |  | ||||||
|         full_command = '["/bin/sh", "-c", "%s"]' % cache_commands[step] |  | ||||||
|         logger.debug('Checking step #%s: %s, %s == %s', step, image.id, image.command, full_command) |  | ||||||
| 
 |  | ||||||
|         return image.command == full_command |  | ||||||
| 
 |  | ||||||
|       path = tree.find_longest_path(base_image.id, checker) |  | ||||||
|       if not path: |  | ||||||
|         return None |  | ||||||
| 
 |  | ||||||
|       # Find any tag associated with the last image in the path. |  | ||||||
|       return tree.tag_containing_image(path[-1]) |  | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
|   def _determine_cached_tag_by_tag(self): |   def _determine_cached_tag_by_tag(self): | ||||||
|     """ Determines the cached tag by looking for one of the tags being built, and seeing if it |     """ Determines the cached tag by looking for one of the tags being built, and seeing if it | ||||||
|         exists in the repository. This is a fallback for when no comment information is available. |         exists in the repository. This is a fallback for when no comment information is available. | ||||||
|     """ |     """ | ||||||
|     with UseThenDisconnect(app.config): |     with UseThenDisconnect(app.config): | ||||||
|       tags = self.build_config.get('docker_tags', ['latest']) |       tags = self.build_config.get('docker_tags', ['latest']) | ||||||
|       repository = self.repo_build.repository |       repository = RepositoryReference.for_repo_obj(self.repo_build.repository) | ||||||
|       existing_tags = model.tag.list_repository_tags(repository.namespace_user.username, |       matching_tag = registry_model.find_matching_tag(repository, tags) | ||||||
|                                                      repository.name) |       if matching_tag is not None: | ||||||
|       cached_tags = set(tags) & set([tag.name for tag in existing_tags]) |         return matching_tag.name | ||||||
|       if cached_tags: | 
 | ||||||
|         return list(cached_tags)[0] |       most_recent_tag = registry_model.get_most_recent_tag(repository) | ||||||
|  |       if most_recent_tag is not None: | ||||||
|  |         return most_recent_tag.name | ||||||
| 
 | 
 | ||||||
|       return None |       return None | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -721,3 +721,30 @@ def change_tag_expiration(tag, expiration_date): | ||||||
|             .execute()) |             .execute()) | ||||||
| 
 | 
 | ||||||
|   return (tag.lifetime_end_ts, result > 0) |   return (tag.lifetime_end_ts, result > 0) | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
|  | def find_matching_tag(repo_id, tag_names): | ||||||
|  |   """ Finds the most recently pushed alive tag in the repository with one of the given names, | ||||||
|  |       if any. | ||||||
|  |   """ | ||||||
|  |   try: | ||||||
|  |     return (_tag_alive(RepositoryTag | ||||||
|  |                        .select() | ||||||
|  |                        .where(RepositoryTag.repository == repo_id, | ||||||
|  |                               RepositoryTag.name << list(tag_names)) | ||||||
|  |                        .order_by(RepositoryTag.lifetime_start_ts.desc())) | ||||||
|  |             .get()) | ||||||
|  |   except RepositoryTag.DoesNotExist: | ||||||
|  |     return None | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
|  | def get_most_recent_tag(repo_id): | ||||||
|  |   """ Returns the most recently pushed alive tag in the repository, or None if none. """ | ||||||
|  |   try: | ||||||
|  |     return (_tag_alive(RepositoryTag | ||||||
|  |                        .select() | ||||||
|  |                        .where(RepositoryTag.repository == repo_id) | ||||||
|  |                        .order_by(RepositoryTag.lifetime_start_ts.desc())) | ||||||
|  |             .get()) | ||||||
|  |   except RepositoryTag.DoesNotExist: | ||||||
|  |     return None | ||||||
|  |  | ||||||
							
								
								
									
										3
									
								
								data/registry_model/__init__.py
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										3
									
								
								data/registry_model/__init__.py
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,3 @@ | ||||||
|  | from data.registry_model.registry_pre_oci_model import pre_oci_model | ||||||
|  | 
 | ||||||
|  | registry_model = pre_oci_model | ||||||
							
								
								
									
										20
									
								
								data/registry_model/datatypes.py
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										20
									
								
								data/registry_model/datatypes.py
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,20 @@ | ||||||
|  | from collections import namedtuple | ||||||
|  | 
 | ||||||
|  | class RepositoryReference(object): | ||||||
|  |   """ RepositoryReference is a reference to a repository, passed to registry interface methods. """ | ||||||
|  |   def __init__(self, repo_id): | ||||||
|  |     self.repo_id = repo_id | ||||||
|  | 
 | ||||||
|  |   @classmethod | ||||||
|  |   def for_repo_obj(cls, repo_obj): | ||||||
|  |     return RepositoryReference(repo_obj.id) | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
|  | class Tag(namedtuple('Tag', ['id', 'name'])): | ||||||
|  |   """ Tag represents a tag in a repository, which points to a manifest or image. """ | ||||||
|  |   @classmethod | ||||||
|  |   def for_repository_tag(cls, repository_tag): | ||||||
|  |     if repository_tag is None: | ||||||
|  |       return None | ||||||
|  | 
 | ||||||
|  |     return Tag(id=repository_tag.id, name=repository_tag.name) | ||||||
							
								
								
									
										21
									
								
								data/registry_model/interface.py
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										21
									
								
								data/registry_model/interface.py
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,21 @@ | ||||||
|  | from abc import ABCMeta, abstractmethod | ||||||
|  | from six import add_metaclass | ||||||
|  | 
 | ||||||
|  | @add_metaclass(ABCMeta) | ||||||
|  | class RegistryDataInterface(object): | ||||||
|  |   """ Interface for code to work with the registry data model. The registry data model consists | ||||||
|  |       of all tables that store registry-specific information, such as Manifests, Blobs, Images, | ||||||
|  |       and Labels. | ||||||
|  |   """ | ||||||
|  | 
 | ||||||
|  |   @abstractmethod | ||||||
|  |   def find_matching_tag(self, repository_ref, tag_names): | ||||||
|  |     """ Finds an alive tag in the repository matching one of the given tag names and returns it | ||||||
|  |         or None if none. | ||||||
|  |     """ | ||||||
|  | 
 | ||||||
|  |   @abstractmethod | ||||||
|  |   def get_most_recent_tag(self, repository_ref): | ||||||
|  |     """ Returns the most recently pushed alive tag in the repository, if any. If none, returns | ||||||
|  |         None. | ||||||
|  |     """ | ||||||
							
								
								
									
										27
									
								
								data/registry_model/registry_pre_oci_model.py
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										27
									
								
								data/registry_model/registry_pre_oci_model.py
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,27 @@ | ||||||
|  | from data import model | ||||||
|  | from data.registry_model.interface import RegistryDataInterface | ||||||
|  | from data.registry_model.datatypes import Tag | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
|  | class PreOCIModel(RegistryDataInterface): | ||||||
|  |   """ | ||||||
|  |   PreOCIModel implements the data model for the registry API using a database schema | ||||||
|  |   before it was changed to support the OCI specification. | ||||||
|  |   """ | ||||||
|  | 
 | ||||||
|  |   def find_matching_tag(self, repository_ref, tag_names): | ||||||
|  |     """ Finds an alive tag in the repository matching one of the given tag names and returns it | ||||||
|  |         or None if none. | ||||||
|  |     """ | ||||||
|  |     found_tag = model.tag.find_matching_tag(repository_ref.repo_id, tag_names) | ||||||
|  |     return Tag.for_repository_tag(found_tag) | ||||||
|  | 
 | ||||||
|  |   def get_most_recent_tag(self, repository_ref): | ||||||
|  |     """ Returns the most recently pushed alive tag in the repository, if any. If none, returns | ||||||
|  |         None. | ||||||
|  |     """ | ||||||
|  |     found_tag = model.tag.get_most_recent_tag(repository_ref.repo_id) | ||||||
|  |     return Tag.for_repository_tag(found_tag) | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
|  | pre_oci_model = PreOCIModel() | ||||||
							
								
								
									
										40
									
								
								data/registry_model/test/test_pre_oci_model.py
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										40
									
								
								data/registry_model/test/test_pre_oci_model.py
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,40 @@ | ||||||
|  | import pytest | ||||||
|  | 
 | ||||||
|  | from data import model | ||||||
|  | from data.registry_model.registry_pre_oci_model import PreOCIModel | ||||||
|  | from data.registry_model.datatypes import RepositoryReference | ||||||
|  | from test.fixtures import * | ||||||
|  | 
 | ||||||
|  | @pytest.fixture() | ||||||
|  | def pre_oci_model(initialized_db): | ||||||
|  |   return PreOCIModel() | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
|  | @pytest.mark.parametrize('names, expected', [ | ||||||
|  |   (['unknown'], None), | ||||||
|  |   (['latest'], 'latest'), | ||||||
|  |   (['latest', 'prod'], 'latest'), | ||||||
|  |   (['foo', 'prod'], 'prod'), | ||||||
|  | ]) | ||||||
|  | def test_find_matching_tag(names, expected, pre_oci_model): | ||||||
|  |   repo = model.repository.get_repository('devtable', 'simple') | ||||||
|  |   repository_ref = RepositoryReference.for_repo_obj(repo) | ||||||
|  |   found = pre_oci_model.find_matching_tag(repository_ref, names) | ||||||
|  |   if expected is None: | ||||||
|  |     assert found is None | ||||||
|  |   else: | ||||||
|  |     assert found.name == expected | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
|  | @pytest.mark.parametrize('repo_namespace, repo_name, expected', [ | ||||||
|  |   ('devtable', 'simple', 'latest'), | ||||||
|  |   ('buynlarge', 'orgrepo', 'latest'), | ||||||
|  | ]) | ||||||
|  | def test_get_most_recent_tag(repo_namespace, repo_name, expected, pre_oci_model): | ||||||
|  |   repo = model.repository.get_repository(repo_namespace, repo_name) | ||||||
|  |   repository_ref = RepositoryReference.for_repo_obj(repo) | ||||||
|  |   found = pre_oci_model.get_most_recent_tag(repository_ref) | ||||||
|  |   if expected is None: | ||||||
|  |     assert found is None | ||||||
|  |   else: | ||||||
|  |     assert found.name == expected | ||||||
		Reference in a new issue