Benjamin Schubert pushed to branch bschubert/fix-atomic-move-git-repo at BuildStream / buildstream
Commits:
-
fe33e328
by James Ennis at 2018-11-08T17:54:18Z
-
09faf002
by James Ennis at 2018-11-08T17:54:18Z
-
d153453c
by Javier Jardón at 2018-11-08T18:22:54Z
-
1557b491
by Benjamin Schubert at 2018-11-09T11:21:18Z
-
942a4329
by Benjamin Schubert at 2018-11-09T11:21:18Z
7 changed files:
- buildstream/_artifactcache/artifactcache.py
- buildstream/plugins/sources/git.py
- buildstream/utils.py
- doc/source/using_config.rst
- tests/frontend/buildtrack.py
- tests/utils/misc.py
- + tests/utils/movedirectory.py
Changes:
| ... | ... | @@ -937,15 +937,22 @@ class ArtifactCache(): |
| 937 | 937 |
"Invalid cache quota ({}): ".format(utils._pretty_size(cache_quota)) +
|
| 938 | 938 |
"BuildStream requires a minimum cache quota of 2G.")
|
| 939 | 939 |
elif cache_quota > cache_size + available_space: # Check maximum
|
| 940 |
+ if '%' in self.context.config_cache_quota:
|
|
| 941 |
+ available = (available_space / (stat.f_blocks * stat.f_bsize)) * 100
|
|
| 942 |
+ available = '{}% of total disk space'.format(round(available, 1))
|
|
| 943 |
+ else:
|
|
| 944 |
+ available = utils._pretty_size(available_space)
|
|
| 945 |
+ |
|
| 940 | 946 |
raise LoadError(LoadErrorReason.INVALID_DATA,
|
| 941 | 947 |
("Your system does not have enough available " +
|
| 942 | 948 |
"space to support the cache quota specified.\n" +
|
| 943 |
- "You currently have:\n" +
|
|
| 944 |
- "- {used} of cache in use at {local_cache_path}\n" +
|
|
| 945 |
- "- {available} of available system storage").format(
|
|
| 946 |
- used=utils._pretty_size(cache_size),
|
|
| 947 |
- local_cache_path=self.context.artifactdir,
|
|
| 948 |
- available=utils._pretty_size(available_space)))
|
|
| 949 |
+ "\nYou have specified a quota of {quota} total disk space.\n" +
|
|
| 950 |
+ "- The filesystem containing {local_cache_path} only " +
|
|
| 951 |
+ "has: {available_size} available.")
|
|
| 952 |
+ .format(
|
|
| 953 |
+ quota=self.context.config_cache_quota,
|
|
| 954 |
+ local_cache_path=self.context.artifactdir,
|
|
| 955 |
+ available_size=available))
|
|
| 949 | 956 |
|
| 950 | 957 |
# Place a slight headroom (2e9 (2GB) on the cache_quota) into
|
| 951 | 958 |
# cache_quota to try and avoid exceptions.
|
| ... | ... | @@ -97,6 +97,7 @@ from configparser import RawConfigParser |
| 97 | 97 |
from buildstream import Source, SourceError, Consistency, SourceFetcher
|
| 98 | 98 |
from buildstream import utils
|
| 99 | 99 |
from buildstream.plugin import CoreWarnings
|
| 100 |
+from buildstream.utils import move_atomic, DirectoryExistsError
|
|
| 100 | 101 |
|
| 101 | 102 |
GIT_MODULES = '.gitmodules'
|
| 102 | 103 |
|
| ... | ... | @@ -141,21 +142,16 @@ class GitMirror(SourceFetcher): |
| 141 | 142 |
fail="Failed to clone git repository {}".format(url),
|
| 142 | 143 |
fail_temporarily=True)
|
| 143 | 144 |
|
| 144 |
- # Attempt atomic rename into destination, this will fail if
|
|
| 145 |
- # another process beat us to the punch
|
|
| 146 | 145 |
try:
|
| 147 |
- os.rename(tmpdir, self.mirror)
|
|
| 148 |
- except OSError as e:
|
|
| 149 |
- |
|
| 150 |
- # When renaming and the destination repo already exists, os.rename()
|
|
| 151 |
- # will fail with ENOTEMPTY, since an empty directory will be silently
|
|
| 152 |
- # replaced
|
|
| 153 |
- if e.errno == errno.ENOTEMPTY:
|
|
| 154 |
- self.source.status("{}: Discarding duplicate clone of {}"
|
|
| 155 |
- .format(self.source, url))
|
|
| 156 |
- else:
|
|
| 157 |
- raise SourceError("{}: Failed to move cloned git repository {} from '{}' to '{}': {}"
|
|
| 158 |
- .format(self.source, url, tmpdir, self.mirror, e)) from e
|
|
| 146 |
+ move_atomic(tmpdir, self.mirror)
|
|
| 147 |
+ except DirectoryExistsError:
|
|
| 148 |
+ # Another process was quicker to download this repository.
|
|
| 149 |
+ # Let's discard our own
|
|
| 150 |
+ self.source.status("{}: Discarding duplicate clone of {}"
|
|
| 151 |
+ .format(self.source, url))
|
|
| 152 |
+ except OSError as e:
|
|
| 153 |
+ raise SourceError("{}: Failed to move cloned git repository {} from '{}' to '{}': {}"
|
|
| 154 |
+ .format(self.source, url, tmpdir, self.mirror, e)) from e
|
|
| 159 | 155 |
|
| 160 | 156 |
def _fetch(self, alias_override=None):
|
| 161 | 157 |
url = self.source.translate_url(self.url,
|
| ... | ... | @@ -72,6 +72,11 @@ class ProgramNotFoundError(BstError): |
| 72 | 72 |
super().__init__(message, domain=ErrorDomain.PROG_NOT_FOUND, reason=reason)
|
| 73 | 73 |
|
| 74 | 74 |
|
| 75 |
+class DirectoryExistsError(OSError):
|
|
| 76 |
+ """Raised when an `os.rename` is attempted but the destination is an existing, non-empty directory.
|
|
| 77 |
+ """
|
|
| 78 |
+ |
|
| 79 |
+ |
|
| 75 | 80 |
class FileListResult():
|
| 76 | 81 |
"""An object which stores the result of one of the operations
|
| 77 | 82 |
which run on a list of files.
|
| ... | ... | @@ -500,6 +505,32 @@ def get_bst_version(): |
| 500 | 505 |
.format(__version__))
|
| 501 | 506 |
|
| 502 | 507 |
|
| 508 |
+def move_atomic(source, destination, ensure_parents=True):
|
|
| 509 |
+ """Move the source to the destination using atomic primitives.
|
|
| 510 |
+ |
|
| 511 |
+ This uses `os.rename` to move a file or directory to a new destination.
|
|
| 512 |
+ It wraps some of the `OSError` exceptions raised by `os.rename` so that they can be handled consistently.
|
|
| 513 |
+ |
|
| 514 |
+ The main reason for this to exist is that rename can throw different errors
|
|
| 515 |
+ for the same symptom (https://www.unix.com/man-page/POSIX/3posix/rename/).
|
|
| 516 |
+ |
|
| 517 |
+ We are especially interested here in the case when the destination already
|
|
| 518 |
+ exists. In this case, either EEXIST or ENOTEMPTY is thrown.
|
|
| 519 |
+ |
|
| 520 |
+ In order to ensure consistent handling of these exceptions, this function
|
|
| 521 |
+ should be used instead of `os.rename`
|
|
| 522 |
+ """
|
|
| 523 |
+ if ensure_parents:
|
|
| 524 |
+ os.makedirs(os.path.dirname(destination), exist_ok=True)
|
|
| 525 |
+ |
|
| 526 |
+ try:
|
|
| 527 |
+ os.rename(source, destination)
|
|
| 528 |
+ except OSError as exc:
|
|
| 529 |
+ if exc.errno in (errno.EEXIST, errno.ENOTEMPTY):
|
|
| 530 |
+ raise DirectoryExistsError(*exc.args) from exc
|
|
| 531 |
+ raise
|
|
| 532 |
+ |
|
| 533 |
+ |
|
| 503 | 534 |
@contextmanager
|
| 504 | 535 |
def save_file_atomic(filename, mode='w', *, buffering=-1, encoding=None,
|
| 505 | 536 |
errors=None, newline=None, closefd=True, opener=None, tempdir=None):
|
| ... | ... | @@ -147,6 +147,44 @@ The default mirror is defined by its name, e.g. |
| 147 | 147 |
``--default-mirror`` command-line option.
|
| 148 | 148 |
|
| 149 | 149 |
|
| 150 |
+Local cache expiry
|
|
| 151 |
+~~~~~~~~~~~~~~~~~~
|
|
| 152 |
+BuildStream locally caches artifacts, build trees, log files and sources within a
|
|
| 153 |
+cache located at ``~/.cache/buildstream`` (unless a ``$XDG_CACHE_HOME`` environment
|
|
| 154 |
+variable exists). When building large projects, this cache can get very large,
|
|
| 155 |
+thus BuildStream will attempt to clean up the cache automatically by expiring the least
|
|
| 156 |
+recently *used* artifacts.
|
|
| 157 |
+ |
|
| 158 |
+By default, cache expiry will begin once the file system which contains the cache
|
|
| 159 |
+approaches maximum usage. However, it is also possible to impose a quota on the local
|
|
| 160 |
+cache in the user configuration. This can be done in two ways:
|
|
| 161 |
+ |
|
| 162 |
+1. By restricting the maximum size of the cache directory itself.
|
|
| 163 |
+ |
|
| 164 |
+For example, to ensure that BuildStream's cache does not grow beyond 100 GB,
|
|
| 165 |
+simply declare the following in your user configuration (``~/.config/buildstream.conf``):
|
|
| 166 |
+ |
|
| 167 |
+.. code:: yaml
|
|
| 168 |
+ |
|
| 169 |
+ cache:
|
|
| 170 |
+ quota: 100G
|
|
| 171 |
+ |
|
| 172 |
+This quota defines the maximum size of the artifact cache in bytes.
|
|
| 173 |
+Accepted unit suffixes are K, M, G or T (or you can simply declare the value in bytes, without a suffix).
|
|
| 174 |
+This uses the same format as systemd's
|
|
| 175 |
+`resource-control <https://www.freedesktop.org/software/systemd/man/systemd.resource-control.html>`_.
|
|
| 176 |
+ |
|
| 177 |
+2. By expiring artifacts once the file system which contains the cache exceeds a specified usage.
|
|
| 178 |
+ |
|
| 179 |
+To ensure that we start cleaning the cache once we've used 80% of local disk space (on the file system
|
|
| 180 |
+which mounts the cache):
|
|
| 181 |
+ |
|
| 182 |
+.. code:: yaml
|
|
| 183 |
+ |
|
| 184 |
+ cache:
|
|
| 185 |
+ quota: 80%
|
|
| 186 |
+ |
|
| 187 |
+ |
|
| 150 | 188 |
Default configuration
|
| 151 | 189 |
---------------------
|
| 152 | 190 |
The default BuildStream configuration is specified here for reference:
|
| ... | ... | @@ -115,6 +115,7 @@ def test_build_track(cli, datafiles, tmpdir, ref_storage, |
| 115 | 115 |
args += ['0.bst']
|
| 116 | 116 |
|
| 117 | 117 |
result = cli.run(project=project, silent=True, args=args)
|
| 118 |
+ result.assert_success()
|
|
| 118 | 119 |
tracked_elements = result.get_tracked_elements()
|
| 119 | 120 |
|
| 120 | 121 |
assert set(tracked_elements) == set(tracked)
|
| ... | ... | @@ -27,4 +27,5 @@ def test_parse_size_over_1024T(cli, tmpdir): |
| 27 | 27 |
patched_statvfs = mock_os.mock_statvfs(f_bavail=bavail, f_bsize=BLOCK_SIZE)
|
| 28 | 28 |
with mock_os.monkey_patch("statvfs", patched_statvfs):
|
| 29 | 29 |
result = cli.run(project, args=["build", "file.bst"])
|
| 30 |
- assert "1025T of available system storage" in result.stderr
|
|
| 30 |
+ failure_msg = 'Your system does not have enough available space to support the cache quota specified.'
|
|
| 31 |
+ assert failure_msg in result.stderr
|
| 1 |
+import pytest
|
|
| 2 |
+ |
|
| 3 |
+from buildstream.utils import move_atomic, DirectoryExistsError
|
|
| 4 |
+ |
|
| 5 |
+ |
|
| 6 |
+@pytest.fixture
|
|
| 7 |
+def src(tmp_path):
|
|
| 8 |
+ src = tmp_path.joinpath("src")
|
|
| 9 |
+ src.mkdir()
|
|
| 10 |
+ |
|
| 11 |
+ with src.joinpath("test").open("w") as fp:
|
|
| 12 |
+ fp.write("test")
|
|
| 13 |
+ |
|
| 14 |
+ return src
|
|
| 15 |
+ |
|
| 16 |
+ |
|
| 17 |
+def test_move_to_empty_dir(src, tmp_path):
|
|
| 18 |
+ dst = tmp_path.joinpath("dst")
|
|
| 19 |
+ |
|
| 20 |
+ move_atomic(src, dst)
|
|
| 21 |
+ |
|
| 22 |
+ assert dst.joinpath("test").exists()
|
|
| 23 |
+ |
|
| 24 |
+ |
|
| 25 |
+def test_move_to_empty_dir_create_parents(src, tmp_path):
|
|
| 26 |
+ dst = tmp_path.joinpath("nested/dst")
|
|
| 27 |
+ |
|
| 28 |
+ move_atomic(src, dst)
|
|
| 29 |
+ assert dst.joinpath("test").exists()
|
|
| 30 |
+ |
|
| 31 |
+ |
|
| 32 |
+def test_move_to_empty_dir_no_create_parents(src, tmp_path):
|
|
| 33 |
+ dst = tmp_path.joinpath("nested/dst")
|
|
| 34 |
+ |
|
| 35 |
+ with pytest.raises(FileNotFoundError):
|
|
| 36 |
+ move_atomic(src, dst, ensure_parents=False)
|
|
| 37 |
+ |
|
| 38 |
+ |
|
| 39 |
+def test_move_non_existing_dir(tmp_path):
|
|
| 40 |
+ dst = tmp_path.joinpath("dst")
|
|
| 41 |
+ src = tmp_path.joinpath("src")
|
|
| 42 |
+ |
|
| 43 |
+ with pytest.raises(FileNotFoundError):
|
|
| 44 |
+ move_atomic(src, dst)
|
|
| 45 |
+ |
|
| 46 |
+ |
|
| 47 |
+def test_move_to_existing_empty_dir(src, tmp_path):
|
|
| 48 |
+ dst = tmp_path.joinpath("dst")
|
|
| 49 |
+ dst.mkdir()
|
|
| 50 |
+ |
|
| 51 |
+ move_atomic(src, dst)
|
|
| 52 |
+ assert dst.joinpath("test").exists()
|
|
| 53 |
+ |
|
| 54 |
+ |
|
| 55 |
+def test_move_to_existing_file(src, tmp_path):
|
|
| 56 |
+ dst = tmp_path.joinpath("dst")
|
|
| 57 |
+ |
|
| 58 |
+ with dst.open("w") as fp:
|
|
| 59 |
+ fp.write("error")
|
|
| 60 |
+ |
|
| 61 |
+ with pytest.raises(NotADirectoryError):
|
|
| 62 |
+ move_atomic(src, dst)
|
|
| 63 |
+ |
|
| 64 |
+ |
|
| 65 |
+def test_move_file_to_existing_file(tmp_path):
|
|
| 66 |
+ dst = tmp_path.joinpath("dst")
|
|
| 67 |
+ src = tmp_path.joinpath("src")
|
|
| 68 |
+ |
|
| 69 |
+ with src.open("w") as fp:
|
|
| 70 |
+ fp.write("src")
|
|
| 71 |
+ |
|
| 72 |
+ with dst.open("w") as fp:
|
|
| 73 |
+ fp.write("dst")
|
|
| 74 |
+ |
|
| 75 |
+ move_atomic(src, dst)
|
|
| 76 |
+ with dst.open() as fp:
|
|
| 77 |
+ assert fp.read() == "src"
|
|
| 78 |
+ |
|
| 79 |
+ |
|
| 80 |
+def test_move_to_existing_non_empty_dir(src, tmp_path):
|
|
| 81 |
+ dst = tmp_path.joinpath("dst")
|
|
| 82 |
+ dst.mkdir()
|
|
| 83 |
+ |
|
| 84 |
+ with dst.joinpath("existing").open("w") as fp:
|
|
| 85 |
+ fp.write("already there")
|
|
| 86 |
+ |
|
| 87 |
+ with pytest.raises(DirectoryExistsError):
|
|
| 88 |
+ move_atomic(src, dst)
|
