summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorTiago Gomes <tiago.gomes@codethink.co.uk>2018-07-16 16:45:16 +0100
committerTiago Gomes <tiago.gomes@codethink.co.uk>2018-07-20 12:25:35 +0100
commit90a204d50b4a2d14dc880531cfd7291fbdc8318f (patch)
tree0febc18faf6c588e8e0ae4779c3595ab1324d56c
parent21fb826dc90570914bb2e80a8348d408dec44be7 (diff)
downloadbuildstream-tiagogomes/tarball_checkout_1.2.tar.gz
Add support for creating a tarball on bst checkouttiagogomes/tarball_checkout_1.2
One of the tests added is configured to be skipped for now, as dumping binary data is causing a bad descriptor exception when using the pytest capture module. Closes #263.
-rw-r--r--NEWS9
-rw-r--r--buildstream/_frontend/cli.py24
-rw-r--r--buildstream/_stream.py114
-rw-r--r--man/bst-checkout.112
-rw-r--r--tests/frontend/buildcheckout.py109
5 files changed, 229 insertions, 39 deletions
diff --git a/NEWS b/NEWS
index c9ac8c366..e04136583 100644
--- a/NEWS
+++ b/NEWS
@@ -1,4 +1,12 @@
=================
+buildstream 1.1.5
+=================
+
+ o Add a `--tar` option to `bst checkout` which allows a tarball to be
+ created from the artifact contents.
+
+
+=================
buildstream 1.1.4
=================
@@ -19,6 +27,7 @@ buildstream 1.1.4
runs out of space. The exact behavior is configurable in the user's
buildstream.conf.
+
=================
buildstream 1.1.3
=================
diff --git a/buildstream/_frontend/cli.py b/buildstream/_frontend/cli.py
index 1639cb910..bf5312c86 100644
--- a/buildstream/_frontend/cli.py
+++ b/buildstream/_frontend/cli.py
@@ -626,7 +626,7 @@ def shell(app, element, sysroot, mount, isolate, build_, command):
##################################################################
@cli.command(short_help="Checkout a built artifact")
@click.option('--force', '-f', default=False, is_flag=True,
- help="Overwrite files existing in checkout directory")
+ help="Allow files to be overwritten")
@click.option('--deps', '-d', default='run',
type=click.Choice(['run', 'none']),
help='The dependencies to checkout (default: run)')
@@ -634,20 +634,30 @@ def shell(app, element, sysroot, mount, isolate, build_, command):
help="Whether to run integration commands")
@click.option('--hardlinks', default=False, is_flag=True,
help="Checkout hardlinks instead of copies (handle with care)")
+@click.option('--tar', default=False, is_flag=True,
+ help="Create a tarball from the artifact contents instead "
+ "of a file tree. If LOCATION is '-', the tarball "
+ "will be dumped to the standard output.")
@click.argument('element',
type=click.Path(readable=False))
-@click.argument('directory', type=click.Path(file_okay=False))
+@click.argument('location', type=click.Path())
@click.pass_obj
-def checkout(app, element, directory, force, deps, integrate, hardlinks):
- """Checkout a built artifact to the specified directory
+def checkout(app, element, location, force, deps, integrate, hardlinks, tar):
+ """Checkout a built artifact to the specified location
"""
+
+ if hardlinks and tar:
+ click.echo("ERROR: options --hardlinks and --tar conflict", err=True)
+ sys.exit(-1)
+
with app.initialized():
app.stream.checkout(element,
- directory=directory,
- deps=deps,
+ location=location,
force=force,
+ deps=deps,
integrate=integrate,
- hardlinks=hardlinks)
+ hardlinks=hardlinks,
+ tar=tar)
##################################################################
diff --git a/buildstream/_stream.py b/buildstream/_stream.py
index 646b7a27c..843c8e8e2 100644
--- a/buildstream/_stream.py
+++ b/buildstream/_stream.py
@@ -20,6 +20,7 @@
# Tristan Maat <tristan.maat@codethink.co.uk>
import os
+import sys
import stat
import shlex
import shutil
@@ -350,56 +351,91 @@ class Stream():
# checkout()
#
- # Checkout the pipeline target artifact to the specified directory
+ # Checkout target artifact to the specified location
#
# Args:
# target (str): Target to checkout
- # directory (str): The directory to checkout the artifact to
- # force (bool): Force overwrite files which exist in `directory`
+ # location (str): Location to checkout the artifact to
+ # force (bool): Whether files can be overwritten if necessary
+ # deps (str): The dependencies to checkout
# integrate (bool): Whether to run integration commands
# hardlinks (bool): Whether checking out files hardlinked to
# their artifacts is acceptable
+ # tar (bool): If true, a tarball from the artifact contents will
+ # be created, otherwise the file tree of the artifact
+ # will be placed at the given location. If true and
+ # location is '-', the tarball will be dumped on the
+ # standard output.
#
def checkout(self, target, *,
- deps='run',
- directory=None,
+ location=None,
force=False,
+ deps='run',
integrate=True,
- hardlinks=False):
+ hardlinks=False,
+ tar=False):
# We only have one target in a checkout command
elements, _ = self._load((target,), (), fetch_subprojects=True)
target = elements[0]
- try:
- os.makedirs(directory, exist_ok=True)
- except OSError as e:
- raise StreamError("Failed to create checkout directory: {}".format(e)) from e
-
- if not os.access(directory, os.W_OK):
- raise StreamError("Directory {} not writable".format(directory))
+ if not tar:
+ try:
+ os.makedirs(location, exist_ok=True)
+ except OSError as e:
+ raise StreamError("Failed to create checkout directory: '{}'"
+ .format(e)) from e
- if not force and os.listdir(directory):
- raise StreamError("Checkout directory is not empty: {}"
- .format(directory))
+ if not tar:
+ if not os.access(location, os.W_OK):
+ raise StreamError("Checkout directory '{}' not writable"
+ .format(location))
+ if not force and os.listdir(location):
+ raise StreamError("Checkout directory '{}' not empty"
+ .format(location))
+ elif os.path.exists(location) and location != '-':
+ if not os.access(location, os.W_OK):
+ raise StreamError("Output file '{}' not writable"
+ .format(location))
+ if not force and os.path.exists(location):
+ raise StreamError("Output file '{}' already exists"
+ .format(location))
# Stage deps into a temporary sandbox first
try:
- with target._prepare_sandbox(Scope.RUN, None, deps=deps, integrate=integrate) as sandbox:
+ with target._prepare_sandbox(Scope.RUN, None, deps=deps,
+ integrate=integrate) as sandbox:
# Copy or move the sandbox to the target directory
sandbox_root = sandbox.get_directory()
- with target.timed_activity("Checking out files in {}".format(directory)):
- try:
- if hardlinks:
- self._checkout_hardlinks(sandbox_root, directory)
- else:
- utils.copy_files(sandbox_root, directory)
- except OSError as e:
- raise StreamError("Failed to checkout files: {}".format(e)) from e
+ if not tar:
+ with target.timed_activity("Checking out files in '{}'"
+ .format(location)):
+ try:
+ if hardlinks:
+ self._checkout_hardlinks(sandbox_root, location)
+ else:
+ utils.copy_files(sandbox_root, location)
+ except OSError as e:
+ raise StreamError("Failed to checkout files: '{}'"
+ .format(e)) from e
+ else:
+ if location == '-':
+ with target.timed_activity("Creating tarball"):
+ with os.fdopen(sys.stdout.fileno(), 'wb') as fo:
+ with tarfile.open(fileobj=fo, mode="w|") as tf:
+ Stream._add_directory_to_tarfile(
+ tf, sandbox_root, '.')
+ else:
+ with target.timed_activity("Creating tarball '{}'"
+ .format(location)):
+ with tarfile.open(location, "w:") as tf:
+ Stream._add_directory_to_tarfile(
+ tf, sandbox_root, '.')
+
except BstError as e:
- raise StreamError("Error while staging dependencies into a sandbox: {}".format(e),
- reason=e.reason) from e
+ raise StreamError("Error while staging dependencies into a sandbox"
+ ": '{}'".format(e), reason=e.reason) from e
# workspace_open
#
@@ -1025,6 +1061,30 @@ class Stream():
else:
utils.link_files(sandbox_root, directory)
+ # Add a directory entry deterministically to a tar file
+ #
+ # This function takes extra steps to ensure the output is deterministic.
+ # First, it sorts the results of os.listdir() to ensure the ordering of
+ # the files in the archive is the same. Second, it sets a fixed
+ # timestamp for each entry. See also https://bugs.python.org/issue24465.
+ @staticmethod
+ def _add_directory_to_tarfile(tf, dir_name, dir_arcname, mtime=0):
+ for filename in sorted(os.listdir(dir_name)):
+ name = os.path.join(dir_name, filename)
+ arcname = os.path.join(dir_arcname, filename)
+
+ tarinfo = tf.gettarinfo(name, arcname)
+ tarinfo.mtime = mtime
+
+ if tarinfo.isreg():
+ with open(name, "rb") as f:
+ tf.addfile(tarinfo, f)
+ elif tarinfo.isdir():
+ tf.addfile(tarinfo)
+ Stream._add_directory_to_tarfile(tf, name, arcname, mtime)
+ else:
+ tf.addfile(tarinfo)
+
# Write the element build script to the given directory
def _write_element_script(self, directory, element):
try:
diff --git a/man/bst-checkout.1 b/man/bst-checkout.1
index 7f213be82..fcd212e8d 100644
--- a/man/bst-checkout.1
+++ b/man/bst-checkout.1
@@ -3,14 +3,14 @@
bst\-checkout \- Checkout a built artifact
.SH SYNOPSIS
.B bst checkout
-[OPTIONS] ELEMENT DIRECTORY
+[OPTIONS] ELEMENT LOCATION
.SH DESCRIPTION
-Checkout a built artifact to the specified directory
+Checkout a built artifact to the specified location
.SH OPTIONS
.TP
\fB\-f,\fP \-\-force
-Overwrite files existing in checkout directory
+Allow files to be overwritten
.TP
\fB\-d,\fP \-\-deps [run|none]
The dependencies to checkout (default: run)
@@ -19,4 +19,8 @@ The dependencies to checkout (default: run)
Whether to run integration commands
.TP
\fB\-\-hardlinks\fP
-Checkout hardlinks instead of copies (handle with care) \ No newline at end of file
+Checkout hardlinks instead of copies (handle with care)
+.TP
+\fB\-\-tar\fP
+Create a tarball from the artifact contents instead of a file tree. If
+LOCATION is '-', the tarball will be dumped to the standard output.
diff --git a/tests/frontend/buildcheckout.py b/tests/frontend/buildcheckout.py
index 0fce355d4..1ec8f491f 100644
--- a/tests/frontend/buildcheckout.py
+++ b/tests/frontend/buildcheckout.py
@@ -1,4 +1,6 @@
import os
+import tarfile
+import hashlib
import pytest
from tests.testutils import cli, create_repo, ALL_REPO_KINDS
@@ -54,7 +56,6 @@ def test_build_checkout(datafiles, cli, strict, hardlinks):
filename = os.path.join(checkout, 'usr', 'bin', 'hello')
assert os.path.exists(filename)
- # Check that the executable hello file is found in the checkout
filename = os.path.join(checkout, 'usr', 'include', 'pony.h')
assert os.path.exists(filename)
@@ -96,6 +97,88 @@ def test_build_checkout_deps(datafiles, cli, deps):
@pytest.mark.datafiles(DATA_DIR)
+def test_build_checkout_tarball(datafiles, cli):
+ project = os.path.join(datafiles.dirname, datafiles.basename)
+ checkout = os.path.join(cli.directory, 'checkout.tar')
+
+ result = cli.run(project=project, args=['build', 'target.bst'])
+ result.assert_success()
+
+ builddir = os.path.join(cli.directory, 'build')
+ assert os.path.isdir(builddir)
+ assert not os.listdir(builddir)
+
+ checkout_args = ['checkout', '--tar', 'target.bst', checkout]
+
+ result = cli.run(project=project, args=checkout_args)
+ result.assert_success()
+
+ tar = tarfile.TarFile(checkout)
+ assert os.path.join('.', 'usr', 'bin', 'hello') in tar.getnames()
+ assert os.path.join('.', 'usr', 'include', 'pony.h') in tar.getnames()
+
+
+@pytest.mark.skip(reason="Capturing the binary output is causing a stacktrace")
+@pytest.mark.datafiles(DATA_DIR)
+def test_build_checkout_tarball_stdout(datafiles, cli):
+ project = os.path.join(datafiles.dirname, datafiles.basename)
+ tarball = os.path.join(cli.directory, 'tarball.tar')
+
+ result = cli.run(project=project, args=['build', 'target.bst'])
+ result.assert_success()
+
+ builddir = os.path.join(cli.directory, 'build')
+ assert os.path.isdir(builddir)
+ assert not os.listdir(builddir)
+
+ checkout_args = ['checkout', '--tar', 'target.bst', '-']
+
+ result = cli.run(project=project, args=checkout_args)
+ result.assert_success()
+
+ with open(tarball, 'wb') as f:
+ f.write(result.output)
+
+ tar = tarfile.TarFile(tarball)
+ assert os.path.join('.', 'usr', 'bin', 'hello') in tar.getnames()
+ assert os.path.join('.', 'usr', 'include', 'pony.h') in tar.getnames()
+
+
+@pytest.mark.datafiles(DATA_DIR)
+def test_build_checkout_tarball_is_deterministic(datafiles, cli):
+ project = os.path.join(datafiles.dirname, datafiles.basename)
+ tarball1 = os.path.join(cli.directory, 'tarball1.tar')
+ tarball2 = os.path.join(cli.directory, 'tarball2.tar')
+
+ result = cli.run(project=project, args=['build', 'target.bst'])
+ result.assert_success()
+
+ builddir = os.path.join(cli.directory, 'build')
+ assert os.path.isdir(builddir)
+ assert not os.listdir(builddir)
+
+ checkout_args = ['checkout', '--force', '--tar', 'target.bst']
+
+ checkout_args1 = checkout_args + [tarball1]
+ result = cli.run(project=project, args=checkout_args1)
+ result.assert_success()
+
+ checkout_args2 = checkout_args + [tarball2]
+ result = cli.run(project=project, args=checkout_args2)
+ result.assert_success()
+
+ with open(tarball1, 'rb') as f:
+ contents = f.read()
+ hash1 = hashlib.sha1(contents).hexdigest()
+
+ with open(tarball2, 'rb') as f:
+ contents = f.read()
+ hash2 = hashlib.sha1(contents).hexdigest()
+
+ assert hash1 == hash2
+
+
+@pytest.mark.datafiles(DATA_DIR)
@pytest.mark.parametrize("hardlinks", [("copies"), ("hardlinks")])
def test_build_checkout_nonempty(datafiles, cli, hardlinks):
project = os.path.join(datafiles.dirname, datafiles.basename)
@@ -171,6 +254,30 @@ def test_build_checkout_force(datafiles, cli, hardlinks):
assert os.path.exists(filename)
+@pytest.mark.datafiles(DATA_DIR)
+def test_build_checkout_force_tarball(datafiles, cli):
+ project = os.path.join(datafiles.dirname, datafiles.basename)
+ tarball = os.path.join(cli.directory, 'tarball.tar')
+
+ result = cli.run(project=project, args=['build', 'target.bst'])
+ result.assert_success()
+
+ builddir = os.path.join(cli.directory, 'build')
+ assert os.path.isdir(builddir)
+ assert not os.listdir(builddir)
+
+ with open(tarball, "w") as f:
+ f.write("Hello")
+
+ checkout_args = ['checkout', '--force', '--tar', 'target.bst', tarball]
+
+ result = cli.run(project=project, args=checkout_args)
+ result.assert_success()
+
+ tar = tarfile.TarFile(tarball)
+ assert os.path.join('.', 'usr', 'bin', 'hello') in tar.getnames()
+ assert os.path.join('.', 'usr', 'include', 'pony.h') in tar.getnames()
+
fetch_build_checkout_combos = \
[("strict", kind) for kind in ALL_REPO_KINDS] + \
[("non-strict", kind) for kind in ALL_REPO_KINDS]