Skip to content

Commit

Permalink
Rework _copy_decouple to follow relative symlinks and symlinks to dir…
Browse files Browse the repository at this point in the history
…ectories.

The previous code handled absolute symlinks fine but when there were relative symlinks it would
traceback.  Additionally, it did not handle symlinks to directories that occurred outside of
/etc/pki.  This should fix both of those.
  • Loading branch information
abadger committed Jan 11, 2024
1 parent fb2e2d8 commit 2df5bd2
Showing 1 changed file with 118 additions and 42 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -73,6 +73,10 @@ def _check_deprecated_rhsm_skip():
)


class BrokenSymlinkError(Exception):
"""Raised when we encounter a broken symlink where we weren't expecting it."""


class _InputData(object):
def __init__(self):
self._consume_data()
Expand Down Expand Up @@ -328,6 +332,81 @@ def _get_files_owned_by_rpms(context, dirpath, pkgs=None, recursive=False):
return files_owned_by_rpms


def _mkdir_with_copied_mode(path, mode_from):
"""
Create directories with a file to copy the mode from.
:param path: The directory path to create.
:param mode_from: A file or directory whose mode we will copy to the
newly created directory.
:raises subprocess.CalledProcessError: mkdir or chmod fails. For instance,
the directory already exists, the file to get permissions from does
not exist, a parent directory does not exist.
"""
# Create with maximally restrictive permissions
run(['mkdir', '-m', '0', '-p', path])
run(['chmod', '--reference={}'.format(mode_from), path])


def _copy_or_link(symlink, srcdir):
"""
Copy file contents or create a symlink depending on where the pointee resides.
:param symlink: The source symlink to follow. This must be an absolute path.
:returns: A tuple of action and sourcefile. Action is one of 'copy' or 'link' and means that
the caller should either copy the sourcefile to the target location or create a symlink from
the sourcefile to the target location. sourcefile is the path to the file that should be
the source of the operation. It is either a real file outside of the srcdir hierarchy or
a file (real, directory, symlink or otherwise) inside of the srcdir hierarchy.
:raises ValueError: if the arguments are not correct
:raises BrokenSymlinkError: if the symlink is invalid
Determine whether the file pointed to by the symlink chain is within srcdir. If it is within,
then create a synlink that points from symlink to it.
If it is not within, then walk the symlink chain until we find something that is within srcdir.
If we reach a real file and it is outside of srcdir, then copy the file instead.
"""
if not symlink.startswith('/'):
raise ValueError('File{} must be an absolute path!'.format(symlink))

# os.path.exists follows symlinks
if not os.path.exists(symlink):
raise BrokenSymlinkError('File {} is a broken symlink!'.format(symlink))

pointee_as_abspath = symlink
seen = set([pointee_as_abspath])

while os.path.islink(pointee_as_abspath):
pointee = os.readlink(pointee_as_abspath)

# Note: os.path.join()'s behaviour if the pointee is an absolute path
# essentially ignores the first argument (which is what we want).
pointee_as_abspath = os.path.normpath(os.path.join(os.path.dirname(pointee_as_abspath), pointee))

if pointee_as_abspath in seen:
# On Linux, this should not happen as the os.path.exists() call
# before the loop should catch it.
if symlink == pointee_as_abspath:
error_msg = ('File {} is a broken symlink that references'
' itself!'.format(pointee_as_abspath))
else:
error_msg = ('File {} references {} which is a broken symlink'
' that references itself!'.format(symlink, pointee_as_abspath))

raise BrokenSymlinkError(error_msg)

seen.add(pointee_as_abspath)

if pointee_as_abspath.startswith(srcdir):
# Absolute path inside of the correct dir so we need to link to it
return ("link", pointee_as_abspath)

# The is not a link so copy it
return ('copy', pointee_as_abspath)


def _copy_decouple(srcdir, dstdir):
"""
Copy `srcdir` to `dstdir` while decoupling symlinks.
Expand All @@ -340,56 +419,52 @@ def _copy_decouple(srcdir, dstdir):
"""

for root, dummy_dirs, files in os.walk(srcdir):
symlinks_to_process = []
for root, directories, files in os.walk(srcdir):
# relative path from srcdir because srcdir is replaced with dstdir for
# the copy.
relpath = os.path.relpath(root, srcdir)

# Create all directories with proper permissions for security
# reasons (Putting private data into directories that haven't had their
# permissions set appropriately may leak the private information.)
for directory in directories:
source_dirpath = os.path.join(root, directory)
target_dirpath = os.path.join(dstdir, relpath, directory)
_mkdir_with_copied_mode(target_dirpath, source_dirpath)

for filename in files:
relpath = os.path.relpath(root, srcdir)
source_filepath = os.path.join(root, filename)
target_filepath = os.path.join(dstdir, relpath, filename)

# Skip and report broken symlinks
if not os.path.exists(source_filepath):
api.current_logger().warning(
'File {} is a broken symlink! Will not copy the file.'.format(source_filepath))
continue

# Copy symlinks to the target userspace
source_is_symlink = os.path.islink(source_filepath)
pointee = None
if source_is_symlink:
pointee = os.readlink(source_filepath)

# If source file is a symlink within `srcdir` then preserve it,
# otherwise resolve and copy it as a file it points to
if pointee is not None and not pointee.startswith(srcdir):
# Follow the path until we hit a file or get back to /etc/pki
while not pointee.startswith(srcdir) and os.path.islink(pointee):
pointee = os.readlink(pointee)

# Pointee points to a _regular file_ outside /etc/pki so we
# copy it instead
if not pointee.startswith(srcdir) and not os.path.islink(pointee):
source_is_symlink = False
source_filepath = pointee
else:
# pointee points back to /etc/pki
pass

# Ensure parent directory exists
parent_dir = os.path.dirname(target_filepath)
# Note: This is secure because we know that parent_dir is located
# inside of `$target_userspace/etc/pki` which is a directory that
# is not writable by unprivileged users. If this function is used
# elsewhere we may need to be more careful before running `mkdir -p`.
run(['mkdir', '-p', parent_dir])

if source_is_symlink:
# Preserve the owner and permissions of the original symlink
run(['ln', '-s', pointee, target_filepath])
run(['chmod', '--reference={}'.format(source_filepath), target_filepath])
# Defer symlinks until later because we may end up having to copy
# the file contents and the directory may not exist yet.
if os.path.islink(source_filepath):
symlinks_to_process.append((source_filepath, target_filepath))
continue

# Not a symlink so we can copy it now too
run(['cp', '-a', source_filepath, target_filepath])

# Now process all symlinks
for source_linkpath, target_linkpath in symlinks_to_process:
try:
action, source_path = _copy_or_link(source_linkpath, srcdir)
except BrokenSymlinkError as e:
# Skip and report broken symlinks
api.current_logger().warning('{} Will not copy the file!'.format(str(e)))
continue

if action == "copy":
# Note: source_path could be a directory, so '-a' or '-r' must be
# given to cp.
run(['cp', '-a', source_path, target_linkpath])
elif action == 'link':
run(["ln", "-s", source_path, target_linkpath])
else:
# This will not happen unless _copy_or_link() has a bug.
raise RuntimeError("Programming error: _copy_or_link() returned an unknown action:{}".format(action))


def _copy_certificates(context, target_userspace):
"""
Expand All @@ -413,6 +488,7 @@ def _copy_certificates(context, target_userspace):

# Backup container /etc/pki
run(['mv', target_pki, backup_pki])
_mkdir_with_copied_mode(target_pki, backup_pki)

# Copy source /etc/pki to the container
_copy_decouple('/etc/pki', target_pki)
Expand Down

0 comments on commit 2df5bd2

Please sign in to comment.