python-tuf/tests/test_updater_ng.py
2026-02-19 14:46:40 +01:00

368 lines
14 KiB
Python

# Copyright 2021, New York University and the TUF contributors
# SPDX-License-Identifier: MIT OR Apache-2.0
"""Test Updater class"""
from __future__ import annotations
import logging
import os
import shutil
import sys
import tempfile
import unittest
from collections.abc import Iterable
from typing import TYPE_CHECKING, ClassVar
from unittest.mock import MagicMock, patch
from securesystemslib.signer import Signer
from tests import utils
from tuf.api import exceptions
from tuf.api.metadata import (
Metadata,
Root,
Snapshot,
TargetFile,
Targets,
Timestamp,
)
from tuf.ngclient import Updater, UpdaterConfig
if TYPE_CHECKING:
from collections.abc import Callable, Iterable
logger = logging.getLogger(__name__)
class TestUpdater(unittest.TestCase):
"""Test the Updater class from 'tuf/ngclient/updater.py'."""
server_process_handler: ClassVar[utils.TestServerProcess]
@classmethod
def setUpClass(cls) -> None:
cls.tmp_test_root_dir = tempfile.mkdtemp(dir=os.getcwd())
# Launch a SimpleHTTPServer
# Test cases will request metadata and target files that have been
# pre-generated in 'tuf/tests/repository_data', and are copied to
# CWD/tmp_test_root_dir/*
cls.server_process_handler = utils.TestServerProcess(log=logger)
@classmethod
def tearDownClass(cls) -> None:
# Cleans resources, flush the logged lines (if any) and remove test dir
cls.server_process_handler.clean()
shutil.rmtree(cls.tmp_test_root_dir)
def setUp(self) -> None:
# Create tmp test dir inside of tmp test root dir to independently serve
# new repository files for each test. We delete all tmp dirs at once in
# tearDownClass after the server has released all resources.
self.tmp_test_dir = tempfile.mkdtemp(dir=self.tmp_test_root_dir)
# Copy the original repository files provided in the test folder so that
# any modifications are restricted to the copies.
# The 'repository_data' directory is expected to exist in 'tuf.tests/'.
original_repository_files = os.path.join(
utils.TESTS_DIR, "repository_data"
)
original_repository = os.path.join(
original_repository_files, "repository"
)
original_keystore = os.path.join(original_repository_files, "keystore")
original_client = os.path.join(
original_repository_files,
"client",
"test_repository1",
"metadata",
"current",
)
# Save references to the often-needed client repository directories.
# Test cases need these references to access metadata and target files.
self.repository_directory = os.path.join(
self.tmp_test_dir, "repository"
)
self.keystore_directory = os.path.join(self.tmp_test_dir, "keystore")
self.client_directory = os.path.join(self.tmp_test_dir, "client")
# Copy the original 'repository', 'client', and 'keystore' directories
# to the temporary repository the test cases can use.
shutil.copytree(original_repository, self.repository_directory)
shutil.copytree(original_client, self.client_directory)
shutil.copytree(original_keystore, self.keystore_directory)
# 'path/to/tmp/repository' -> 'localhost:8001/tmp/repository'.
repository_basepath = self.repository_directory[len(os.getcwd()) :]
url_prefix = (
"http://"
+ utils.TEST_HOST_ADDRESS
+ ":"
+ str(self.server_process_handler.port)
+ repository_basepath.replace("\\", "/")
)
self.metadata_url = f"{url_prefix}/metadata/"
self.targets_url = f"{url_prefix}/targets/"
self.dl_dir = tempfile.mkdtemp(dir=self.tmp_test_dir)
# Creating a repository instance. The test cases will use this client
# updater to refresh metadata, fetch target files, etc.
self.updater = Updater(
metadata_dir=self.client_directory,
metadata_base_url=self.metadata_url,
target_dir=self.dl_dir,
target_base_url=self.targets_url,
bootstrap=None,
)
def tearDown(self) -> None:
# Logs stdout and stderr from the sever subprocess.
self.server_process_handler.flush_log()
def _modify_repository_root(
self,
modification_func: Callable[[Metadata], None],
bump_version: bool = False,
) -> None:
"""Apply 'modification_func' to root and persist it."""
role_path = os.path.join(
self.repository_directory, "metadata", "root.json"
)
root = Metadata[Root].from_file(role_path)
modification_func(root)
if bump_version:
root.signed.version += 1
root_key_path = os.path.join(self.keystore_directory, "root_key")
uri = f"file2:{root_key_path}"
role = root.signed.get_delegated_role(Root.type)
key = root.signed.get_key(role.keyids[0])
signer = Signer.from_priv_key_uri(uri, key)
root.sign(signer)
root.to_file(
os.path.join(self.repository_directory, "metadata", "root.json")
)
root.to_file(
os.path.join(
self.repository_directory,
"metadata",
f"{root.signed.version}.root.json",
)
)
def _assert_files_exist(self, roles: Iterable[str]) -> None:
"""Assert that local metadata files match 'roles'"""
expected_files = [f"{role}.json" for role in roles]
found_files = [
e.name for e in os.scandir(self.client_directory) if e.is_file()
]
self.assertListEqual(sorted(found_files), sorted(expected_files))
def test_refresh_and_download(self) -> None:
# Test refresh without consistent targets - targets without hash prefix.
# top-level targets are already in local cache (but remove others)
os.remove(os.path.join(self.client_directory, "role1.json"))
os.remove(os.path.join(self.client_directory, "role2.json"))
# top-level metadata is in local directory already
self.updater.refresh()
self._assert_files_exist(
[Root.type, Snapshot.type, Targets.type, Timestamp.type]
)
# Get targetinfos, assert that cache does not contain files
info1 = self.updater.get_targetinfo("file1.txt")
assert isinstance(info1, TargetFile)
self._assert_files_exist(
[Root.type, Snapshot.type, Targets.type, Timestamp.type]
)
# Get targetinfo for 'file3.txt' listed in the delegated role1
info3 = self.updater.get_targetinfo("file3.txt")
assert isinstance(info3, TargetFile)
expected_files = [
"role1",
Root.type,
Snapshot.type,
Targets.type,
Timestamp.type,
]
self._assert_files_exist(expected_files)
self.assertIsNone(self.updater.find_cached_target(info1))
self.assertIsNone(self.updater.find_cached_target(info3))
# Download files, assert that cache has correct files
self.updater.download_target(info1)
path = self.updater.find_cached_target(info1)
self.assertEqual(path, os.path.join(self.dl_dir, info1.path))
self.assertIsNone(self.updater.find_cached_target(info3))
self.updater.download_target(info3)
path = self.updater.find_cached_target(info1)
self.assertEqual(path, os.path.join(self.dl_dir, info1.path))
path = self.updater.find_cached_target(info3)
self.assertEqual(path, os.path.join(self.dl_dir, info3.path))
def test_refresh_with_only_local_root(self) -> None:
os.remove(os.path.join(self.client_directory, "timestamp.json"))
os.remove(os.path.join(self.client_directory, "snapshot.json"))
os.remove(os.path.join(self.client_directory, "targets.json"))
os.remove(os.path.join(self.client_directory, "role1.json"))
os.remove(os.path.join(self.client_directory, "role2.json"))
self._assert_files_exist([Root.type])
self.updater.refresh()
self._assert_files_exist(
[Root.type, Snapshot.type, Targets.type, Timestamp.type]
)
# Get targetinfo for 'file3.txt' listed in the delegated role1
self.updater.get_targetinfo("file3.txt")
expected_files = [
"role1",
Root.type,
Snapshot.type,
Targets.type,
Timestamp.type,
]
self._assert_files_exist(expected_files)
def test_implicit_refresh_with_only_local_root(self) -> None:
os.remove(os.path.join(self.client_directory, "timestamp.json"))
os.remove(os.path.join(self.client_directory, "snapshot.json"))
os.remove(os.path.join(self.client_directory, "targets.json"))
os.remove(os.path.join(self.client_directory, "role1.json"))
os.remove(os.path.join(self.client_directory, "role2.json"))
self._assert_files_exist(["root"])
# Get targetinfo for 'file3.txt' listed in the delegated role1
self.updater.get_targetinfo("file3.txt")
expected_files = ["role1", "root", "snapshot", "targets", "timestamp"]
self._assert_files_exist(expected_files)
def test_both_target_urls_not_set(self) -> None:
# target_base_url = None and Updater._target_base_url = None
updater = Updater(
self.client_directory,
self.metadata_url,
self.dl_dir,
bootstrap=None,
)
info = TargetFile(1, {"sha256": ""}, "targetpath")
with self.assertRaises(ValueError):
updater.download_target(info)
def test_no_target_dir_no_filepath(self) -> None:
# filepath = None and Updater.target_dir = None
updater = Updater(
self.client_directory, self.metadata_url, bootstrap=None
)
info = TargetFile(1, {"sha256": ""}, "targetpath")
with self.assertRaises(ValueError):
updater.find_cached_target(info)
with self.assertRaises(ValueError):
updater.download_target(info)
def test_external_targets_url(self) -> None:
self.updater.refresh()
info = self.updater.get_targetinfo("file1.txt")
assert isinstance(info, TargetFile)
self.updater.download_target(info, target_base_url=self.targets_url)
def test_length_hash_mismatch(self) -> None:
self.updater.refresh()
targetinfo = self.updater.get_targetinfo("file1.txt")
assert isinstance(targetinfo, TargetFile)
length = targetinfo.length
with self.assertRaises(exceptions.RepositoryError):
targetinfo.length = 44
self.updater.download_target(targetinfo)
with self.assertRaises(exceptions.RepositoryError):
targetinfo.length = length
targetinfo.hashes = {"sha256": "abcd"}
self.updater.download_target(targetinfo)
def test_updating_root(self) -> None:
# Bump root version, resign and refresh
self._modify_repository_root(lambda _: None, bump_version=True)
self.updater.refresh()
self.assertEqual(self.updater._trusted_set.root.version, 2)
def test_missing_targetinfo(self) -> None:
self.updater.refresh()
# Get targetinfo for non-existing file
self.assertIsNone(self.updater.get_targetinfo("file33.txt"))
@patch.object(os, "replace", wraps=os.replace)
@patch.object(os, "remove", wraps=os.remove)
def test_persist_metadata_fails(
self, wrapped_remove: MagicMock, wrapped_replace: MagicMock
) -> None:
# Testing that when write succeeds (the file is created) and replace
# fails by throwing OSError, then the file will be deleted.
wrapped_replace.side_effect = OSError()
with self.assertRaises(OSError):
self.updater._persist_metadata("target", b"data")
wrapped_replace.assert_called_once()
wrapped_remove.assert_called_once()
# Assert that the created tempfile during writing is eventually deleted
# or in other words, there is no temporary file left in the folder.
for filename in os.listdir(self.updater._dir):
self.assertFalse(filename.startswith("tmp"))
def test_invalid_target_base_url(self) -> None:
info = TargetFile(1, {"sha256": ""}, "targetpath")
with self.assertRaises(exceptions.DownloadError):
self.updater.download_target(
info, target_base_url="http://invalid/"
)
def test_non_existing_target_file(self) -> None:
info = TargetFile(1, {"sha256": ""}, "/non_existing_file.txt")
# When non-existing target file is given, download fails with
# "404 Client Error: File not found for url"
with self.assertRaises(exceptions.DownloadHTTPError):
self.updater.download_target(info)
def test_user_agent(self) -> None:
# test default
self.updater.refresh()
poolmgr = self.updater._fetcher._proxy_env.get_pool_manager(
"http", "localhost"
)
ua = poolmgr.headers["User-Agent"]
self.assertEqual(ua[:11], "python-tuf/")
# test custom UA
updater = Updater(
self.client_directory,
self.metadata_url,
self.dl_dir,
self.targets_url,
config=UpdaterConfig(app_user_agent="MyApp/1.2.3"),
bootstrap=None,
)
updater.refresh()
poolmgr = updater._fetcher._proxy_env.get_pool_manager(
"http", "localhost"
)
ua = poolmgr.headers["User-Agent"]
self.assertEqual(ua[:23], "MyApp/1.2.3 python-tuf/")
if __name__ == "__main__":
utils.configure_test_logging(sys.argv)
unittest.main()