mirror of
https://github.com/theupdateframework/python-tuf
synced 2026-05-24 10:08:28 +00:00
352 lines
10 KiB
Python
352 lines
10 KiB
Python
import functools
|
|
import imp
|
|
import json
|
|
import socket
|
|
import urllib
|
|
import urllib2
|
|
|
|
|
|
# We import them directly into our namespace so that there is no name conflict.
|
|
from configuration import ConfigurationParser, InvalidConfiguration
|
|
from utility import Logger
|
|
from updater import UpdaterController
|
|
|
|
|
|
# Deliberately empty, so that `from tuf.interposition import *` exports no names.
__all__ = []
|
|
|
|
|
|
# TODO:
|
|
# - Document design decisions.
|
|
# - Interposition: Honour urllib/urllib2 contract.
|
|
# - Review security issues resulting from regular expressions (e.g. complexity attacks).
|
|
# - Warn user when TUF is used without any configuration.
|
|
# - Override other default (e.g. HTTPS) urllib2 handlers.
|
|
# - Failsafe: If TUF fails, offer option to unsafely resort back to urllib/urllib2?
|
|
|
|
|
|
|
|
|
|
|
|
############################## GLOBAL VARIABLES ################################
|
|
|
|
|
|
|
|
|
|
|
|
# Constants
# Template for the warning logged when a non-GET request bypasses TUF.
NON_GET_HTTP_METHOD_MESSAGE = (
    "Skipping {method} request to {url} because it is not a GET request."
)

# Our own public copies of the urllib and urllib2 modules.
# Both start out as the None sentinel, meaning "not built yet".
urllib_tuf = urllib2_tuf = None

# A private, global Controller of Updaters.
__updater_controller = UpdaterController()
|
|
|
|
|
|
|
|
|
|
|
|
########################## GLOBAL PRIVATE FUNCTIONS ############################
|
|
|
|
|
|
|
|
|
|
|
|
def __load_module_copy(module_name, copy_name):
    """Find module_name and load a separate copy of it under copy_name.

    The file object handed out by imp.find_module() is always closed, even
    when loading the module fails; imp leaves that responsibility to the
    caller. Any exception raised while finding or loading propagates.
    """

    module_file, pathname, description = imp.find_module(module_name)
    try:
        return imp.load_module(copy_name, module_file, pathname, description)
    finally:
        # find_module() may return None instead of a file (e.g. for packages).
        if module_file is not None:
            module_file.close()


def __monkey_patch():
    """Build and monkey patch public copies of the urllib and urllib2 modules.

    The copies are stored in the module globals urllib_tuf and urllib2_tuf.
    A copy is only built while its global is still the None sentinel, so
    calling this function again does not rebuild an existing copy.

    We prefer simplicity, which leads to easier proof of security, even if it
    may come at the cost of not honouring some provisions of the urllib and
    urllib2 module contracts unrelated to security.

    References:
      http://stackoverflow.com/a/11285504
      http://docs.python.org/2/library/imp.html
    """

    global urllib_tuf
    global urllib2_tuf

    if urllib_tuf is None:
        urllib_tuf = __load_module_copy("urllib", "urllib_tuf")
        # Only reached when loading succeeded; failures propagate above.
        urllib_tuf.urlopen = __urllib_urlopen
        urllib_tuf.urlretrieve = __urllib_urlretrieve

    if urllib2_tuf is None:
        urllib2_tuf = __load_module_copy("urllib2", "urllib2_tuf")
        urllib2_tuf.urlopen = __urllib2_urlopen
|
|
|
|
|
|
|
|
|
|
|
|
def __urllib_urlopen(url, data=None, proxies=None):
    """Return a file-like object for reading from the given URL.

    If the updater controller has an updater for url, the document is opened
    through that updater (proxies is not passed on in that case). Otherwise
    the call is forwarded unchanged to urllib.urlopen.
    """

    tuf_updater = __updater_controller.get(url)

    # No updater for this URL: fall back to the stock urllib behaviour.
    if tuf_updater is None:
        return urllib.urlopen(url, data=data, proxies=proxies)

    return tuf_updater.open(url, data=data)
|
|
|
|
|
|
|
|
|
|
|
|
def __urllib_urlretrieve(url, filename=None, reporthook=None, data=None):
    """Copy the network object denoted by a URL to a local file, if necessary.

    If the updater controller has an updater for url, its retrieve() method
    is called with the same arguments. Otherwise the call is forwarded
    unchanged to urllib.urlretrieve.
    """

    tuf_updater = __updater_controller.get(url)

    # No updater for this URL: fall back to the stock urllib behaviour.
    if tuf_updater is None:
        return urllib.urlretrieve(
            url, filename=filename, reporthook=reporthook, data=data)

    return tuf_updater.retrieve(
        url, filename=filename, reporthook=reporthook, data=data)
|
|
|
|
|
|
|
|
|
|
|
|
def __urllib2_urlopen(url, data=None, timeout=socket._GLOBAL_DEFAULT_TIMEOUT):
    """Return a file-like object for reading from the given URL.

    url is assumed to be URL-like: either a string or a urllib2.Request.

    - A urllib2.Request whose method is not GET is logged with a warning and
      forwarded unchanged to urllib2.urlopen.
    - Otherwise the updater controller is asked for an updater matching the
      URL string. If there is none, the call is forwarded unchanged to
      urllib2.urlopen; if there is one, the document is opened through it.
    """

    # Reduce the argument to a plain URL string, so that the very same value
    # is used both to look up the updater and to open the document with it.
    if isinstance(url, urllib2.Request):
        if url.get_method() != "GET":
            # Not a GET HTTP method: revert to default behaviour.
            Logger.warn(NON_GET_HTTP_METHOD_MESSAGE.format(
                method=url.get_method(), url=url.get_full_url()))
            return urllib2.urlopen(url, data=data, timeout=timeout)

        target_url = url.get_full_url()
    else:
        # ...otherwise, we assume this is a string.
        target_url = url

    updater = __updater_controller.get(target_url)

    if updater is None:
        # Pass the caller's original object (string or Request) to urllib2.
        return urllib2.urlopen(url, data=data, timeout=timeout)

    response = updater.open(target_url, data=data)
    # See urllib2.AbstractHTTPHandler.do_open
    # TODO: let Updater handle this
    response.msg = ""
    return response
|
|
|
|
|
|
|
|
|
|
|
|
########################### GLOBAL PUBLIC FUNCTIONS ############################
|
|
|
|
|
|
|
|
def __read_configuration(configuration_handler,
                         filename="tuf.interposition.json",
                         parent_repository_directory=None,
                         parent_ssl_certificates_directory=None):
    """Read TUF interposition configurations from a JSON file and handle them.

    The "configurations" object of the JSON document in filename maps network
    locations to configurations. Each one is parsed with ConfigurationParser,
    passed to configuration_handler, and then recorded under its hostname.
    configuration_handler must be a function which accepts a
    tuf.interposition.Configuration instance.

    Raises InvalidConfiguration when the file holds no configurations. Any
    exception raised while reading, parsing or handling is logged and then
    re-raised.

    Returns the parsed configurations as a dictionary of configurations
    indexed by hostnames.
    """

    INVALID_TUF_CONFIGURATION = "Invalid configuration for {network_location}!"
    INVALID_TUF_INTERPOSITION_JSON = "Invalid configuration in {filename}!"
    NO_CONFIGURATIONS = "No configurations found in configuration in {filename}!"

    # Configurations indexed by hostnames.
    parsed_configurations = {}

    try:
        with open(filename) as json_file:
            document = json.load(json_file)
            configurations = document.get("configurations", {})

            if not len(configurations):
                raise InvalidConfiguration(
                    NO_CONFIGURATIONS.format(filename=filename))

            for network_location, raw_configuration in configurations.iteritems():
                try:
                    parser = ConfigurationParser(
                        network_location,
                        raw_configuration,
                        parent_repository_directory=parent_repository_directory,
                        parent_ssl_certificates_directory=parent_ssl_certificates_directory)

                    configuration = parser.parse()
                    configuration_handler(configuration)
                    parsed_configurations[configuration.hostname] = configuration

                # Bare except on purpose: log whatever went wrong, then re-raise.
                except:
                    Logger.exception(INVALID_TUF_CONFIGURATION.format(
                        network_location=network_location))
                    raise

    # Bare except on purpose: log whatever went wrong, then re-raise.
    except:
        Logger.exception(
            INVALID_TUF_INTERPOSITION_JSON.format(filename=filename))
        raise

    return parsed_configurations
|
|
|
|
|
|
|
|
|
|
|
|
# TODO: Is parent_repository_directory a security risk? For example, would it
|
|
# allow the user to overwrite another TUF repository metadata on the filesystem?
|
|
# On the other hand, it is beyond TUF's scope to handle filesystem permissions.
|
|
# TODO: Ditto for the parent_ssl_certificates_directory parameter.
|
|
|
|
def configure(filename="tuf.interposition.json",
              parent_repository_directory=None,
              parent_ssl_certificates_directory=None):
    """Read TUF interposition configurations and add them to the controller.

    Every configuration parsed from filename is passed to the add() method of
    the private, global updater controller.

    The optional parent_repository_directory parameter specifies the
    containing parent directory of the "repository_directory" given in a
    configuration, for *all* network locations, because sometimes the
    absolute location of the "repository_directory" is only known at runtime.
    If you need a different parent_repository_directory for other network
    locations, simply call this function again with different parameters.

    The optional parent_ssl_certificates_directory parameter works likewise.

    Example of a TUF interposition configuration JSON object:

    {
        "configurations": {
            "seattle.cs.washington.edu": {
                "repository_directory": "client/",
                "repository_mirrors" : {
                    "mirror1": {
                        "url_prefix": "http://seattle-tuf.cs.washington.edu",
                        "metadata_path": "metadata",
                        "targets_path": "targets",
                        "confined_target_dirs": [ "" ]
                    }
                },
                ("target_paths": [
                    { ".*/(simple/\\w+)/$": "{0}/index.html" },
                    { ".*/(packages/.+)$": "{0}" }
                ],
                "ssl_certificates": "cacert.pem")
            }
        }
    }

    "target_paths" is optional: If you do not tell TUF to selectively match
    paths with regular expressions, TUF will work over any path under the
    given network location. However, if you do specify it, you are then
    telling TUF how to transform a specified path into another one, and TUF
    will *not* recognize any unspecified path for the given network location.

    Unless any "url_prefix" begins with "https://", "ssl_certificates" is
    optional; it must specify certificates bundled as PEM (RFC 1422).

    Returns the parsed configurations as a dictionary of configurations
    indexed by hostnames.
    """

    return __read_configuration(
        __updater_controller.add,
        filename=filename,
        parent_repository_directory=parent_repository_directory,
        parent_ssl_certificates_directory=parent_ssl_certificates_directory)
|
|
|
|
|
|
|
|
|
|
|
|
def deconfigure(configurations):
    """Remove TUF interposition for previously read configurations.

    configurations is a dictionary of configurations, such as the one
    returned by configure(). Each of its values is passed to the remove()
    method of the private, global updater controller.
    """

    previously_read = configurations.itervalues()

    for parsed_configuration in previously_read:
        __updater_controller.remove(parsed_configuration)
|
|
|
|
|
|
|
|
|
|
|
|
def open_url(instancemethod):
    """Decorate an instance method of the form instancemethod(self, url, ...)
    with me in order to pass it to TUF.

    The wrapper reads the URL from the first positional argument after self
    and the request data from the "data" keyword argument only. Non-GET
    urllib2.Request objects, and URLs for which the updater controller has no
    updater, are handed to the undecorated method unchanged.
    """

    @functools.wraps(instancemethod)
    def wrapper(self, *args, **kwargs):
        # We assume that the first argument to instancemethod is a URL-like
        # object; that is, either a string or a urllib2.Request.
        target = args[0]
        payload = kwargs.get("data")

        if not isinstance(target, urllib2.Request):
            # Not a urllib2.Request, so we assume this is a string.
            address = target
        elif target.get_method() == "GET":
            # A GET request: check with TUF using the full URL.
            address = target.get_full_url()
        else:
            # Any other HTTP method: revert to default behaviour.
            Logger.warn(NON_GET_HTTP_METHOD_MESSAGE.format(
                method=target.get_method(), url=target.get_full_url()))
            return instancemethod(self, *args, **kwargs)

        updater = __updater_controller.get(address)

        if updater is not None:
            # TUF has been configured for this URL: use it to get the document.
            return updater.open(address, data=payload)

        # TUF has not been configured for this URL: revert to default behaviour.
        return instancemethod(self, *args, **kwargs)

    return wrapper
|
|
|
|
|
|
|
|
|
|
|
|
############################## GLOBAL SIDE EFFECTS #############################
|
|
|
|
|
|
|
|
|
|
|
|
# Import-time side effect: build the monkey-patched urllib_tuf and urllib2_tuf
# copies of the urllib and urllib2 modules.
__monkey_patch()
|
|
|
|
|
|
|
|
|
|
|