Files
aqtinstall/aqt/helper.py
David Dalcino 7a2e7faf53 Allow ListCommand to choose tool by version
This adds the function `ListCommand.fetch_tool_by_simple_spec`. This
allows the caller to specify a SimpleSpec and the name of a tool, and
the function will return the Updates.xml record for the specified tool
with the largest version number that satisfies the SimpleSpec. This is
meant to allow users to install tools without specifying an explicit
version number.

This also adds some test code to validate the complicated parts of this
code.

This also extends `helper.xml_to_modules`, so that a caller can
automatically get all tags in an XML element without explicitly
specifying them.
2021-07-09 17:02:50 -07:00

536 lines
20 KiB
Python

#!/usr/bin/env python
#
# Copyright (C) 2019-2021 Hiroshi Miura <miurahr@linux.com>
#
# Permission is hereby granted, free of charge, to any person obtaining a copy of
# this software and associated documentation files (the "Software"), to deal in
# the Software without restriction, including without limitation the rights to
# use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of
# the Software, and to permit persons to whom the Software is furnished to do so,
# subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS
# FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR
# COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER
# IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
# CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
import configparser
import hashlib
import json
import logging.config
import os
import re
import sys
import xml.etree.ElementTree as ElementTree
from logging import getLogger
from logging.handlers import QueueListener
from typing import Callable, Dict, Iterable, List, Optional
from urllib.parse import urlparse
import requests
import requests.adapters
from semantic_version import Version
from aqt.exceptions import ArchiveConnectionError, ArchiveDownloadError, CliInputError
class ArchiveId:
CATEGORIES = ("tools", "qt5", "qt6")
HOSTS = ("windows", "mac", "linux")
TARGETS_FOR_HOST = {
"windows": ["android", "desktop", "winrt"],
"mac": ["android", "desktop", "ios"],
"linux": ["android", "desktop"],
}
ALL_EXTENSIONS = (
"wasm",
"src_doc_examples",
"preview",
"wasm_preview",
"x86_64",
"x86",
"armv7",
"arm64_v8a",
)
def __init__(self, category: str, host: str, target: str, extension: str = ""):
if category not in ArchiveId.CATEGORIES:
raise ValueError("Category '{}' is invalid".format(category))
if host not in ArchiveId.HOSTS:
raise ValueError("Host '{}' is invalid".format(host))
if target not in ArchiveId.TARGETS_FOR_HOST[host]:
raise ValueError("Target '{}' is invalid".format(target))
if extension and extension not in ArchiveId.ALL_EXTENSIONS:
raise ValueError("Extension '{}' is invalid".format(extension))
self.category: str = category
self.host: str = host
self.target: str = target
self.extension: str = extension
def is_preview(self) -> bool:
return "preview" in self.extension if self.extension else False
def is_qt(self) -> bool:
return self.category.startswith("qt")
def is_tools(self) -> bool:
return self.category == "tools"
def is_no_arch(self) -> bool:
"""Returns True if there should be no arch attached to the module names"""
return self.extension in ("src_doc_examples",)
def is_major_ver_mismatch(self, qt_version: Version) -> bool:
"""Returns True if the version specifies a version different from the specified category"""
return self.is_qt() and int(self.category[-1]) != qt_version.major
def to_url(self, qt_version_no_dots: Optional[str] = None, file: str = "") -> str:
base = "online/qtsdkrepository/{os}{arch}/{target}/".format(
os=self.host,
arch="_x86" if self.host == "windows" else "_x64",
target=self.target,
)
if not qt_version_no_dots:
return base
folder = "{category}_{ver}{ext}/".format(
category=self.category,
ver=qt_version_no_dots,
ext="_" + self.extension if self.extension else "",
)
return base + folder + file
def __str__(self) -> str:
return "{cat}/{host}/{target}{ext}".format(
cat=self.category,
host=self.host,
target=self.target,
ext="" if not self.extension else "/" + self.extension,
)
def _get_meta(url: str):
return requests.get(url + ".meta4")
def _check_content_type(ct: str) -> bool:
candidate = ["application/metalink4+xml", "text/plain"]
return any(ct.startswith(t) for t in candidate)
def getUrl(url: str, timeout) -> str:
logger = getLogger("aqt.helper")
with requests.Session() as session:
retries = requests.adapters.Retry(
total=Settings.max_retries, backoff_factor=Settings.backoff_factor
)
adapter = requests.adapters.HTTPAdapter(max_retries=retries)
session.mount("http://", adapter)
session.mount("https://", adapter)
try:
r = requests.get(url, allow_redirects=False, timeout=timeout)
num_redirects = 0
while 300 < r.status_code < 309 and num_redirects < 10:
num_redirects += 1
logger.debug(
"Asked to redirect({}) to: {}".format(
r.status_code, r.headers["Location"]
)
)
newurl = altlink(r.url, r.headers["Location"])
logger.info("Redirected: {}".format(urlparse(newurl).hostname))
r = session.get(newurl, stream=True, timeout=timeout)
except (
ConnectionResetError,
requests.exceptions.ConnectionError,
requests.exceptions.Timeout,
):
raise ArchiveConnectionError("Failure to connect to {}".format(url))
else:
if r.status_code != 200:
logger.error(
"Failed to retrieve file at {}\n"
"Server response code: {}, reason: {}".format(
url, r.status_code, r.reason
)
)
raise ArchiveDownloadError("Failure to retrieve {}".format(url))
result = r.text
return result
def downloadBinaryFile(url: str, out: str, hash_algo: str, exp: str, timeout):
logger = getLogger("aqt.helper")
with requests.Session() as session:
retries = requests.adapters.Retry(
total=Settings.max_retries, backoff_factor=Settings.backoff_factor
)
adapter = requests.adapters.HTTPAdapter(max_retries=retries)
session.mount("http://", adapter)
session.mount("https://", adapter)
try:
r = session.get(url, allow_redirects=False, stream=True, timeout=timeout)
if 300 < r.status_code < 309:
logger.debug(
"Asked to redirect({}) to: {}".format(
r.status_code, r.headers["Location"]
)
)
newurl = altlink(r.url, r.headers["Location"])
logger.info("Redirected: {}".format(urlparse(newurl).hostname))
r = session.get(newurl, stream=True, timeout=timeout)
except requests.exceptions.ConnectionError as e:
logger.error("Connection error: %s" % e.args)
raise e
except requests.exceptions.Timeout as e:
logger.error("Connection timeout: %s" % e.args)
raise e
else:
hash = hashlib.new(hash_algo)
try:
with open(out, "wb") as fd:
for chunk in r.iter_content(chunk_size=8196):
fd.write(chunk)
hash.update(chunk)
fd.flush()
if exp is not None:
if hash.digest() != exp:
raise ArchiveDownloadError(
"Download file is corrupted! Detect checksum error.\nExpected {}, Actual {}".format(
exp, hash.digest()
)
)
except Exception as e:
exc = sys.exc_info()
logger.error("Download error: %s" % exc[1])
raise e
def altlink(url: str, alt: str):
"""
Blacklisting redirected(alt) location based on Settings.blacklist configuration.
When found black url, then try download a url + .meta4 that is a metalink version4
xml file, parse it and retrieve best alternative url.
"""
logger = getLogger("aqt.helper")
if not any(alt.startswith(b) for b in Settings.blacklist):
return alt
try:
m = _get_meta(url)
except requests.exceptions.ConnectionError:
logger.error("Got connection error. Fall back to recovery plan...")
return alt
else:
# Expected response->'application/metalink4+xml; charset=utf-8'
if not _check_content_type(m.headers["content-type"]):
logger.error(
"Unexpected meta4 response;content-type: {}".format(
m.headers["content-type"]
)
)
return alt
try:
mirror_xml = ElementTree.fromstring(m.text)
meta_urls = {}
for f in mirror_xml.iter("{urn:ietf:params:xml:ns:metalink}file"):
for u in f.iter("{urn:ietf:params:xml:ns:metalink}url"):
meta_urls[u.attrib["priority"]] = u.text
mirrors = [
meta_urls[i] for i in sorted(meta_urls.keys(), key=lambda x: int(x))
]
except Exception:
exc_info = sys.exc_info()
logger.error("Unexpected meta4 file; parse error: {}".format(exc_info[1]))
return alt
else:
# Return first priority item which is not blacklist in mirrors list,
# if not found then return alt in default
return next(
filter(
lambda mirror: not any(
mirror.startswith(b) for b in Settings.blacklist
),
mirrors,
),
alt,
)
class MyQueueListener(QueueListener):
def __init__(self, queue):
handlers = []
super().__init__(queue, *handlers)
def handle(self, record):
"""
Handle a record from subprocess.
Override logger name then handle at proper logger.
"""
record = self.prepare(record)
logger = getLogger("aqt.installer")
record.name = "aqt.installer"
logger.handle(record)
def to_version(qt_ver: str) -> Version:
"""Converts a Qt version string with dots (5.X.Y, etc) into a semantic version.
If the version ends in `-preview`, the version is treated as a preview release.
If the patch value is missing, patch is assumed to be zero.
If the version cannot be converted to a Version, a CliInputError is raised.
"""
match = re.match(r"^(\d+)\.(\d+)(\.(\d+)|-preview)$", qt_ver)
if not match:
raise CliInputError(
"Invalid version: '{}'! Please use the form '5.X.Y'.".format(qt_ver)
)
major, minor, end, patch = match.groups()
is_preview = end == "-preview"
return Version(
major=int(major),
minor=int(minor),
patch=int(patch) if patch else 0,
prerelease=("preview",) if is_preview else None,
)
def to_version_permissive(version_str: str) -> Version:
"""Converts a version string with dots (5.X.Y, etc) into a semantic version.
If the version omits either the patch or minor versions, they will be filled in with zeros,
and the remaining version string becomes part of the prerelease component.
If the version cannot be converted to a Version, a ValueError is raised.
This function is intended to be used on Version tags in an Updates.xml file.
to_version_permissive('1.33.1-202102101246') => Version('1.33.1-202102101246')
to_version_permissive('1.33-202102101246') => Version('1.33.0-202102101246') # tools_conan
to_version_permissive('2020-05-19-1') => Version('2020.0.0-05-19-1') # tools_vcredist
"""
match = re.match(r"^(\d+)(\.(\d+)(\.(\d+))?)?(.*)$", version_str)
if not match:
raise ValueError("Invalid version detected: '{}'".format(version_str))
major, dot_minor, minor, dot_patch, patch, prerelease = match.groups()
return Version(
"{}.{}.{}{}".format(
major, minor if minor else 0, patch if patch else 0, prerelease
)
)
def get_semantic_version(qt_ver: str, is_preview: bool) -> Optional[Version]:
"""Converts a Qt version string (596, 512, 5132, etc) into a semantic version.
This makes a lot of assumptions based on established patterns:
If is_preview is True, the number is interpreted as ver[0].ver[1:], with no patch.
If the version is 3 digits, then major, minor, and patch each get 1 digit.
If the version is 4 or more digits, then major gets 1 digit, minor gets 2 digits
and patch gets all the rest.
As of May 2021, the version strings at https://download.qt.io/online/qtsdkrepository
conform to this pattern; they are not guaranteed to do so in the future.
"""
if not qt_ver or any(not ch.isdigit() for ch in qt_ver):
return None
if is_preview:
return Version(
major=int(qt_ver[:1]),
minor=int(qt_ver[1:]),
patch=0,
prerelease=("preview",),
)
elif len(qt_ver) >= 4:
return Version(
major=int(qt_ver[:1]), minor=int(qt_ver[1:3]), patch=int(qt_ver[3:])
)
elif len(qt_ver) == 3:
return Version(
major=int(qt_ver[:1]), minor=int(qt_ver[1:2]), patch=int(qt_ver[2:])
)
elif len(qt_ver) == 2:
return Version(major=int(qt_ver[:1]), minor=int(qt_ver[1:2]), patch=0)
raise ValueError("Invalid version string '{}'".format(qt_ver))
def xml_to_modules(
xml_text: str,
predicate: Callable[[ElementTree.Element], bool],
keys_to_keep: Optional[Iterable[str]] = None,
) -> Dict[str, Dict[str, str]]:
"""Converts an XML document to a dict of `PackageUpdate` dicts, indexed by `Name` attribute.
Only report elements that satisfy `predicate(element)`.
Only report keys in the list `keys_to_keep`.
:param xml_text: The entire contents of an xml file
:param predicate: A function that decides which elements to keep or discard
:param keys_to_keep: A list of which tags in the element should be kept.
If the list is empty, then no tags will be kept.
If the list is None, then all tags will be kept.
"""
try:
parsed_xml = ElementTree.fromstring(xml_text)
except ElementTree.ParseError:
return {}
packages = {}
for packageupdate in parsed_xml.iter("PackageUpdate"):
if predicate and not predicate(packageupdate):
continue
name = packageupdate.find("Name").text
packages[name] = {}
if keys_to_keep is None:
for child in packageupdate:
packages[name][child.tag] = child.text
else:
for key in keys_to_keep:
packages[name][key] = getattr(packageupdate.find(key), "text", None)
return packages
class MyConfigParser(configparser.ConfigParser):
def getlist(self, section: str, option: str, fallback=[]) -> List[str]:
value = self.get(section, option)
try:
result = list(filter(None, (x.strip() for x in value.splitlines())))
except Exception:
result = fallback
return result
def getlistint(self, section: str, option: str, fallback=[]):
try:
result = [int(x) for x in self.getlist(section, option)]
except Exception:
result = fallback
return result
class SettingsClass:
"""
Class to hold configuration and settings.
Actual values are stored in 'settings.ini' file.
It also holds a combinations database.
"""
def __init__(self):
self.config = MyConfigParser()
self.configfile = os.path.join(os.path.dirname(__file__), "settings.ini")
self.loggingconf = os.path.join(os.path.dirname(__file__), "logging.ini")
def load_settings(self, file=None):
with open(
os.path.join(os.path.dirname(__file__), "combinations.json"),
"r",
) as j:
self._combinations = json.load(j)[0]
if file is not None:
if isinstance(file, str):
result = self.config.read(file)
if len(result) == 0:
raise IOError("Fails to load specified config file {}".format(file))
self.configfile = file
else:
# passed through command line argparse.FileType("r")
self.config.read_file(file)
self.configfile = file
file.close()
else:
if isinstance(self.configfile, str):
with open(self.configfile, "r") as f:
self.config.read_file(f)
else:
self.configfile.seek(0)
self.config.read_file(self.configfile)
@property
def qt_combinations(self):
return self._combinations["qt"]
@property
def tools_combinations(self):
return self._combinations["tools"]
@property
def available_versions(self):
return self._combinations["versions"]
@property
def available_offline_installer_version(self):
res = self._combinations["new_archive"]
res.extend(self._combinations["versions"])
return res
def available_modules(self, qt_version):
"""Known module names
:returns: dictionary of qt_version and module names
:rtype: List[str]
"""
modules = self._combinations["modules"]
versions = qt_version.split(".")
version = "{}.{}".format(versions[0], versions[1])
result = None
for record in modules:
if record["qt_version"] == version:
result = record["modules"]
return result
@property
def concurrency(self):
"""concurrency configuration.
:return: concurrency
:rtype: int
"""
return self.config.getint("aqt", "concurrency", fallback=4)
@property
def blacklist(self):
"""list of sites in a blacklist
:returns: list of site URLs(scheme and host part)
:rtype: List[str]
"""
return self.config.getlist("mirrors", "blacklist", fallback=[])
@property
def baseurl(self):
return self.config.get("aqt", "baseurl", fallback="https://download.qt.io")
@property
def connection_timeout(self):
return self.config.getfloat("requests", "connection_timeout", fallback=3.5)
@property
def response_timeout(self):
return self.config.getfloat("requests", "response_timeout", fallback=10)
@property
def max_retries(self):
return self.config.getfloat("requests", "max_retries", fallback=5)
@property
def backoff_factor(self):
return self.config.getfloat("requests", "retry_backoff", fallback=0.1)
@property
def fallbacks(self):
return self.config.getlist("mirrors", "fallbacks", fallback=[])
@property
def zipcmd(self):
return self.config.get("aqt", "7zcmd", fallback="7z")
@property
def kde_patches(self):
return self.config.getlist("kde_patches", "patches", fallback=[])
Settings = SettingsClass()
def setup_logging(env_key="LOG_CFG"):
config = os.getenv(env_key, None)
if config is not None and os.path.exists(config):
logging.config.fileConfig(config)
else:
logging.config.fileConfig(Settings.loggingconf)