"""The artifact reader objects."""
import abc
import glob
import os
import json
import yaml
from artifacts import artifact
from artifacts import definitions
from artifacts import errors
[docs]
class BaseArtifactsReader:
    """Interface shared by all artifacts readers.

    The reading methods are decorated with abc.abstractmethod. Note that this
    class does not declare an abc.ABCMeta metaclass, so the decorators act as
    markers only and the class can still be instantiated.

    Attributes:
        supported_os (set[str]): supported operating systems.
    """

    def __init__(self):
        """Initializes an artifacts reader with no supported operating systems."""
        super().__init__()
        self.supported_os = set()

    @abc.abstractmethod
    def ReadArtifactDefinitionValues(self, artifact_definition_values):
        """Builds an artifact definition from a dictionary of values.

        Args:
            artifact_definition_values (dict[str, object]): artifact definition
                values.

        Returns:
            ArtifactDefinition: an artifact definition.

        Raises:
            FormatError: if the format of the artifact definition is not set
                or incorrect.
        """

    @abc.abstractmethod
    def ReadDirectory(self, path, extension=None):
        """Reads the artifact definitions stored in a directory.

        Sub directories are not visited.

        Args:
            path (str): path of the directory to read from.
            extension (Optional[str]): extension of the filenames to read.

        Yields:
            ArtifactDefinition: an artifact definition.
        """

    @abc.abstractmethod
    def ReadFile(self, filename):
        """Reads the artifact definitions stored in a file.

        Args:
            filename (str): name of the file to read from.

        Yields:
            ArtifactDefinition: an artifact definition.
        """

    @abc.abstractmethod
    def ReadFileObject(self, file_object):
        """Reads the artifact definitions provided by a file-like object.

        Args:
            file_object (file): file-like object to read from.

        Yields:
            ArtifactDefinition: an artifact definition.

        Raises:
            FormatError: if the format of the artifact definition is not set
                or incorrect.
        """
[docs]
class ArtifactsReader(BaseArtifactsReader):
    """Artifacts reader common functionality.

    Implements the format independent parts of reading artifact definitions:
    validation of the definition values and reading from directories and
    files. Sub classes provide ReadFileObject for a specific serialization.
    """

    def __init__(self):
        """Initializes an artifacts reader."""
        super().__init__()
        self.supported_os = set(definitions.SUPPORTED_OS)

    # Pylint fails on detecting the type of definition_object based on
    # the docstring.
    # pylint: disable=missing-type-doc
    def _ReadSupportedOS(self, definition_values, definition_object, name):
        """Reads the optional artifact or source type supported OS.

        On success the supported_os attribute of definition_object is set to
        the list read from definition_values (an empty list when absent).

        Args:
            definition_values (dict[str, object]): artifact definition values.
            definition_object (ArtifactDefinition|SourceType): the definition
                object.
            name (str): name of the artifact definition.

        Raises:
            FormatError: if supported_os is not a list, contains values that
                cannot be compared or if there are undefined supported
                operating systems.
        """
        supported_os = definition_values.get("supported_os", [])
        if not isinstance(supported_os, list):
            supported_os_type = type(supported_os)
            raise errors.FormatError(
                f"Invalid supported_os type: {supported_os_type!s}"
            )

        try:
            undefined_supported_os = set(supported_os).difference(
                self.supported_os
            )
        except TypeError as exception:
            # Unhashable entries, such as nested lists or dictionaries, are a
            # format problem of the definition, not a programming error.
            raise errors.FormatError(
                f"Artifact definition: {name:s} invalid supported_os value "
                f"with error: {exception!s}"
            ) from exception

        if undefined_supported_os:
            # Stringify and sort so that non-string entries do not break the
            # join and the error message is deterministic.
            undefined_supported_os = ", ".join(
                sorted(str(value) for value in undefined_supported_os)
            )
            raise errors.FormatError(
                f"Artifact definition: {name:s} undefined supported operating "
                f"system: {undefined_supported_os:s}."
            )

        definition_object.supported_os = supported_os

    def _ReadSources(self, artifact_definition_values, artifact_definition, name):
        """Reads the artifact definition sources.

        Every source is appended to artifact_definition and its optional
        supported_os is validated against that of the artifact definition.

        Args:
            artifact_definition_values (dict[str, object]): artifact definition
                values.
            artifact_definition (ArtifactDefinition): an artifact definition.
            name (str): name of the artifact definition.

        Raises:
            FormatError: if the sources are missing or malformed, the type
                indicator is not set or unsupported, or if required attributes
                are missing.
        """
        sources = artifact_definition_values.get("sources")
        if not sources:
            raise errors.FormatError(
                f"Invalid artifact definition: {name:s} missing sources."
            )

        if not isinstance(sources, (list, tuple)):
            raise errors.FormatError(
                f"Invalid artifact definition: {name:s} sources is not a list."
            )

        for source in sources:
            # Guard against scalar entries, which would otherwise fail with an
            # AttributeError on source.get().
            if not isinstance(source, dict):
                raise errors.FormatError(
                    f"Invalid artifact definition: {name:s} source is not a "
                    f"dictionary."
                )

            type_indicator = source.get("type", None)
            if not type_indicator:
                raise errors.FormatError(
                    f"Invalid artifact definition: {name:s} source type."
                )

            attributes = source.get("attributes", None)

            try:
                source_type = artifact_definition.AppendSource(
                    type_indicator, attributes
                )
            except errors.FormatError as exception:
                raise errors.FormatError(
                    f"Invalid artifact definition: {name:s}, with error: {exception!s}"
                ) from exception

            # TODO: deprecate these left overs from the collector definition.
            if source_type:
                if source.get("returned_types", None):
                    raise errors.FormatError(
                        f"Invalid artifact definition: {name:s} returned_types no "
                        f"longer supported."
                    )

                self._ReadSupportedOS(source, source_type, name)

                # A source must not support an operating system that the
                # artifact definition itself does not declare.
                if set(source_type.supported_os) - set(
                    artifact_definition.supported_os
                ):
                    raise errors.FormatError(
                        f"Invalid artifact definition: {name:s} missing "
                        f"supported_os."
                    )

    def ReadArtifactDefinitionValues(self, artifact_definition_values):
        """Reads an artifact definition from a dictionary.

        Args:
            artifact_definition_values (dict[str, object]): artifact definition
                values.

        Returns:
            ArtifactDefinition: an artifact definition.

        Raises:
            FormatError: if the format of the artifact definition is not set
                or incorrect.
        """
        if not artifact_definition_values:
            raise errors.FormatError("Missing artifact definition values.")

        different_keys = set(artifact_definition_values) - definitions.TOP_LEVEL_KEYS
        if different_keys:
            # Keys are stringified since serialized data can contain
            # non-string keys; sorting keeps the message deterministic.
            different_keys = ", ".join(sorted(str(key) for key in different_keys))
            raise errors.FormatError(f"Undefined keys: {different_keys:s}")

        name = artifact_definition_values.get("name", None)
        if not name:
            raise errors.FormatError("Invalid artifact definition missing name.")

        # The description is assumed to be mandatory.
        description = artifact_definition_values.get("doc", None)
        if not description:
            raise errors.FormatError(
                f"Invalid artifact definition: {name:s} missing description."
            )

        aliases = artifact_definition_values.get("aliases", None)

        artifact_definition = artifact.ArtifactDefinition(
            name, aliases=aliases, description=description
        )

        if artifact_definition_values.get("collectors", []):
            raise errors.FormatError(
                f"Invalid artifact definition: {name:s} still uses collectors."
            )

        urls = artifact_definition_values.get("urls", [])
        if not isinstance(urls, list):
            raise errors.FormatError(
                f"Invalid artifact definition: {name:s} urls is not a list."
            )

        # The supported operating systems must be set before the sources are
        # read, since every source is validated against them.
        self._ReadSupportedOS(artifact_definition_values, artifact_definition, name)

        artifact_definition.urls = urls

        self._ReadSources(artifact_definition_values, artifact_definition, name)

        return artifact_definition

    def ReadDirectory(self, path, extension="yaml"):
        """Reads artifact definitions from a directory.

        This function does not recurse sub directories. Files are read in
        sorted order and directory entries that are not regular files are
        skipped.

        Args:
            path (str): path of the directory to read from.
            extension (Optional[str]): extension of the filenames to read.

        Yields:
            ArtifactDefinition: an artifact definition.
        """
        if extension:
            filename_pattern = f"*.{extension:s}"
        else:
            filename_pattern = "*"

        # Escape the directory so that glob metacharacters in its name, such
        # as "[" or "*", are matched literally.
        glob_spec = os.path.join(glob.escape(path), filename_pattern)

        for artifact_file in sorted(glob.glob(glob_spec)):
            # The pattern can also match sub directories, which cannot be
            # opened as a file.
            if os.path.isfile(artifact_file):
                yield from self.ReadFile(artifact_file)

    def ReadFile(self, filename):
        """Reads artifact definitions from a file.

        The file is opened as UTF-8 encoded text.

        Args:
            filename (str): name of the file to read from.

        Yields:
            ArtifactDefinition: an artifact definition.
        """
        with open(filename, encoding="utf-8") as file_object:
            yield from self.ReadFileObject(file_object)

    @abc.abstractmethod
    def ReadFileObject(self, file_object):
        """Reads artifact definitions from a file-like object.

        Args:
            file_object (file): file-like object to read from.

        Yields:
            ArtifactDefinition: an artifact definition.

        Raises:
            FormatError: if the format of the artifact definition is not set
                or incorrect.
        """
[docs]
class JsonArtifactsReader(ArtifactsReader):
    """JSON artifacts reader."""

    def ReadFileObject(self, file_object):
        """Reads artifact definitions from a file-like object.

        The JSON data is expected to be a list of dictionaries, one per
        artifact definition.

        Args:
            file_object (file): file-like object to read from.

        Yields:
            ArtifactDefinition: an artifact definition.

        Raises:
            FormatError: if the format of the JSON artifact definition is not set
                or incorrect.
        """
        # TODO: add try, except?
        # Errors raised by json.loads on malformed JSON are deliberately not
        # converted here, so they reach the caller unchanged.
        json_definitions = json.loads(file_object.read())

        if not isinstance(json_definitions, list):
            json_definitions_type = type(json_definitions)
            raise errors.FormatError(
                f"JSON markup did not produce a list: {json_definitions_type!s}"
            )

        last_artifact_definition = None
        for json_definition in json_definitions:
            # Same guard as the YAML reader: anything but a dictionary cannot
            # be an artifact definition.
            if not isinstance(json_definition, dict):
                raise errors.FormatError(
                    f"JSON markup did not produce a dictionary: {json_definition!r}"
                )

            try:
                artifact_definition = self.ReadArtifactDefinitionValues(json_definition)
            except errors.FormatError as exception:
                # Point at the last definition that was read successfully, since
                # the failing one might not have a usable name.
                error_location = "At start"
                if last_artifact_definition:
                    error_location = f"After: {last_artifact_definition.name:s}"
                raise errors.FormatError(
                    f"{error_location:s} {exception!s}"
                ) from exception

            yield artifact_definition
            last_artifact_definition = artifact_definition
[docs]
class YamlArtifactsReader(ArtifactsReader):
    """YAML artifacts reader."""

    def ReadFileObject(self, file_object):
        """Reads artifact definitions from a file-like object.

        Every YAML document in the stream is expected to be a dictionary that
        describes one artifact definition.

        Args:
            file_object (file): file-like object to read from.

        Yields:
            ArtifactDefinition: an artifact definition.

        Raises:
            FormatError: if the format of the YAML artifact definition is not set
                or incorrect.
        """
        # TODO: add try, except?
        # NOTE(review): errors raised by the YAML parser itself are not
        # converted to FormatError here - confirm whether callers rely on that.
        yaml_generator = yaml.safe_load_all(file_object)

        last_artifact_definition = None
        for yaml_definition in yaml_generator:
            if not isinstance(yaml_definition, dict):
                raise errors.FormatError(
                    f"YAML markup did not produce a dictionary: {yaml_definition!r}"
                )

            try:
                artifact_definition = self.ReadArtifactDefinitionValues(yaml_definition)
            except errors.FormatError as exception:
                # Point at the last definition that was read successfully, since
                # the failing one might not have a usable name.
                error_location = "At start"
                if last_artifact_definition:
                    error_location = f"After: {last_artifact_definition.name:s}"
                raise errors.FormatError(
                    f"{error_location:s} {exception!s}"
                ) from exception

            yield artifact_definition
            last_artifact_definition = artifact_definition