Source code for bw_interface_schemas.models

import json
import re
from enum import StrEnum
from pathlib import Path
from typing import Annotated, Any, Literal, Self, Union

from pydantic import BaseModel, ConfigDict, Field, JsonValue, model_validator


[docs]
Identifier = Annotated[int | str, Field()]




[docs]
class Parsimonius(BaseModel):
    """Change default `model_dump` behaviour to not export unset values by default"""


[docs]
    model_config = ConfigDict(
        extra="allow",
    )



[docs]
    def model_dump(self, exclude_unset=True, *args, **kwargs):
        # Change default value of `exclude_unset` to `True`
        return super().model_dump(*args, exclude_unset=exclude_unset, **kwargs)





[docs]
class DataSource(Parsimonius):
    """
    A data source, such as a publication or field measurement.

    A very rough draft; expect changes.
    """


[docs]
    authors: list[str]


[docs]
    year: int


[docs]
    title: str


[docs]
    doi: str | None = None





[docs]
class NodeTypes(StrEnum):
    """
    The built-in node types. These are sufficient to describe standard life
    cycle assessment, but you can use custom types for new `Node` classes if
    needed.
    """


[docs]
    project = "project"


[docs]
    product_system = "product_system"


[docs]
    product_system_variant = "product_system_variant"


[docs]
    process = "process"


[docs]
    product = "product"


[docs]
    elementary_flow = "elementary_flow"


[docs]
    impact_assessment_method = "impact_assessment_method"


[docs]
    impact_category = "impact_category"


[docs]
    normalization = "normalization"


[docs]
    weighting = "weighting"





[docs]
class Node(Parsimonius):
    """
    Base class for nodes in the graph. Can include processes, products, and
    elementary flows, but also LCIA objects, and organizational tools like
    product systems and projects.

    All nodes must have a name and a type.
    """

    # Recommended labels for these attributes

[docs]
    name: str


[docs]
    node_type: NodeTypes | str

    # Comment can be a single string or something more structured.

[docs]
    comment: Union[str, dict[str, str], None] = None

    # Was previously classifications - we want something more generic
    # Tags are chosen from defined set of possibilities

[docs]
    tags: dict[str, JsonValue] | None = None





[docs]
class Collection(Node):
    """
    A `Collection` is a group of nodes organized in a common container.

    These nodes can be part of inventory supply chains, impact assessment methods,
    parameterization sets, or any other logical unit of organization.

    `Collection` nodes are normally linked to other nodes via qualitative
    relationship edges, such as `EdgeTypes.belongs_to`.

    The edge type should clearly differentiate the intended edge direction. In
    this case, a `Product` node (source) `belongs_to` a `Collection`.

    Collections can be nested. For example, a product system collection can
    belong to a project collection.
    """




[docs]
class Project(Collection):
    """
    A set of `ProductSystem` and `ImpactAssessmentMethod` collections which
    encapsulate a sustainability assessment project. Projects can be
    self-contained, or can link to other `Project` collections.
    """


[docs]
    node_type: Literal[NodeTypes.project] = NodeTypes.project





[docs]
class ProductSystem(Collection):
    """
    A collection of unit processes with elementary and product flows,
    performing one or more defined functions, and which models the life cycle
    of a product. From ISO 14040.
    """


[docs]
    license: str


[docs]
    node_type: Literal[NodeTypes.product_system] = NodeTypes.product_system


[docs]
    references: list[DataSource] | None = None





[docs]
class ImpactAssessmentMethod(Collection):
    """
    A set of impact categories, weightings, and normalizations, with their
    associated factors.
    """


[docs]
    license: str


[docs]
    node_type: Literal[NodeTypes.impact_assessment_method] = (
        NodeTypes.impact_assessment_method
    )


[docs]
    references: list[DataSource] | None = None





[docs]
class InventoryNode(Node):
    """
    Common base class for inventory nodes. Please only use subclasses of this
    node.
    """


[docs]
    location: str | None = None


[docs]
    references: list[DataSource] | None = None

    # Properties are quantitative but can be in a nested structure like
    # `{"a": {"amount": 7}}`

[docs]
    properties: dict[str, JsonValue] | None = None





[docs]
class Process(InventoryNode):
    """
    The smallest element considered in the life cycle inventory analysis for
    which input and output data are quantified. From ISO 14040.

    Can have one or more functional product edges. Multfunctional processes
    still have the type `NodeTypes.process`.

    Processes extend `InventoryNode` with a required `location` (string).
    """


[docs]
    node_type: Literal[NodeTypes.process] = NodeTypes.process


[docs]
    location: str


    # TBD: Time range?



[docs]
class Product(InventoryNode):
    """
    Any good or service. From ISO 14040.

    Products extend `InventoryNode` with a required `unit` - this unit is the
    default used for every edge consuming or producing this product.

    The functional unit of sustainability assessment is always product(s).
    """


[docs]
    node_type: Literal[NodeTypes.product] = NodeTypes.product


[docs]
    unit: str





[docs]
class ElementaryFlow(InventoryNode):
    """
    A material or energy entering the system being studied that has been drawn
    from the environment without previous human transformation, or material or
    energy leaving the system being studied that is released into the
    environment without subsequent human transformation. From ISO 14040.

    For sustainability assessment, an elementary flow is a concept (e.g. CO2)
    situated in a context (e.g. emission to air). The same underlying concept
    (e.g. CO2) can be both a product and an elementary flow, but because they
    operate in different contexts they are separate objects.

    Elementary flows extend `InventoryNode` with a required `unit` - this unit
    is the default used for every edge consuming or producing this product.
    They also require a `context`, which is a list of strings.
    """


[docs]
    node_type: Literal[NodeTypes.elementary_flow] = NodeTypes.elementary_flow


[docs]
    unit: str


[docs]
    context: list[str]





[docs]
class ImpactCategory(Node):
    """
    A class representing environmental issues of concern to which life cycle
    inventory analysis results may be assigned. From ISO 14040.

    In practical terms characterization is a list of factors (midpoint or
    endpoint) associated with elementary flows. This class stores metadata
    about the category, such as lineage and units.
    """


[docs]
    node_type: Literal[NodeTypes.impact_category] = NodeTypes.impact_category


[docs]
    name: list[str]


[docs]
    unit: str





[docs]
class Normalization(Node):
    """
    Normalization is the calculation of the magnitude of the category indicator
    results relative to some reference information. The aim of the
    normalization is to understand better the relative magnitude for each
    indicator result of the product system under study. From ISO 14044.

    In practical terms normalization is a list of factors associated with
    elementary flows. This class stores metadata about normalization.
    """


[docs]
    node_type: Literal[NodeTypes.normalization] = NodeTypes.normalization


[docs]
    name: list[str]


[docs]
    unit: str





[docs]
class Weighting(Node):
    """
    Weighting is the process of converting indicator results of different
    impact categories by using numerical factors based on value-choices. It may
    include aggregation of the weighted indicator results. From ISO 14044.

    In practical terms weighting is a single factor associated with a
    normalization or characterization set. This class stores metadata about
    weighting.
    """


[docs]
    node_type: Literal[NodeTypes.weighting] = NodeTypes.weighting


[docs]
    name: list[str]


[docs]
    unit: str





[docs]
class QualitativeEdgeTypes(StrEnum):

[docs]
    belongs_to = "belongs_to"


[docs]
    variant_of = "variant_of"





[docs]
class QuantitativeEdgeTypes(StrEnum):

[docs]
    technosphere = "technosphere"


[docs]
    biosphere = "biosphere"


[docs]
    characterization = "characterization"


[docs]
    weighting = "weighting"


[docs]
    normalization = "normalization"





[docs]
class Edge(Parsimonius):

[docs]
    edge_type: str


[docs]
    source: Identifier


[docs]
    target: Identifier


[docs]
    comment: Union[str, dict[str, str], None] = None


[docs]
    references: list[DataSource] | None = None


[docs]
    tags: dict[str, JsonValue] | None = None


[docs]
    properties: dict[str, JsonValue] | None = None





[docs]
class QualitativeEdge(Edge):
    """
    A qualitative edge linking two nodes in the graph.

    The type of relationship is defined by the `edge_type`. Normally these are
    drawn from `QualitativeEdgeTypes` but don't have to be.
    """


[docs]
    edge_type: QualitativeEdgeTypes





[docs]
class QuantitativeEdge(Edge):
    """An quantitative edge linking two nodes in the graph."""


[docs]
    edge_type: QuantitativeEdgeTypes


[docs]
    amount: float


[docs]
    uncertainty_type: int | None = None


[docs]
    loc: float | None = None


[docs]
    scale: float | None = None


[docs]
    shape: float | None = None


[docs]
    minimum: float | None = None


[docs]
    maximum: float | None = None


[docs]
    negative: bool | None = None





[docs]
class CharacterizationQuantitativeEdge(QuantitativeEdge):
    """"""


[docs]
    edge_type: Literal[QuantitativeEdgeTypes.characterization] = (
        QuantitativeEdgeTypes.characterization
    )


[docs]
    location: str | None = None





[docs]
class NormalizationQuantitativeEdge(QuantitativeEdge):
    """"""


[docs]
    edge_type: Literal[QuantitativeEdgeTypes.normalization] = (
        QuantitativeEdgeTypes.normalization
    )





[docs]
class WeightingQuantitativeEdge(QuantitativeEdge):
    """"""


[docs]
    edge_type: Literal[QuantitativeEdgeTypes.weighting] = (
        QuantitativeEdgeTypes.weighting
    )





[docs]
class BiosphereQuantitativeEdge(QuantitativeEdge):

[docs]
    edge_type: Literal[QuantitativeEdgeTypes.biosphere] = (
        QuantitativeEdgeTypes.biosphere
    )


    @model_validator(mode="before")
    @classmethod

[docs]
    def not_functional(cls, data):
        assert "functional" not in data, "biosphere edges can never be functional"
        return data





[docs]
class TechnosphereQuantitativeEdge(QuantitativeEdge):

[docs]
    functional: bool = False


[docs]
    edge_type: Literal[QuantitativeEdgeTypes.technosphere] = (
        QuantitativeEdgeTypes.technosphere
    )




if __name__ == "__main__":

[docs]
    hiss = lambda name: re.sub(r"(?<!^)(?=[A-Z])", "_", name).lower()

    dirpath = Path(__file__).parent / "json_schema"
    objects = [
        BiosphereQuantitativeEdge,
        CharacterizationQuantitativeEdge,
        ProductSystem,
        DataSource,
        Edge,
        ElementaryFlow,
        ImpactAssessmentMethod,
        ImpactCategory,
        InventoryNode,
        Node,
        Normalization,
        NormalizationQuantitativeEdge,
        Process,
        Product,
        Project,
        QualitativeEdge,
        QuantitativeEdge,
        TechnosphereQuantitativeEdge,
        Weighting,
        WeightingQuantitativeEdge,
    ]
    for obj in objects:
        with open(dirpath / (hiss(obj.__name__) + ".json"), "w") as f:
            json.dump(obj.model_json_schema(), f, indent=2, ensure_ascii=False)