-
Notifications
You must be signed in to change notification settings - Fork 11
Expand file tree
/
Copy pathreaders.py
More file actions
89 lines (63 loc) · 2.54 KB
/
readers.py
File metadata and controls
89 lines (63 loc) · 2.54 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
import numpy as np
import xarray as xr
from sqlalchemy import CheckConstraint, ForeignKey
from sqlalchemy.orm import DeclarativeBase, Mapped, mapped_column
class TableBase(DeclarativeBase):
    """Declarative base class; collects the schema metadata for all model tables."""

    pass
class Regions(TableBase):
    """A region, identified solely by its name (referenced by ``Demand.region``)."""

    __tablename__ = "regions"
    # Region name doubles as the primary key.
    name: Mapped[str] = mapped_column(primary_key=True)
class Commodities(TableBase):
    """A commodity with its category and measurement unit (referenced by ``Demand.commodity``)."""

    __tablename__ = "commodities"
    # Commodity name doubles as the primary key.
    name: Mapped[str] = mapped_column(primary_key=True)
    # Category is restricted at the database level to these four values.
    type: Mapped[str] = mapped_column(
        CheckConstraint("type IN ('energy', 'service', 'material', 'environmental')")
    )
    # Free-form unit string (e.g. energy or mass unit — not validated here).
    unit: Mapped[str]
class Demand(TableBase):
    """Demand for a commodity in a region for a given year.

    The composite primary key is (year, commodity, region).
    """

    __tablename__ = "demand"
    year: Mapped[int] = mapped_column(primary_key=True, autoincrement=False)
    commodity: Mapped[Commodities] = mapped_column(
        ForeignKey("commodities.name"),
        primary_key=True,
        # The CSV file uses the header "commodity_name" for this column;
        # read_csv consults column.info["header"] when building its SELECT list.
        info=dict(header="commodity_name"),
    )
    region: Mapped[Regions] = mapped_column(
        ForeignKey("regions.name"), primary_key=True
    )
    demand: Mapped[float]
def read_inputs(data_dir):
    """Load model input CSV files from *data_dir* into an in-memory DuckDB.

    Creates the schema declared on ``TableBase``, bulk-loads regions.csv,
    commodities.csv and demand.csv (in that order, since demand carries
    foreign keys to the other two), and returns derived datasets.

    Args:
        data_dir: path-like directory containing the input CSV files.

    Returns:
        dict with key ``"global_commodities"`` holding the xarray Dataset
        produced by :func:`calculate_global_commodities`.
    """
    from sqlalchemy import create_engine

    engine = create_engine("duckdb:///:memory:")
    TableBase.metadata.create_all(engine)

    # Grab the raw DBAPI connection: read_csv relies on DuckDB-specific
    # APIs (read_csv / fetchnumpy) that SQLAlchemy does not expose.
    raw = engine.raw_connection()
    try:
        con = raw.driver_connection
        # Regions and commodities must exist before demand (FK targets).
        with open(data_dir / "regions.csv") as f:
            read_csv(f, Regions, con)
        with open(data_dir / "commodities.csv") as f:
            commodities = read_csv(f, Commodities, con)
        with open(data_dir / "demand.csv") as f:
            read_csv(f, Demand, con)
    finally:
        # Release the connection and drop the in-memory database; the
        # numpy result dicts fetched above remain valid afterwards.
        raw.close()
        engine.dispose()

    data = {}
    data["global_commodities"] = calculate_global_commodities(commodities)
    return data
def read_csv(buffer_, table_class, con):
    """Load a CSV stream into *table_class*'s table and return its full contents.

    Args:
        buffer_: open text stream (file object) containing the CSV data,
            with a header row.
        table_class: declarative model whose ``__tablename__`` / columns
            describe the target table. A column's ``info["header"]``, when
            present, names the CSV header to read for that column.
        con: DuckDB DBAPI connection (must expose ``read_csv`` and
            ``fetchnumpy``).

    Returns:
        dict of numpy arrays, one per table column (``fetchnumpy`` result).
    """
    table_name = table_class.__tablename__
    # SELECT list in table-column order, honouring per-column CSV header
    # overrides (e.g. Demand.commodity reads the "commodity_name" header).
    columns = ", ".join(
        column.info.get("header", column.name)
        for column in table_class.__table__.columns
    )
    # NOTE: `rel` looks unused (hence the noqa) but is NOT dead — the SQL
    # below references it by name ("FROM rel") via DuckDB's replacement
    # scan of local Python variables. Do not rename or remove it.
    rel = con.read_csv(buffer_, header=True, delimiter=",")  # noqa: F841
    con.execute(f"INSERT INTO {table_name} SELECT {columns} FROM rel")
    # Return everything just inserted as a dict of numpy arrays.
    return con.execute(f"SELECT * from {table_name}").fetchnumpy()
def calculate_global_commodities(commodities):
    """Build an xarray Dataset of commodity attributes keyed by commodity name.

    Args:
        commodities: mapping with "name", "type" and "unit" numpy arrays,
            as returned by ``read_csv`` for the commodities table.

    Returns:
        xarray.Dataset with data variables ``type`` and ``unit`` along a
        ``commodity`` coordinate holding the commodity names.
    """
    as_str = np.dtype("str")
    coords = dict(commodity=commodities["name"].astype(as_str))
    # One DataArray per attribute column, all sharing the name coordinate.
    data_vars = {
        field: xr.DataArray(
            data=commodities[field].astype(as_str),
            dims=["commodity"],
            coords=coords,
        )
        for field in ("type", "unit")
    }
    return xr.Dataset(data_vars=data_vars)