VirtualMicrogridSegmentation/virtual_microgrids/powerflow/pp_network.py at 7e570a97e1d0897ede9d7bb35210c9b7739190e5 · bmeyers/VirtualMicrogridSegmentation · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
import numpy as np
import pandas as pd
import pandapower as pp
from copy import deepcopy
from virtual_microgrids.configs import get_config
from virtual_microgrids.powerflow.network_generation import get_net
from virtual_microgrids.utils import Graph


class NetModel(object):
    """Building and interacting with a network model to simulate power flow.

    In this class we model all of the network component including loads,
    generators, batteries, lines, buses, and transformers. The state of each is
    tracked in a pandapower network object.
    """
    def __init__(self, config=None, env_name='Six_Bus_POC', baseline=True,
                 actor='DDPG'):
        """Initialize attributes of the object and zero out certain components
        in the standard test network."""

        if config is not None:
            self.config = config
            self.net = get_net(self.config)
        else:
            self.config = get_config(env_name, baseline, actor)
            self.net = get_net(self.config)

        self.reward_val = 0.0

        self.tstep = self.config.tstep
        self.net_zero_reward = self.config.net_zero_reward
        self.initial_net = pp.copy.deepcopy(self.net)
        self.time = 0
        self.n_load = len(self.net.load)
        self.n_sgen = len(self.net.sgen)
        self.n_gen = len(self.net.gen)
        self.n_storage = len(self.net.storage)
        if self.config.with_soc:
            self.observation_dim = self.n_load + self.n_sgen + self.n_storage
        else:
            self.observation_dim = self.n_load + self.n_sgen
        self.observation_dim *= 2
        self.action_dim = self.n_gen + self.n_storage
        self.graph = Graph(len(self.net.bus))
        for idx, entry in self.net.line.iterrows():
            self.graph.addEdge(entry.from_bus, entry.to_bus)
        for idx, entry in self.net.trafo.iterrows():
            self.graph.addEdge(entry.hv_bus, entry.lv_bus)

        self.current_state = None
        self.last_state = None


    def reset(self):
        """Reset the network and reward values back to how they were initialized."""
        if not self.config.randomize_env:
            self.net = pp.copy.deepcopy(self.initial_net)
        else:
            self.config = get_config(self.config.env_name, self.config.use_baseline,
                                     self.config.actor)
            self.net = get_net(self.config)
        self.reward_val = 0.0
        self.time = 0
        self.run_powerflow()
        self.current_state = self.get_state(self.config.with_soc)
        self.last_state = deepcopy(self.current_state)
        return np.concatenate([self.current_state, self.current_state - self.last_state])

    def step(self, p_set):
        """Update the simulation by one step

        :param p_set: 1D numpy array of floats, the action for the agent
        :return:
        """
        # Increment the time
        self.time += 1
        self.last_state = deepcopy(self.current_state)
        # Update non-controllable resources from their predefined data feeds
        new_loads = pd.Series(data=None, index=self.net.load.bus)
        new_sgens = pd.Series(data=None, index=self.net.sgen.bus)
        for bus, feed in self.config.static_feeds.items():
            if isinstance(feed, dict):
                for idx, feed2 in feed.items():
                    p_new = feed2[self.time]
                    if p_new > 0:
                        new_loads[bus] = p_new
                    else:
                        new_sgens[bus] = p_new
            else:
                p_new = feed[self.time]
                if p_new > 0:
                    new_loads[bus] = p_new
                else:
                    new_sgens[bus] = p_new
        self.update_loads(new_p=new_loads.values)
        self.update_static_generation(new_p=new_sgens.values)
        # Update controllable resources
        new_gens = p_set[:self.n_gen]
        new_storage = p_set[self.n_gen:]
        self.update_generation(new_p=new_gens)
        self.update_batteries(new_p=new_storage)
        # Run power flow
        self.run_powerflow()
        # Collect items to return
        state = self.get_state(self.config.with_soc)
        self.current_state = state
        reward = self.calculate_reward(eps=self.config.reward_epsilon)
        done = self.time >= self.config.max_ep_len
        info = ''
        return np.concatenate([self.current_state, self.current_state - self.last_state]), reward, done, info

    def get_state(self, with_soc=False):
        """Get the current state of the game

        The state is given by the power supplied or consumed by all devices
        on the network, plus the state of charge (SoC) of the batteries. This
        method defines a "global ordering" for this vector:
            - Non-controllable loads (power, kW)
            - Non-controllable generators (power, kW)
            - Controllable generators (power, kW)
            - Controllable batteries (power, kW)
            - SoC for batteries (soc, no units)

        We are not currently considering reactive power (Q) as part of the
        problem.

        :return: A 1D numpy array containing the current state
        """
        p_load = self.net.res_load.p_kw
        p_sgen = self.net.res_sgen.p_kw
        p_gen = self.net.res_gen.p_kw
        p_storage = self.net.res_storage.p_kw
        if with_soc:
            soc_storage = self.net.storage.soc_percent
            state = np.concatenate([p_load, p_sgen, soc_storage])
        else:
            state = np.concatenate([p_load, p_sgen])
        return state

    def update_loads(self, new_p=None, new_q=None):

        """Update the loads in the network.

        This method assumes that the orders match, i.e. the order the buses in
        self.net.load.bus matches where the loads in new_p and new_q should be
        applied based on their indexing.

        Parameters
        ----------
        new_p, new_q: array_like
            New values for the real and reactive load powers, shape (number of load buses, 1).

        Attributes
        ----------
        self.net.load: object
            The load values in the network object are updated.
        """
        if new_p is not None:
            self.net.load.p_kw = new_p
        if new_q is not None:
            self.net.load.q_kvar = new_q

    def update_static_generation(self, new_p=None, new_q=None):
        """Update the static generation in the network.

        This method assumes that the orders match, i.e. the order the buses in
        self.net.sgen.bus matches where the generation values in new_sgen_p and
        new_sgen_q should be applied based on their indexing.

        Parameters
        ----------
        new_sgen_p, new_sgen_q: array_like
            New values for the real and reactive static generation, shape
            (number of static generators, 1).

        Attributes
        ----------
        self.net.sgen: object
            The static generation values in the network object are updated.
        """
        if new_p is not None:
            self.net.sgen.p_kw = new_p
        if new_q is not None:
            self.net.sgen.q_kvar = new_q

    def update_generation(self, new_p=None, new_q=None):
        """Update the traditional (not static) generation in the network.

        This method assumes that the orders match, i.e. the order the buses in
        self.net.gen.bus matches where the generation values in new_gen_p
        should be applied based on their indexing.

        Parameters
        ----------
        new_gen_p: array_like
            New values for the real and reactive generation, shape (number of
            traditional generators, 1).

        Attributes
        ----------
        self.net.gen: object
            The traditional generation values in the network object are updated.
        """
        if new_p is not None:
            self.net.gen.p_kw = new_p
        if new_q is not None:
            self.net.gen.q_kvar = new_q

    def update_batteries(self, new_p):
        """Update the batteries / storage units in the network.

        This method assumes that the orders match, i.e. the order the buses in
        self.net.gen.bus matches where the generation values in new_gen_p
        should be applied based on their indexing.

        Parameters
        ----------
        battery_powers: array_like
            The power flow into / out of each battery, shape (number of traditional generators, 1).

        Attributes
        ----------
        self.net.storage: object
            The storage values in the network object are updated.
        """
        soc = self.net.storage.soc_percent
        cap = self.net.storage.max_e_kwh
        eff = self.net.storage.eff
        pmin = self.net.storage.min_p_kw
        pmin_soc = -1 * soc * cap * eff / self.tstep
        pmin = np.max([pmin, pmin_soc], axis=0)
        pmax = self.net.storage.max_p_kw
        pmax_soc = (1. - soc) * cap / (eff * self.tstep)
        pmax = np.min([pmax, pmax_soc], axis=0)
        ps = np.clip(new_p, pmin, pmax)
        self.net.storage.p_kw = ps
        soc_next = soc + ps * self.tstep * eff / cap
        msk = ps < 0
        soc_next[msk] = (soc + ps * self.tstep / (eff * cap))[msk]
        self.net.storage.soc_percent = soc_next

    def run_powerflow(self):
        """Evaluate the power flow. Results are stored in the results matrices
        of the net object, e.g. self.net.res_bus.

        Attributes
        ----------
        self.net: object
            The network matrices are updated to reflect the results.
            Specifically: self.net.res_bus, self.net.res_line, self.net.res_gen,
            self.net.res_sgen, self.net.res_trafo, self.net.res_storage.
        """
        try:
            pp.runpp(self.net, enforce_q_lims=True,
                     calculate_voltage_angles=False,
                     voltage_depend_loads=False)
        except:
            print('There was an error running the powerflow! pp.runpp() didnt work')

    def calculate_reward(self, eps=0.001, type=4):
        """Calculate the reward associated with a power flow result.

        We count zero flow through the line as when the power flowing into the
        line is equal to the power lost in it. This gives a positive reward.

        A cost (negative reward) is incurred for running the batteries, based
        on the capital cost of the battery and the expected lifetime (currently
        hardcoded to 1000 cycles). So, if the capital cost of the battery is set
        to zero, then producing or consuming power with the battery is free to
        use.

        Parameters
        ----------
        eps: float
            Tolerance

        Attributes
        ----------
        reward_val: The value of the reward function is returned.
        """
        c1 = np.abs(self.net.res_line.p_to_kw - self.net.res_line.pl_kw) < eps
        c2 = np.abs(self.net.res_line.p_from_kw - self.net.res_line.pl_kw) < eps
        zeroed_lines = np.logical_or(c1.values, c2.values)
        # Type 1 Reward: count of lines with zero-net-flow
        if type == 1:
            self.reward_val = np.sum(zeroed_lines, dtype=np.float)
        # Type 2 Reward: count of nodes not pulling power from grid
        elif type in [2, 3, 4]:
            graph_new = deepcopy(self.graph)
            for line_idx, zeroed in enumerate(zeroed_lines):
                if zeroed:
                    v = self.net.line.from_bus[line_idx]
                    w = self.net.line.to_bus[line_idx]
                    graph_new.removeEdge(v, w)
            self.reward_val = 0
            ext_connections = self.net.ext_grid.bus.values
            num_vmgs = 0
            for subgraph in graph_new.connectedComponents():
                if not np.any([item in subgraph for item in ext_connections]):
                    self.reward_val += len(subgraph)
                    num_vmgs += 1
            self.reward_val *= num_vmgs
        elif type == 5:
            pass

        # Add distance function:
        if type == 3:
            line_flow_values = np.maximum(np.abs(self.net.res_line.p_to_kw),
                                          np.abs(self.net.res_line.p_from_kw)) - self.net.res_line.pl_kw
            self.reward_val -= self.config.cont_reward_lambda * np.linalg.norm(line_flow_values, 1)
        elif type == 4:
            line_flow_values = np.maximum(np.abs(self.net.res_line.p_to_kw),
                                          np.abs(self.net.res_line.p_from_kw)) - self.net.res_line.pl_kw
            self.reward_val -= self.config.cont_reward_lambda * np.sum(np.minimum(np.abs(line_flow_values),
                                                                                  3.0*np.ones(np.shape(line_flow_values)[0])))
        # Costs for running batteries
        cap_costs = self.net.storage.cap_cost
        max_e = self.net.storage.max_e_kwh
        min_e = self.net.storage.min_e_kwh
        betas = cap_costs / (2 * 1000 * (max_e - min_e))
        incurred_costs = betas * np.abs(self.net.storage.p_kw)
        for c in incurred_costs:
            self.reward_val -= c
        return self.reward_val

if __name__ == "__main__":
    env1 = NetModel(env_name='rural_1')  # 'Six_Bus_POC')
    # env1.config.reward_epsilon = 0.1
    # env1.reset()
    env1.step([-20.17500389, -20.46192559, -19.49983787,  19.80725726, 20.07191253, 20.18946847])
    # env1.step([-0.02, -0.02])