-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathgreybox_generalize.py
256 lines (218 loc) · 9.81 KB
/
greybox_generalize.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
import numpy as np
import pyomo.environ as pyo
from scipy.sparse import coo_matrix
from pyomo.contrib.pynumero.interfaces.external_grey_box import ExternalGreyBoxModel
from pyomo.contrib.pynumero.interfaces.external_grey_box import ExternalGreyBoxBlock
class LogDetModel(ExternalGreyBoxModel):
def __init__(
self,
n_parameters=2,
initial_fim=None,
use_exact_derivatives=True,
print_level=0,
):
"""
Greybox model to compute the log determinant of a sqaure symmetric matrix.
Arguments
---------
n_parameters: int
Number of parameters in the model. The square symmetric matrix is of shape n_parameters*n_parameters
initial_fim: dict
key: tuple (i,j) where i, j are the row, column number of FIM. value: FIM[i,j]
Initial value of the matrix. If None, the identity matrix is used.
use_exact_derivatives: bool
If True, the exact derivatives are used.
If False, the finite difference approximation can be used, but not recommended/tested.
print_level: integer
0 (default): no extra output
1: minimal info to indicate if initialized well
print the following:
- initial FIM received by the grey-box moduel
2: intermediate info for debugging
print all the level 1 print statements, plus:
- the FIM output of the current iteration, both the output as the FIM matrix, and the flattened vector
3: all details for debugging
print all the level 2 print statements, plus:
- the log determinant of the FIM output of the current iteration
- the eigen values of the FIM output of the current iteration
Return
------
None
"""
self._use_exact_derivatives = use_exact_derivatives
self.print_level = print_level
self.n_parameters = n_parameters
# make sure it's integer since this is a number of inputs that shouldn't be fractional
self.num_input = int(
n_parameters + (n_parameters * n_parameters - n_parameters) / 2
)
self.initial_fim = initial_fim
# variable to store the output value
# Output constraint multiplier values. This is a 1-element vector because there is one output
self._output_con_mult_values = np.zeros(1)
if not use_exact_derivatives:
raise NotImplementedError("use_exact_derivatives == False not supported")
def input_names(self):
"""Return the names of the inputs.
Define only the upper triangle of FIM because FIM is symmetric
Return
------
input_name_list: a list of the names of inputs
"""
# store the input names as a tuple
input_name_list = []
# loop over parameters
for i in range(self.n_parameters):
# loop over upper triangle
for j in range(i, self.n_parameters):
input_name_list.append((i, j))
return input_name_list
def equality_constraint_names(self):
"""Return the names of the equality constraints."""
# no equality constraints
return []
def output_names(self):
"""Return the names of the outputs."""
return ["log_det"]
def set_output_constraint_multipliers(self, output_con_multiplier_values):
"""
Set the values of the output constraint multipliers.
Arguments
---------
output_con_multiplier_values: a scalar number for the output constraint multipliers
"""
# because we only have one output constraint, the length is 1
if len(output_con_multiplier_values) != 1:
raise ValueError("Output should be a scalar value. ")
np.copyto(self._output_con_mult_values, output_con_multiplier_values)
def finalize_block_construction(self, pyomo_block):
"""
Finalize the construction of the ExternalGreyBoxBlock.
This function initializes the inputs with an initial value
Arguments
---------
pyomo_block: pass the created pyomo block here
"""
# ele_to_order map the input position in FIM, like (a,b), to its flattend index
# for e.g., ele_to_order[(0,0)] = 0
ele_to_order = {}
count = 0
if self.print_level >= 1:
if self.initial_fim is not None:
print("Grey-box initialize inputs with: ", self.initial_fim)
else:
print("Grey-box initialize inputs with an identity matrix.")
# only generating upper triangular part
# loop over parameters
for i in range(self.n_parameters):
# loop over parameters from current parameter to end
for j in range(i, self.n_parameters):
# flatten (i,j)
ele_to_order[(i, j)] = count
# this tuple is the position of this input in the FIM
tuple_name = (i, j)
# if an initial FIM is given, we can initialize with these values
if self.initial_fim is not None:
pyomo_block.inputs[tuple_name].value = self.initial_fim[tuple_name]
# if not given initial FIM, we initialize with an identity matrix
else:
# identity matrix
if i == j:
pyomo_block.inputs[tuple_name].value = 1
else:
pyomo_block.inputs[tuple_name].value = 0
count += 1
self.ele_to_order = ele_to_order
def set_input_values(self, input_values):
"""
Set the values of the inputs.
This function refers to the notebook:
https://colab.research.google.com/drive/1VplaeOTes87oSznboZXoz-q5W6gKJ9zZ?usp=sharing
Arguments
---------
input_values: input initial values
"""
# see the colab link in the doc string for why this should be a list
self._input_values = list(input_values)
def evaluate_equality_constraints(self):
"""Evaluate the equality constraints.
Return None because there are no equality constraints.
"""
return None
def evaluate_outputs(self):
"""
Evaluate the output of the model.
We call numpy here to compute the logdet of FIM. slogdet is used to avoid ill-conditioning issue
This function refers to the notebook:
https://colab.research.google.com/drive/1VplaeOTes87oSznboZXoz-q5W6gKJ9zZ?usp=sharing
Return
------
logdet: a one-element numpy array, containing the log det value as float
"""
# form matrix as a list of lists
M = self._extract_and_assemble_fim()
# compute log determinant
(sign, logdet) = np.linalg.slogdet(M)
if self.print_level >= 2:
print("iteration")
print("\n Consider M =\n", M)
print("Solution: ", self._input_values)
if self.print_level == 3:
print(" logdet = ", logdet, "\n")
print("Eigvals:", np.linalg.eigvals(M))
# see the colab link in the doc string for why this should be a array with dtype as float64
return np.asarray([logdet], dtype=np.float64)
def evaluate_jacobian_equality_constraints(self):
"""Evaluate the Jacobian of the equality constraints."""
return None
def _extract_and_assemble_fim(self):
"""
This function make the flattened inputs back into the shape of an FIM
Return
------
M: a numpy array containing FIM.
"""
# FIM shape Np*Np
M = np.zeros((self.n_parameters, self.n_parameters))
# loop over parameters.
# Expand here to be the full matrix.
for i in range(self.n_parameters):
for k in range(self.n_parameters):
# get symmetry part.
# only have upper triangle, so the smaller index is the row number
row_number, col_number = min(i, k), max(i, k)
M[i, k] = self._input_values[
self.ele_to_order[(row_number, col_number)]
]
return M
def evaluate_jacobian_outputs(self):
"""
Evaluate the Jacobian of the outputs.
Return
------
A sparse matrix, containing the first order gradient of the OBJ, in the shape [1,N_input]
where N_input is the No. of off-diagonal elements//2 + Np
"""
if self._use_exact_derivatives:
M = self._extract_and_assemble_fim()
# compute pseudo inverse to be more numerically stable
Minv = np.linalg.pinv(M)
# compute gradient of log determinant
row = np.zeros(self.num_input) # to store row index
col = np.zeros(self.num_input) # to store column index
data = np.zeros(self.num_input) # to store data
# construct gradients as a sparse matrix
# loop over the upper triangular
# loop over parameters
for i in range(self.n_parameters):
# loop over parameters from current parameter to end
for j in range(i, self.n_parameters):
order = self.ele_to_order[(i, j)]
# diagonal elements. See Eq. 16 in paper for explanation
if i == j:
row[order], col[order], data[order] = (0, order, Minv[i, j])
# off-diagonal elements
else: # factor = 2 since it is a symmetric matrix. See Eq. 16 in paper for explanation
row[order], col[order], data[order] = (0, order, 2 * Minv[i, j])
# sparse matrix
return coo_matrix((data, (row, col)), shape=(1, self.num_input))