-
Notifications
You must be signed in to change notification settings - Fork 4
Expand file tree
/
Copy pathnewton.sage
More file actions
279 lines (219 loc) · 10.2 KB
/
newton.sage
File metadata and controls
279 lines (219 loc) · 10.2 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
from sage.symbolic.ring import SR
# n = newton_fixpoint_solve(F, [x,y,z], 10)
# n.subs( a=0.5, b=0.3 )
# TODO (plan, long run):
# substitute either functions (p_(i,j)(n) = transition probabilities) or constants for some parameters
# and substitute the function f(x) = 1/(1-x) for s() to evaluate :) --> we get a rational expression in the free parameters
# Ultimately: Use it to approximate e.g. the expected value of the "runtime" (or some other "cost") as well as its variance (in terms of the input size n)
# Also:
# - Derive the equations from Flowgraphs, Remopla/PDS (which are derived from e.g. Java Bytecode)
# - More semirings (other analyses), integrate semirings, polynomials over them, and Newton's method nicely into Sage
# symbolic functions for the Kleene star of elements
from sage.symbolic.function_factory import function
# s(x) stands for the Kleene star x^*.  The eval_func simplifies s(0) -> 1
# (the semiring unit) and leaves every other s(x) unevaluated (hold=True).
s = function('s', nargs=1, eval_func=lambda self, x: 1 if x == 0 else s(x,hold=True))
# for the "real" semiring one would later substitute the geometric series:
#s = 1/(1-x)
from sage.matrix.constructor import block_matrix
def compute_mat_star(M) :
if M.nrows() == 1 and M.ncols() == 1: # just a scalar in a matrix
return s(M[0,0]) # apply the Kleene star to the only element and return
else: # there is a matrix to deconstruct
M = copy(M)
if M.nrows() % 2 == 0 and M.ncols() % 2: # even number of rows/columns, split in half
M.subdivide(M.nrows()/2,M.ncols()/2)
else: # odd number of rows/columns, peeling mode
M.subdivide(M.nrows()-1,M.ncols()-1)
a_11 = M.subdivision(0,0)
a_12 = M.subdivision(0,1)
a_21 = M.subdivision(1,0)
a_22 = M.subdivision(1,1)
as_11 = compute_mat_star(a_11)
as_22 = compute_mat_star(a_22)
# matrix divided and precalculated, now do the rest
A_11 = compute_mat_star(a_11 + a_12 * as_22 * a_21)
A_22 = compute_mat_star(a_22 + a_21 * as_11 * a_12)
A_12 = as_11 * a_12 * A_22
A_21 = as_22 * a_21 * A_11
return block_matrix([A_11,A_12,A_21,A_22], subdivide=False)
# adapted from sage/symbolic/expression.pyx so that the differentiation
# variables can be chosen explicitly; should eventually be fixed in the lib
def nhessian(self, poly_vars=None):
    """Hessian matrix of the symbolic expression `self` with respect to
    `poly_vars`; defaults to all arguments of the expression."""
    from sage.matrix.constructor import matrix
    if poly_vars is None:
        poly_vars = self.arguments()
    rows = []
    for g in self.gradient(poly_vars):
        rows.append([g.derivative(x) for x in poly_vars])
    return matrix(rows)
# compute the symbolic delta term with a parameter vector u
# NOTE: this is valid for quadratic polynomials only!!
def compute_symbolic_delta(u,F,v) :
    """For each equation f_i of the quadratic system F, compute the
    second-order Taylor term delta_i = 1/2 * u^T * H_i * u, where H_i is
    the Hessian of f_i w.r.t. the variables v.  Returns a column vector
    over SR."""
    entries = []
    for eqn in F: # one Hessian (and one quadratic form) per equation
        hess = nhessian(eqn[0], v)
        entries.append((1/2*u.transpose()*hess*u)[0,0]) #TODO: make this nice :)
    return vector(SR,entries).transpose()
# compute the degree of f when viewed as a polynomial in the variables
# poly_vars only (other "symbolic variables" are treated as constants)
def compute_degree(f,poly_vars) :
    """Total degree of f in poly_vars, found by summing the per-variable
    degrees while repeatedly differentiating the top power away; stops
    early as soon as f has vanished or the upper bound is reached."""
    remaining = list(poly_vars)
    maxdeg = sum([f.degree(t) for t in remaining])
    deg = 0
    while remaining and deg < maxdeg:
        x = remaining.pop()
        degx = f.degree(x)
        deg += degx
        f = f.diff([x]*degx)   # kill the highest power of x
        if f == 0 :
            break
    return deg
import itertools as it
# symbolic delta computation, also for non-quadratic polynomials F
# parameter vectors are v and v_upd (which may also be concrete values if wanted :))
# v should be the (d-1)-st newton iterand and v_upd should be the (d)-th newton update
def compute_symbolic_delta_general(v, v_upd, F, poly_vars) :
    """Multivariate-Taylor "delta" term of Newton's method for equations
    of arbitrary degree: for each f_i, sum over all mixed partials of
    total order between 2 and deg(f_i), evaluated at v, multiplied by
    the matching monomial in v_upd and divided by the product of the
    factorials of the multi-index.  Returns a column vector over SR."""
    n = len(v)
    assert(len(poly_vars) == n)
    delta = vector(SR,n)
    point = dict(zip(poly_vars, v))   # evaluation point for the derivatives
    for i in range(n) :
        f = F[i][0]
        deg = compute_degree(f, poly_vars)
        # every multi-index idx with 2 <= |idx| <= deg contributes one term
        for idx in it.product(range(deg+1), repeat=n) :
            order = sum(idx)
            if order < 2 or order > deg :
                continue
            dx = []   # differentiation list: poly_vars[j] repeated idx[j] times
            prd = 1   # monomial prod_j v_upd[j]^idx[j]
            for x_j, u_j, k in zip(poly_vars, v_upd, idx) :
                dx += [x_j]*k
                prd = prd * u_j**k
            coeff = prod([factorial(k) for k in idx])
            delta[i] = delta[i] + diff(f,dx).subs(point) * prd / coeff
    return delta.column()
# given a vector of polynomials F in variables poly_vars, its starred
# Jacobian J_s, a starting value v, and the "delta" term, compute the update
# v_update = J^*|v * delta   (so that v_new = v + v_update)
def newton_step(F, poly_vars, J_s, v, delta) :
    """One symbolic Newton step: evaluate J_s at the point v and apply it
    to delta.  F is unused here; it is kept for signature uniformity."""
    assert(len(poly_vars) == v.nrows())
    point = dict(zip(poly_vars, v.list()))
    return J_s.subs(point) * delta
# iterate until convergence, but for at most max_iter iterations
# 1) compute the concrete delta (from the precomputed symbolic expression)
# 2) execute a newton_step
from sage.calculus.functions import jacobian
def newton_fixpoint_solve(F, poly_vars, max_iter=10) :
    """Solve the fixpoint system v = F(v) by SYMBOLIC Newton iteration.

    F         -- column matrix of polynomials, one row per variable
    poly_vars -- the variables of F, in the same order as its rows
    max_iter  -- fixed number of Newton iterations to perform

    Strategy: the starred Jacobian and the generic delta term are built
    once, in fresh parameter variables u<i>/u_upd<i>; each iteration then
    merely substitutes into them.  Iterands and updates are represented
    by fresh symbolic variables vs<i>_<j> / vus<i>_<j> and resolved by a
    bottom-up back-substitution at the end.  Returns the max_iter-th
    iterand as a symbolic column vector.
    """
    J = jacobian(F, poly_vars)
    J_s = compute_mat_star(J) #only compute matrix star once
    # print J_s
    # fresh parameters: u<i> = previous iterand, u_upd<i> = previous update.
    # NOTE(review): join() here is presumably Sage's space-joining helper, so
    # var() receives one space-separated string of names -- confirm on the
    # Sage version in use.
    u = var(join(['u%d' %i for i in range(J.ncols())]))
    u_upd = var(join(['u_upd%d' %i for i in range(J.ncols())]))
    if(J.ncols() == 1) :
        # var() returns a single symbol (not a tuple) for a single name
        u = (u,)
        u_upd = (u_upd,)
    # delta = compute_symbolic_delta(vector(u).column(),F,poly_vars)
    delta = compute_symbolic_delta_general(u, u_upd, F, poly_vars)
    print delta
    v = matrix(SR,F.nrows(),1) # v^0 = 0
    # first iteration by hand: the delta term at 0 is just F(0)
    delta_new = F.subs( dict( (v,0) for v in poly_vars ))
    v_upd = newton_step(F,poly_vars,J_s,v,delta_new)
    # v = v + v_upd
    # define symbolic variables for v^[i] and v^(i)
    tmp_var = var(join(['vs%d_%d' %(1,j) for j in range(v.nrows())]))
    if (v.nrows() == 1) :
        tmp_var = (tmp_var,)
    v_s = matrix(tmp_var).transpose()   # vs1_j stands for the 1st iterand
    tmp_var = var(join(['vus%d_%d' %(1,j) for j in range(v_upd.nrows())]))
    if (v_upd.nrows() == 1) :
        tmp_var = (tmp_var,)
    vu_s = matrix(tmp_var).transpose()  # vus1_j stands for the 1st update
    # save the current values: mappings  symbol -> concrete expression
    v_list = zip(v_s.list(), v.list())
    vu_list = zip(vu_s.list(), v_upd.list())
    # newton-iteration..
    for i in range(2,max_iter+1) :
        # delta_new = delta.subs( dict( zip(u,v_upd.list()) ) )
        # instantiate the generic delta with the symbolic (i-1)-st iterand/update
        delta_new = delta.subs(dict( zip(u_upd,vu_s.list()) + zip(u, v_s.list())) )
        v = v_s + vu_s   # v^(i) = v^(i-1) + update^(i-1), still in symbols
        tmp_var = var(join(['vs%d_%d' %(i,j) for j in range(v.nrows())]))
        if (v.nrows() == 1) :
            tmp_var = (tmp_var,)
        v_s = matrix(tmp_var).transpose()
        v_list += zip(v_s.list(), v.list())     # remember vs<i>_j -> value
        v_upd = newton_step(F,poly_vars,J_s,v_s,delta_new)
        tmp_var = var(join(['vus%d_%d' %(i,j) for j in range(v_upd.nrows())]))
        if (v_upd.nrows() == 1) :
            tmp_var = (tmp_var,)
        vu_s = matrix(tmp_var).transpose()
        vu_list += zip(vu_s.list(), v_upd.list())   # remember vus<i>_j -> value
    v_dict = dict(v_list)
    vu_dict = dict(vu_list)
    # try intelligent backsubstitution
    # but this is an ugly implementation
    # this evaluates the symbolic variables bottom up
    for i in range(1,max_iter):
        v_var = var(join(['vs%d_%d' %(i,j) for j in range(v.nrows())]))
        vu_var = var(join(['vus%d_%d' %(i,j) for j in range(v.nrows())]))
        if(v.nrows() == 1) :
            v_var = (v_var,)
            vu_var = (vu_var,)
        for j in range(F.nrows()):
            v_new_var = var('vs%d_%d' %(i+1,j))
            vu_new_var = var('vus%d_%d' %(i+1,j))
            # substitute all occurrences
            for variable in v_var:
                # replace each dictionary value with a new one where the symbolic
                # variables of iteration i are substituted by their expressions
                v_dict[v_new_var] = v_dict[v_new_var].subs(dict([(variable,v_dict[variable])]))
                vu_dict[vu_new_var] = vu_dict[vu_new_var].subs(dict([(variable,v_dict[variable])]))
            for variable in vu_var:
                v_dict[v_new_var] = v_dict[v_new_var].subs(dict([(variable,vu_dict[variable])]))
                vu_dict[vu_new_var] = vu_dict[vu_new_var].subs(dict([(variable,vu_dict[variable])]))
        # the i-th iteration is almost done except the occurence of vs_n in vus_n
        for j in range(F.nrows()):
            v_var = var(join(['vs%d_%d' %(i+1,l) for l in range(v.nrows())]))
            if(v.nrows() == 1) :
                v_var = (v_var,)
            vu_new_var = var('vus%d_%d' %(i+1,j))
            for variable in v_var:
                vu_dict[vu_new_var] = vu_dict[vu_new_var].subs(dict([(variable,v_dict[variable])]))
    # last step: form the final iterand and resolve all remaining symbols
    v = v + v_upd
    v = v.subs(v_dict)
    v = v.subs(vu_dict)
    return v
# Newton's method as a textbook-implementation
# find a zero of the multivariate polynomial (vector) F starting with v_0
# TODO: nicefy... or rather throw away and write new :)
from numpy import linalg
import numpy
from sage.symbolic.ring import NumpyToSRMorphism
# x = newton_numerical(F_diff, [x,y,z])
# vgl. mit x_sym = newton_fixpoint_solve(F_c, [x,y,z])
def newton_numerical(F, poly_vars, max_iter=10) :
    """Plain textbook (numerical) Newton iteration: approximate a zero of
    the multivariate polynomial vector F, starting at the origin.

    F          -- column matrix/vector of symbolic polynomials
    poly_vars  -- the variables of F, in order
    max_iter   -- fixed number of iterations (no convergence test)

    Returns the final iterate as a symbolic column vector.
    NOTE(review): mixes Sage symbolics with numpy.linalg.solve, so the
    linear solve runs in double precision -- see the TODO below.
    """
    # morphism lifting numpy floats back into the symbolic ring SR
    np_to_SR = NumpyToSRMorphism(numpy.float64, SR)
    J = jacobian(F,poly_vars)
    v_0 = numpy.array([0]*len(poly_vars))  # start at the origin
    v = vector(map(np_to_SR,v_0)).column()
    for i in range(1,max_iter+1) :
        # re-lift the current iterate into SR so .subs() below works
        v = vector(map(np_to_SR,v)).column()
        sub = dict(zip(poly_vars,v.list()))
        A = J.subs(sub)   # Jacobian evaluated at the current point
        b = F.subs(sub)   # residual F(v)
        x = linalg.solve(A,b) #TODO: solve system in software rather than with numpy (finite precision!)??
        v = v - x         # Newton update: v <- v - J(v)^{-1} F(v)
    return v
def gen_random_quadratic_eqns(n, eps) :
    """Generate and print (one per line, to stdout) n random quadratic
    equations over x0..x{n-1} in a grammar-like syntax:

        <xi> ::= c1 <xa><xb> | c2 <xc><xd> | ... | c0;

    For each equation, k-1 distinct degree-2 monomials are chosen at
    random, where k = int(eps * n*(n-1)/2) but at least 2, and the k
    coefficients (the last one being the constant term) are drawn from a
    symmetric Dirichlet distribution, so they are positive and sum to 1
    -- each right-hand side is a probability distribution.  Returns None.
    """
    # stdlib module needed for sample(); the file never imports it at
    # module level (Sage's global `random` is a function, not the module)
    import random
    poly_vars = ['x%d' %i for i in range(n)]
    # n variables ==> n choose 2 monomials, select eps*(n choose 2) of
    # those which will be non-zero.
    # BUGFIX: the module imports "itertools as it", so the former bare
    # "itertools.combinations(...)" raised a NameError.
    monomials = list(it.combinations(poly_vars, 2))
    k = int(eps*(n*n/2 - n/2))
    if k < 2 :
        k = 2   # need at least one monomial plus the constant term
    # choose random coefficients from (0,1) that add up to 1 by sampling
    # from the k-dimensional symmetric Dirichlet distribution
    for i in range(n) :
        non_zero = random.sample(monomials, k-1)
        coeff = list(numpy.random.dirichlet([1]*k))
        const_coeff = coeff.pop()   # last coefficient becomes the constant term
        mon_coeffs = [str(c) + " " + "<"+m[0]+">"+"<"+m[1]+">" for c, m in zip(coeff, non_zero)]
        f = " | ".join(mon_coeffs)
        f = f + " | " + str(const_coeff)
        print("<" + poly_vars[i] + ">" + " ::= " + f + ";")