def test_geodesics(): from scipy.linalg import expm alpha = np.random.randint(1, 10, (2)) * .1 beta = alpha[1] * .1 m, d = (5, 3) man = ComplexPositiveSemidefinite(m, d, alpha=alpha, beta=beta) X = man.rand() alf = alpha[1] / alpha[0] def calc_gamma(man, X, xi, eta): g_inv_Jst_solve_J_g_in_Jst_DJ = man.g_inv( X, man.Jst(X, man.solve_J_g_inv_Jst(X, man.D_J(X, xi, eta)))) proj_christoffel = man.proj_g_inv(X, man.christoffel_form(X, xi, eta)) return g_inv_Jst_solve_J_g_in_Jst_DJ + proj_christoffel eta = man.randvec(X) g1 = calc_gamma(man, X, eta, eta) g2 = man.christoffel_gamma(X, eta, eta) print(man._vec(g1 - g2)) egrad = man._rand_ambient() print(man.base_inner_ambient(g1, egrad)) print(man.rhess02_alt(X, eta, eta, egrad, 0)) print(man.rhess02(X, eta, eta, egrad, man.zerovec(X))) # second solution: A = X.Y.T.conj() @ eta.tY t = 2 K = eta.tY - X.Y @ (X.Y.T.conj() @ eta.tY) Yp, R = np.linalg.qr(K) x_mat = np.bmat([[2 * alf * A, -R.T.conj()], [R, zeros((d, d))]]) Yt = np.bmat([X.Y, Yp]) @ expm(t*x_mat)[:, :d] @ \ expm(t*(1-2*alf)*A) x_d_mat = x_mat[:, :d].copy() x_d_mat[:d, :] += (1 - 2 * alf) * A Ydt = np.bmat([X.Y, Yp]) @ expm(t*x_mat) @ x_d_mat @\ expm(t*(1-2*alf)*A) x_dd_mat = x_mat @ x_d_mat + x_d_mat @ ((1 - 2 * alf) * A) Yddt = np.bmat([X.Y, Yp]) @ expm(t*x_mat) @ x_dd_mat @\ expm(t*(1-2*alf)*A) sqrtP = X.evec @ np.diag(np.sqrt(X.evl)) @ X.evec.T.conj() isqrtP = X.evec @ np.diag(1 / np.sqrt(X.evl)) @ X.evec.T.conj() Pinn = t * isqrtP @ eta.tP @ isqrtP ePinn = expm(Pinn) Pt = sqrtP @ ePinn @ sqrtP Pdt = eta.tP @ isqrtP @ ePinn @ sqrtP Pddt = eta.tP @ isqrtP @ ePinn @ isqrtP @ eta.tP Xt = psd_point(np.array(Yt), np.array(Pt)) Xdt = psd_ambient(np.array(Ydt), np.array(Pdt)) Xddt = psd_ambient(np.array(Yddt), np.array(Pddt)) gcheck = Xddt + calc_gamma(man, Xt, Xdt, Xdt) print(man._vec(gcheck)) Xt1 = man.exp(X, t * eta) print((Xt1.Y - Xt.Y)) print((Xt1.P - Xt.P))
def test_rhess_02(): n, d = (50, 3) alpha = randint(1, 10, 2) * .1 beta = randint(1, 10, 2)[0] * .1 man = ComplexPositiveSemidefinite(n, d, alpha=alpha, beta=beta) S = man.rand() # simple function. Distance to a given matrix # || S - A||_F^2 A = hsym(crandn(n, n)) def f(S): diff = (A - S.Y @ S.P @ S.Y.T.conjugate()) return trace(diff @ diff.T.conjugate()) def df(S): return psd_ambient(-4 * A @ S.Y @ S.P, 2 * (S.P - S.Y.T.conjugate() @ A @ S.Y)) def ehess_form(S, xi, eta): return ( trace(-4 * A @ (xi.tY @ S.P + S.Y @ xi.tP) @ eta.tY.T.conjugate()) + 2 * trace( (xi.tP - xi.tY.T.conjugate() @ A @ S.Y - S.Y.T.conjugate() @ A @ xi.tY) @ eta.tP.T.conjugate())).real def ehess_vec(S, xi): return psd_ambient( -4 * A @ (xi.tY @ S.P + S.Y @ xi.tP), 2 * (xi.tP - xi.tY.T.conjugate() @ A @ S.Y - S.Y.T.conjugate() @ A @ xi.tY)) xxi = man.randvec(S) dlt = 1e-8 Snew = psd_point(S.Y + dlt * xxi.tY, S.P + dlt * xxi.tP) d1 = (f(Snew) - f(S)) / dlt d2 = df(S) print(d1 - man.base_inner_ambient(d2, xxi)) eeta = man.randvec(S) d1 = man.base_inner_ambient((df(Snew) - df(S)), eeta) / dlt ehess_val = ehess_form(S, xxi, eeta) dv2 = ehess_vec(S, xxi) print(man.base_inner_ambient(dv2, eeta)) print(d1, ehess_val, d1 - ehess_val) # now check the formula: ehess = xi (eta_func(f)) - <D_xi eta, df(Y)> # promote eta to a vector field. m1 = crandn(n, n) m2 = crandn(d, d) m_p = crandn(d * d, d * d) def eta_field(Sin): return man.proj( S, psd_ambient(m1 @ (Sin.Y - S.Y) @ m2, hsym((m_p @ (Sin.P - S.P).reshape(-1)).reshape( d, d)))) + eeta # xietaf: should go to ehess(xi, eta) + df(Y) @ etafield) xietaf = (man.base_inner_ambient(df(Snew), eta_field(Snew)) - man.base_inner_ambient(df(S), eta_field(S))) / dlt # appy eta_func to f: should go to tr(m1 @ xxi @ m2 @ df(Y).T) Dxietaf = man.base_inner_ambient( (eta_field(Snew) - eta_field(S)), df(S)) / dlt # this is ehess. should be same as d1 or ehess_val print(xietaf - Dxietaf) print(xietaf - Dxietaf - ehess_val) # now check: rhess. Need to make sure xi, eta in the tangent space. # first compare this with numerical differentiation xi1 = man.proj(S, xxi) eta1 = man.proj(S, eeta) egvec = df(S) ehvec = ehess_vec(S, xi1) rhessvec = man.ehess2rhess(S, egvec, ehvec, xi1) # check it numerically: def rgrad_func(Y): return man.proj_g_inv(Y, df(Y)) # val2a, _, _ = calc_covar_numeric_raw(man, W, xi1, df) val2, _, _ = calc_covar_numeric(man, S, xi1, rgrad_func) val2_p = man.proj(S, val2) # print(rhessvec) # print(val2_p) print(man._vec(rhessvec - val2_p)) rhessval = man.inner_product_amb(S, rhessvec, eta1) print(man.inner_product_amb(S, val2, eta1)) print(rhessval) # check symmetric: ehvec_e = ehess_vec(S, eta1) rhessvec_e = man.ehess2rhess(S, egvec, ehvec_e, eta1) rhessval_e = man.inner_product_amb(S, rhessvec_e, xi1) print(rhessval_e) # the above computed inner_prod(Nabla_xi Pi * df, eta) # in the following check. Extend eta1 to eta_proj # (Pi Nabla_hat Pi g_inv df, g eta) # = D_xi (Pi g_inv df, g eta) - (Pi g_inv df g Pi Nabla_hat eta) def eta_proj(S): return man.proj(S, eta_field(S)) print(check_zero(man._vec(eta1 - eta_proj(S)))) e1 = man.inner(S, man.proj_g_inv(S, df(S)), eta_proj(S)) e1a = man.base_inner_ambient(df(S), eta_proj(S)) print(e1, e1a, e1 - e1a) Snew = psd_point(S.Y + dlt * xi1.tY, S.P + dlt * xi1.tP) e2 = man.inner(Snew, man.proj_g_inv(Snew, df(Snew)), eta_proj(Snew)) e2a = man.base_inner_ambient(df(Snew), eta_proj(Snew)) print(e2, e2a, e2 - e2a) first = (e2 - e1) / dlt first1 = (man.base_inner_ambient(df(Snew), eta_proj(Snew)) - man.base_inner_ambient(df(S), eta_proj(S))) / dlt print(first - first1) val3, _, _ = calc_covar_numeric(man, S, xi1, eta_proj) second = man.inner(S, man.proj_g_inv(S, df(S)), man.proj(S, val3)) second2 = man.inner(S, man.proj_g_inv(S, df(S)), val3) print(second, second2, second - second2) print('same as rhess_val %f' % (first - second))
def test_all_projections(): alpha = randint(1, 10, 2) * .1 beta = randint(1, 10, 1)[0] * .02 n = 5 d = 3 man = ComplexPositiveSemidefinite(n, d, alpha=alpha, beta=beta) print(man) S = man.rand() test_inner(man, S) test_J(man, S) # now check metric, Jst etc # check Jst: vectorize the operator J then compare Jst with jmat.T jmat = make_j_mat(man, S) test_Jst(man, S, jmat) ginv_mat = make_g_inv_mat(man, S) ee = man._rand_ambient() g1 = man._unvec(ginv_mat @ man._vec(ee)) print(check_zero(man.g_inv(S, ee).tP - g1.tP)) print(check_zero(man.g_inv(S, ee).tY - g1.tY)) # test g_inv_Jst for ii in range(10): a = man._rand_range_J() avec = man._vec_range_J(a) jtout = ginv_mat @ jmat.T @ avec jtout2 = man._vec(man.g_inv_Jst(S, a)) diff = check_zero(jtout - jtout2) print(diff) # test projection test_projection(man, S) # now diff projection for i in range(1): e = man._rand_ambient() S1 = man.rand() xi = man.randvec(S1) dlt = 1e-7 S2 = psd_point(S1.Y + dlt * xi.tY, S1.P + dlt * xi.tP) # S = psd_point(S1.Y, S1.P) d1P = (man.proj(S2, e).tP - man.proj(S1, e).tP) / dlt d1Y = (man.proj(S2, e).tY - man.proj(S1, e).tY) / dlt d2 = man.D_proj(S1, xi, e) print(check_zero(d1P - d2.tP) + check_zero(d1Y - d2.tY)) for i in range(10): a = man._rand_range_J() eta = man._rand_ambient() print(man.base_inner_ambient(eta, man.Jst(S, a))) print((trace((eta.tP.T.conjugate() - eta.tP) @ a['P'] + (man.alpha[1] * eta.tY.T.conjugate() @ S.Y + man.beta * (S.Pinv @ eta.tP.T.conjugate() - eta.tP.T.conjugate() @ S.Pinv)) @ a['YP'])).real) print((trace(2 * eta.tP.T.conjugate() @ a['P']) + trace( (man.alpha[1] * eta.tY.T.conjugate() @ S.Y + man.beta * (S.Pinv @ eta.tP.T.conjugate() - eta.tP.T.conjugate() @ S.Pinv)) @ a['YP'])).real) print((trace( eta.tP.T.conjugate() @ (2 * a['P'] + man.beta * (a['YP'] @ S.Pinv - S.Pinv @ a['YP']))) + trace(eta.tY.T.conjugate() @ (man.alpha[1] * S.Y @ a['YP'])) ).real) print(man.base_inner_E_J(man.J(S, eta), a)) print(( trace((eta.tP - eta.tP.T.conjugate()).T.conjugate() @ a['P'] + (man.alpha[1] * S.Y.T.conjugate() @ eta.tY + man.beta * (eta.tP @ S.Pinv - S.Pinv @ eta.tP)).T.conjugate() @ a['YP'] )).real) for i in range(10): a = man._rand_range_J() beta = man.beta alf = man.alpha anew1 = man.J(S, man.g_inv_Jst(S, a)) anew = {} saYP = a['YP'] + a['YP'].T.conjugate() anew['P'] = 4 / beta * S.P @ a['P'] @ S.P + S.P @ saYP - saYP @ S.P anew['YP'] = alf[1] * a['YP'] + beta * ( ((2 / man.beta) * S.P @ a['P'] @ S.P + S.P @ a['YP'] - a['YP'] @ S.P) @ S.Pinv - S.Pinv @ ( (2 / man.beta) * S.P @ a['P'] @ S.P + S.P @ a['YP'] - a['YP'] @ S.P)) anew['YP'] = alf[1] * a['YP'] + ( (2 * S.P @ a['P'] + beta * S.P @ a['YP'] @ S.Pinv - beta * a['YP']) - (2 * a['P'] @ S.P + beta * a['YP'] - beta * S.Pinv @ a['YP'] @ S.P)) anew['YP'] = (alf[1] - 2 * beta) * a['YP'] + ( (2 * S.P @ a['P'] + beta * S.P @ a['YP'] @ S.Pinv) - (2 * a['P'] @ S.P - beta * S.Pinv @ a['YP'] @ S.P)) anew['YP'] = (alf[1] - 2 * beta) * a['YP'] + ( (2 * S.P @ a['P'] - 2 * a['P'] @ S.P + beta * S.P @ a['YP'] @ S.Pinv + beta * S.Pinv @ a['YP'] @ S.P)) print(check_zero(man._vec_range_J(anew1) - man._vec_range_J(anew))) for i in range(10): a = man._rand_range_J() b1 = man.J(S, man.g_inv_Jst(S, a)) b2 = man.J_g_inv_Jst(S, a) print(check_zero(man._vec_range_J(b1) - man._vec_range_J(b2))) a1 = man.solve_J_g_inv_Jst(S, b1) print(check_zero(man._vec_range_J(a) - man._vec_range_J(a1))) for ii in range(10): E = man._rand_ambient() a2 = man.J_g_inv(S, E) a1 = man.J(S, man.g_inv(S, E)) print(check_zero(man._vec_range_J(a1) - man._vec_range_J(a2))) for i in range(20): Uran = man._rand_ambient() Upr = man.proj(S, man.g_inv(S, Uran)) Upr2 = man.proj_g_inv(S, Uran) print(check_zero(man._vec(Upr) - man._vec(Upr2))) for ii in range(10): a = man._rand_range_J() xi = man.randvec(S) jtout2 = man.Jst(S, a) dlt = 1e-7 Snew = psd_point(S.Y + dlt * xi.tY, S.P + dlt * xi.tP) jtout2a = man.Jst(Snew, a) d1 = (jtout2a - jtout2).scalar_mul(1 / dlt) d2 = man.D_Jst(S, xi, a) print(check_zero(man._vec(d2) - man._vec(d1))) for ii in range(10): S1 = man.rand() eta = man._rand_ambient() xi = man.randvec(S1) a1 = man.J(S1, eta) dlt = 1e-8 Snew = psd_point(S1.Y + dlt * xi.tY, S1.P + dlt * xi.tP) a2 = man.J(Snew, eta) d1 = { 'P': (a2['P'] - a1['P']) / dlt, 'YP': (a2['YP'] - a1['YP']) / dlt } d2 = man.D_J(S1, xi, eta) print(check_zero(man._vec_range_J(d2) - man._vec_range_J(d1))) # derives metrics for ii in range(10): S1 = man.rand() xi = man.randvec(S1) omg1 = man._rand_ambient() omg2 = man._rand_ambient() dlt = 1e-7 S2 = psd_point(S1.Y + dlt * xi.tY, S1.P + dlt * xi.tP) p1 = man.inner(S1, omg1, omg2) p2 = man.inner(S2, omg1, omg2) der1 = (p2 - p1) / dlt der2 = man.base_inner_ambient(man.D_g(S1, xi, omg2), omg1) print(der1 - der2) if np.abs(der1 - der2) > 1e-4: print(der1, der2) break # cross term for christofel for i in range(10): S1 = man.rand() xi = man.randvec(S1) eta1 = man.randvec(S1) eta2 = man.randvec(S1) dr1 = man.D_g(S1, xi, eta1) x12 = man.contract_D_g(S1, eta1, eta2) p1 = man.base_inner_ambient(dr1, eta2) p2 = man.base_inner_ambient(x12, xi) print(p1, p2, p1 - p2) # now test christofel: # two things: symmetric on vector fields # and christofel relation # in the case metric for i in range(10): S1 = man.rand() xi = man.randvec(S1) eta1 = man.randvec(S1) eta2 = man.randvec(S1) p1 = man.proj_g_inv(S1, man.christoffel_form(S1, xi, eta1)) p2 = man.proj_g_inv(S1, man.christoffel_form(S1, eta1, xi)) print(check_zero(man._vec(p1) - man._vec(p2))) v1 = man.base_inner_ambient(man.christoffel_form(S1, eta1, eta2), xi) v2 = man.base_inner_ambient(man.D_g(S1, eta1, eta2), xi) v3 = man.base_inner_ambient(man.D_g(S1, eta2, eta1), xi) v4 = man.base_inner_ambient(man.D_g(S1, xi, eta1), eta2) print(v1, 0.5 * (v2 + v3 - v4), v1 - 0.5 * (v2 + v3 - v4))