
clear all
clc
close all



% rnd_s = randi(100000);
% rng(rnd_s);

rng(7);


d = 4;
k = 2;

% A = [0.99106488, 0.0816012, 0.05;...
%     0.0541349, 0.990121, 0.0708383;...
%     0.08,0.04,0.990132655];
% B = [-0.8900150808;-0.880096;0.667345];
% C = [0.8510150808;-0.751096;-0.791345];
%
%
% Ru = 1*eye(k);
% gamma = sqrt(1);
% Rv = gamma^2*eye(k);
% Q = 1*eye(d);

max_iter = 5000;

Dist_NE = zeros(max_iter,3); % 3 means 3 cases: double-loop, N_L=50, primal-dual
P_2_NE = zeros(max_iter,3);



%% Hard case
A = 1.2*eye(d)+1*rand(d,d);
B = rand(d,k);
C = 0.02*rand(d,k);


Ru = 1*eye(k)+1*rand(1)*eye(k);
gamma = sqrt(1);
Rv = gamma^2*eye(k);
Q = eye(d)+0.1*rand(1)*eye(d);



%% iterative dare
% P2 = my_gare(A,B,C,Q,Ru,Rv)
%
% min(eig(Rv-C'*P2*C))
% min(eig(Ru+B'*P2*B))
%
% Ks2 = (Ru+B'*P2*B-B'*P2*C*((-Rv+C'*P2*C)\(C'*P2*B)))\(B'*P2*A-(B'*P2*C/(-Rv+C'*P2*C))*C'*P2*A)
% Ls2 = (-Rv+C'*P2*C-C'*P2*B*((Ru+B'*P2*B)\(B'*P2*C)))\(C'*P2*A-(C'*P2*B/(Ru+B'*P2*B))*B'*P2*A)
%
% P22 = solvePKL(A,B,C,Q,Ru,Rv,Ks2,Ls2)

% set an initial K0, calculate Hinf under it, and then perturb the Hinf
% bound

while (true)
    ini_range = 5;
    K0 = ini_range*rand(k,d)-ini_range/2;
    if max(abs(eig(A-B*K0)))<1
        break;
    end
end


sys = ss((A-B*K0),C,(Q+K0'*Ru*K0)^(1/2),0,[]);

% HinfNK0 = norm(sys,Inf,1e-6);
HinfNK0 = hinfnorm(sys,1e-6)

Rv = HinfNK0^2*eye(k)*(1-1*rand(1)); % the larger, the better


P2 = my_gare(A,B,C,Q,Ru,Rv)

min(eig(Rv-C'*P2*C))
min(eig(Ru+B'*P2*B))

Ks2 = (Ru+B'*P2*B-B'*P2*C*((-Rv+C'*P2*C)\(C'*P2*B)))\(B'*P2*A-(B'*P2*C/(-Rv+C'*P2*C))*C'*P2*A)
Ls2 = (-Rv+C'*P2*C-C'*P2*B*((Ru+B'*P2*B)\(B'*P2*C)))\(C'*P2*A-(C'*P2*B/(Ru+B'*P2*B))*B'*P2*A)

P22 = solvePKL(A,B,C,Q,Ru,Rv,Ks2,Ls2)


%% Robustify K_0

sys_ini = ss((A-B*K0),C,(Q+K0'*Ru*K0)^(1/2),0,[]);
HinfNK_ini = hinfnorm(sys_ini,1e-6)


K0 = Robustify_Zeroth_K_1_Point(K0,A,B,C,Q,Ru,Rv);


%% Update 1: double-loop

eta_K = 0.00005;

K_ini = K0;
L_ini = zeros(k,d);


flg = 0;


K_tmp = K_ini;
L_tmp = L_ini;
P_KL_old = zeros(d,d);


step_len_1 = 1;

for steps = 1:max_iter
    steps
    
    test_P_KL = my_gare_gv_K(A,B,C,Q, Ru,Rv,K_tmp);
    test_L_gv_K = (-Rv+C'*test_P_KL*C)\(C'*test_P_KL*(A-B*K_tmp));
    
    Lp_tmp = test_L_gv_K;
    
    
    %     test_P_KL = my_gare_gv_L(A,B,C,Q, Ru,Rv,L_tmp);
    %     test_K_gv_L = (Ru+B'*test_P_KL*B)\(B'*test_P_KL*(A-C*L_tmp));
    
    for j = 1:step_len_1
        P_KL = solvePKL(A,B,C,Q,Ru,Rv,K_tmp,Lp_tmp);
        
        % Gauss-Newton
        %              Kp_tmp = K_tmp - eta_K*2*((Ru+B'*P_KL*B)\((Ru+B'*P_KL*B)*K_tmp-B'*P_KL*(A-C*L_tmp)))
        
        % Natural PG
        Kp_tmp = K_tmp - eta_K*2*((Ru+B'*P_KL*B)*K_tmp-B'*P_KL*(A-C*Lp_tmp));
        
        K_tmp = Kp_tmp;
    end
    
    
    
    K_tmp = Kp_tmp;
    L_tmp = Lp_tmp;
    if max(abs(eig(A-B*K_tmp-C*L_tmp)))>1
        %             pause;
        flg = 1;
        break;
    end
    if max(abs(eig(A-B*K_tmp-C*L_tmp)))<1 && flg == 1
        %             pause;
        flg = 2;
    end
%     Kp_tmp
%     Lp_tmp
    
    Delta_P = P_KL-P_KL_old;
    P_KL_old = P_KL;
    
    P_2_NE(steps,1) = norm(P_KL-P2,2);
    Dist_NE(steps,1) = norm([K_tmp L_tmp]-[Ks2 Ls2],2);
    
    max(abs(eig(A-B*K_tmp-C*L_tmp)))
end


%% Update 2: N_L=50

eta_K = 0.00007;
eta_L = 0.00007;

K_ini = K0;
L_ini = zeros(k,d);

flg = 0;


K_tmp = K_ini;
L_tmp = L_ini;
P_KL_old = zeros(d,d);



step_len_2 = 50;
step_len_1 = 1;

for steps = 1:max_iter
    steps
    
    %     test_P_KL = my_gare_gv_K(A,B,C,Q, Ru,Rv,K_tmp);
    %     test_L_gv_K = (-Rv+C'*test_P_KL*C)\(C'*test_P_KL*(A-B*K_tmp));
    
    for j = 1:step_len_2
        P_KL = solvePKL(A,B,C,Q,Ru,Rv,K_tmp,L_tmp);
        
        % Gauss-Newton
        %         Lp_tmp = L_tmp + eta_L*2*((Rv-C'*P_KL*C)\((-Rv+C'*P_KL*C)*L_tmp-C'*P_KL*(A-B*K_tmp)))
        
        % Natural PG
        Lp_tmp = L_tmp + eta_L*2*((-Rv+C'*P_KL*C)*L_tmp-C'*P_KL*(A-B*K_tmp));
        
        L_tmp = Lp_tmp;
        
    end
    
    
    %     test_P_KL = my_gare_gv_L(A,B,C,Q, Ru,Rv,L_tmp);
    %     test_K_gv_L = (Ru+B'*test_P_KL*B)\(B'*test_P_KL*(A-C*L_tmp));
    
    for j = 1:step_len_1
        P_KL = solvePKL(A,B,C,Q,Ru,Rv,K_tmp,Lp_tmp);
        
        % Gauss-Newton
        %              Kp_tmp = K_tmp - eta_K*2*((Ru+B'*P_KL*B)\((Ru+B'*P_KL*B)*K_tmp-B'*P_KL*(A-C*L_tmp)))
        
        % Natural PG
        Kp_tmp = K_tmp - eta_K*2*((Ru+B'*P_KL*B)*K_tmp-B'*P_KL*(A-C*Lp_tmp));
        
        K_tmp = Kp_tmp;
    end
    
    
    
    K_tmp = Kp_tmp;
    L_tmp = Lp_tmp;
    if max(abs(eig(A-B*K_tmp-C*L_tmp)))>1
        %             pause;
        flg = 1;
        break;
    end
    if max(abs(eig(A-B*K_tmp-C*L_tmp)))<1 && flg == 1
        %             pause;
        flg = 2;
    end
%     Kp_tmp
%     Lp_tmp
    
    Delta_P = P_KL-P_KL_old;
    P_KL_old = P_KL;
    
    P_2_NE(steps,2) = norm(P_KL-P2,2);
    Dist_NE(steps,2) = norm([K_tmp L_tmp]-[Ks2 Ls2],2);
    
    max(abs(eig(A-B*K_tmp-C*L_tmp)))
end

%% Update 3: Primal-Dual

eta_K = 0.0001;
eta_L = 0.0001;

K_ini = K0;
L_ini = zeros(k,d);


flg = 0;



K_tmp = K_ini;
L_tmp = L_ini;
P_KL_old = zeros(d,d);



step_len_2 = 1;
step_len_1 = 1;

for steps = 1:max_iter
    steps
    
    %     test_P_KL = my_gare_gv_K(A,B,C,Q, Ru,Rv,K_tmp);
    %     test_L_gv_K = (-Rv+C'*test_P_KL*C)\(C'*test_P_KL*(A-B*K_tmp));
    
    for j = 1:step_len_2
        P_KL = solvePKL(A,B,C,Q,Ru,Rv,K_tmp,L_tmp);
        
        % Gauss-Newton
        %         Lp_tmp = L_tmp + eta_L*2*((Rv-C'*P_KL*C)\((-Rv+C'*P_KL*C)*L_tmp-C'*P_KL*(A-B*K_tmp)))
        
        % Natural PG
        Lp_tmp = L_tmp + eta_L*2*((-Rv+C'*P_KL*C)*L_tmp-C'*P_KL*(A-B*K_tmp));
        
    end
    
    
    %     test_P_KL = my_gare_gv_L(A,B,C,Q, Ru,Rv,L_tmp);
    %     test_K_gv_L = (Ru+B'*test_P_KL*B)\(B'*test_P_KL*(A-C*L_tmp));
    
    for j = 1:step_len_1
        P_KL = solvePKL(A,B,C,Q,Ru,Rv,K_tmp,L_tmp);
        
        % Gauss-Newton
        %              Kp_tmp = K_tmp - eta_K*2*((Ru+B'*P_KL*B)\((Ru+B'*P_KL*B)*K_tmp-B'*P_KL*(A-C*L_tmp)))
        
        % Natural PG
        Kp_tmp = K_tmp - eta_K*2*((Ru+B'*P_KL*B)*K_tmp-B'*P_KL*(A-C*L_tmp));
        
    end
    
    
    
    K_tmp = Kp_tmp;
    L_tmp = Lp_tmp;
    if max(abs(eig(A-B*K_tmp-C*L_tmp)))>1
        %             pause;
        flg = 1;
        break;
    end
    if max(abs(eig(A-B*K_tmp-C*L_tmp)))<1 && flg == 1
        %             pause;
        flg = 2;
    end
%     Kp_tmp
%     Lp_tmp
    
    Delta_P = P_KL-P_KL_old;
    P_KL_old = P_KL;
    
    P_2_NE(steps,3) = norm(P_KL-P2,2);
    Dist_NE(steps,3) = norm([K_tmp L_tmp]-[Ks2 Ls2],2);
    
    max(abs(eig(A-B*K_tmp-C*L_tmp)))
end





save LQG_Hinf_initialization_RARL_plot_Sec5_Zeroth_Order_1_Point_res


plot_ind = 1:3;
% cmap = colormap(hsv(length(plot_ind)*10));
color_marker_tt = {'ro','g*','bx'};
% color_ind = randperm(length(plot_ind)*2,length(plot_ind));

h1 = figure;
for i = 1:length(plot_ind)
    semilogy(Dist_NE(:,plot_ind(i)),color_marker_tt{i},'MarkerSize',6,'LineWidth',2)
    hold on
end
set(gca,'FontSize', 24,'FontName', 'Times New Roman');
legend({'Double Loop','Descent Ascent $N_L=50$','Simultaneous Update'},'Interpreter','Latex')
xlabel('Iterations','Interpreter','Latex')
ylabel('$\|K-K^*\|_2+\|L-L^*\|_2$','Interpreter','Latex')

h2 = figure;
for i = 1:length(plot_ind)
    semilogy(P_2_NE(:,plot_ind(i)),color_marker_tt{i},'MarkerSize',6,'LineWidth',2)
    hold on
end
set(gca,'FontSize', 24,'FontName', 'Times New Roman');
legend({'Double Loop','Descent Ascent $N_L=50$','Simultaneous Update'},'Interpreter','Latex')
xlabel('Iterations','Interpreter','Latex')
ylabel('$\|P_{K,L}-P^{*}\|_2$','Interpreter','Latex')




