function [wh_x_de,wh_x_re]=uLSIF(x_de,x_nu,x_re,sigma_list,lambda_list,b,fold)
%
% Unconstrained least-squares importance fitting (with leave-one-out cross validation)
%
% Estimating ratio of probability densities
%   \frac{ p_{nu}(x) }{ p_{de}(x) }
% from samples
%    { xde_i | xde_i\in R^{d} }_{i=1}^{n_{de}} 
% drawn independently from p_{de}(x) and samples
%    { xnu_i | xnu_i\in R^{d} }_{i=1}^{n_{nu}} 
% drawn independently from p_{nu}(x).
%
% Usage:
%       [wh_x_de,wh_x_re]=uLSIF(x_de,x_nu,x_re,sigma_list,lambda_list,b)
%
% Input:
%    x_de:         d by n_de sample matrix corresponding to `denominator' (iid from density p_de)
%    x_nu:         d by n_nu sample matrix corresponding to `numerator'   (iid from density p_nu)
%    x_re:         (OPTIONAL) d by n_re reference sample matrix
%    sigma_list:   (OPTIONAL) Gaussian width
%                  If sigma_list is a vector, one of them is selected by cross validation.
%                  If sigma_list is a scalar, this value is used without cross validation.
%                  If sigma_list is empty/undefined, Gaussian width is chosen from
%                  some default canditate list by cross validation.
%    lambda_list: (OPTIONAL) regularization parameter
%                 If lambda_list is a vector, one of them is selected by cross validation.
%                 If lambda_list is a scalar, this value is used without cross validation
%                 If lambda_list is empty, Gaussian width is chosen from
%                 some default canditate list by cross validation
%    b:           (OPTINLAL) positive integer representing the number of kernels (default: 100)
%    fold:        (OPTINLAL) positive integer representing the number of folds
%                 in cross validation / 0: leave-one-out (default: 0)
%
% Output:
%    wh_x_de:     estimates of density ratio w=p_nu/p_de at x_de
%    wh_x_re:     estimates of density ratio w=p_nu/p_de at x_re (if x_re is provided)
%
% (c) Masashi Sugiyama, Department of Compter Science, Tokyo Institute of Technology, Japan.
%     sugi@cs.titech.ac.jp,     http://sugiyama-www.cs.titech.ac.jp/~sugi/software/uLSIF/

  if nargin<2
    error('number of input arguments is not enough!!!')
  end

  [d,   n_de]=size(x_de);
  [d_nu,n_nu]=size(x_nu);
  if d~=d_nu
    error('dimension of two samples are diferent!!!')
  end
  
  if nargin<4 || isempty(sigma_list)
    sigma_list=logspace(-3,1,9); % Candidates of Gaussian width
  elseif sum(sigma_list<=0)>0
    error('Gaussian width must be positive')
  end

  if nargin<5 || isempty(lambda_list)
    lambda_list=logspace(-3,1,9); % Candidates of regularization parameter
  elseif sum(lambda_list<0)>0
    error('regularization parameter must be non-negative')
  end

  if nargin<6 || isempty(b)
    b = 100;
  end  

  if nargin<7 || isempty(fold)
    fold = 0; %leave-one-out
  end  

  disp('Run uLSIF')

  %%%%%%%%%%%%%%%% Choose Gaussian kernel center `x_ce'
  rand_index=randperm(n_nu);
  b=min(b,n_nu);
  x_ce=x_nu(:,rand_index(1:b)); 
  n_min=min(n_de,n_nu);

  x_de2=sum(x_de.^2,1);
  x_nu2=sum(x_nu.^2,1);
  x_ce2=sum(x_ce.^2,1);
  dist2_x_de=repmat(x_ce2',[1 n_de])+repmat(x_de2,[b 1])-2*x_ce'*x_de;
  dist2_x_nu=repmat(x_ce2',[1 n_nu])+repmat(x_nu2,[b 1])-2*x_ce'*x_nu;
  
  score_cv=zeros(length(sigma_list),length(lambda_list));
  
  if length(sigma_list)==1 && length(lambda_list)==1 % need cross-validation?
    sigma_chosen=sigma_list;
    lambda_chosen=lambda_list;
  else 
    %%%%%%%%%%%%%%%% Searching Gaussian kernel width `sigma_chosen'
    %%%%%%%%%%%%%%%% and regularization parameter `lambda_chosen' 

    if fold~=0 % k-fold cross-validation
      cv_index_nu=randperm(n_nu);
      cv_split_nu=floor([0:n_nu-1]*fold./n_nu)+1;
      cv_index_de=randperm(n_de);
      cv_split_de=floor([0:n_de-1]*fold./n_de)+1;
    end
    
    for sigma_index=1:length(sigma_list)
      sigma=sigma_list(sigma_index);
      K_de=exp(-dist2_x_de/(2*sigma^2));
      K_nu=exp(-dist2_x_nu/(2*sigma^2));
      if fold==0 % leave-one-out cross-validation
        K_de2=K_de(:,1:n_min);
        K_nu2=K_nu(:,1:n_min);
        H=K_de*K_de'/size(K_de,2);
        h=mean(K_nu,2);
      end
      
      for lambda_index=1:length(lambda_list)
        lambda=lambda_list(lambda_index);

        if fold==0 % leave-one-out cross-validation
          C=H+lambda*(n_de-1)/n_de*eye(b);
          invC=inv(C);           
          beta=invC*h;
          invCK_de=invC*K_de2;
          tmp=n_de*ones(1,n_min)-sum(K_de2.*invCK_de,1);
          B0=beta*ones(1,n_min)+invCK_de*diag((beta'*K_de2)./tmp);
          B1=invC*K_nu2+invCK_de*diag(sum(K_nu2.*invCK_de,1)./tmp);
          A=max(0,(n_de-1)/(n_de*(n_nu-1))*(n_nu*B0-B1));
          wh_x_de2=sum(K_de2.*A,1)';
          wh_x_nu2=sum(K_nu2.*A,1)';
          score_cv(sigma_index,lambda_index)=mean(wh_x_de2.^2)/2-mean(wh_x_nu2);
        
        else % k-fold cross-validation
          score_tmp=zeros(1,fold);

          for k=1:fold
            Ktmp=K_de(:,cv_index_de(cv_split_de~=k));
            alphat_cv=mylinsolve(Ktmp*Ktmp'/size(Ktmp,2)+lambda*eye(b), ...
                                 mean(K_nu(:,cv_index_nu(cv_split_nu~=k)),2));
            alphah_cv=max(0,alphat_cv);
            score_tmp(k)=mean((K_de(:,cv_index_de(cv_split_de==k))'*alphah_cv).^2)/2 ...
                -mean(K_nu(:,cv_index_nu(cv_split_nu==k))'*alphah_cv);
          end % for fold

          score_cv(sigma_index,lambda_index)=mean(score_tmp);
        end % if fold==0
        
      end % for lambda_index
    end % for sigma_index
    
    [score_cv_tmp,lambda_chosen_index]=min(score_cv,[],2);
    [score,sigma_chosen_index]=min(score_cv_tmp);
    lambda_chosen=lambda_list(lambda_chosen_index(sigma_chosen_index));
    sigma_chosen=sigma_list(sigma_chosen_index);
  end %cross-validation

  disp(sprintf('sigma = %g, lambda = %g',sigma_chosen,lambda_chosen))

  %%%%%%%%%%%%%%%% Computing the final solution `wh_x_de'
  K_de=exp(-dist2_x_de/(2*sigma_chosen^2));
  K_nu=exp(-dist2_x_nu/(2*sigma_chosen^2));
  alphat=mylinsolve(K_de*K_de'/n_de+lambda_chosen*eye(b),mean(K_nu,2));
  alphah=max(0,alphat);
  wh_x_de=alphah'*K_de;
  
  if nargin<3 || isempty(x_re)
    wh_x_re=nan;
  else
    [d,   n_re]=size(x_re);
    x_re2=sum(x_re.^2,1);
    dist2_x_re=repmat(x_ce2',[1 n_re])+repmat(x_re2,[b 1])-2*x_ce'*x_re;
    wh_x_re=alphah'*exp(-dist2_x_re/(2*sigma_chosen^2));
  end
  
