doc/html/rankingsvm_8hpp_source.html

#ifndef RANKINGSVM_H

#define RANKINGSVM_H


#include <libcmaes/eo_matrix.h>

#include <algorithm>
#include <cmath>
#include <cstdlib>
#include <iostream>
#include <limits>
#include <random>
#include <vector>


/**
 * \brief Kernel base class.
 *
 * Declares the two operations a kernel exposes: K() to evaluate the kernel
 * between two points, and init() to prepare the kernel from a data matrix.
 * Neither member is virtual, and K() is only declared here (no definition
 * is visible in this file); the kernels deriving from this class each
 * define their own K().
 */
class SVMKernel
{
 public:
  SVMKernel() {}

  ~SVMKernel() {}

  /**
   * \brief kernel value between two points.
   * @param x1 first point
   * @param x2 second point
   * @return kernel value K(x1,x2)
   */
  double K(const dVec &x1, const dVec &x2);

  /**
   * \brief initialization hook, does nothing in the base class.
   * @param x data matrix (ignored here)
   */
  void init(const dMat & /*x*/) {}
};


/**
 * \brief Linear kernel.
 *
 * K(x1,x2) is the inner product x1^T x2. The kernel has no parameters and
 * inherits the no-op init() from SVMKernel.
 */
class LinearKernel : public SVMKernel
{
 public:
  LinearKernel() : SVMKernel() {}

  ~LinearKernel() {}

  /**
   * \brief inner product of two points.
   * @param x1 first point
   * @param x2 second point
   * @return x1^T x2
   */
  double K(const dVec &x1, const dVec &x2)
  {
    const double inner = x1.transpose()*x2;
    return inner;
  }
};


/**
 * \brief Polynomial kernel.
 *
 * K(x1,x2) = (x1^T x2 + c)^d, where the degree d and the offset c are
 * compile-time template parameters (c defaults to 1).
 */
template <int d, int c = 1>
class PolyKernel : public SVMKernel
{
 public:
  PolyKernel() : SVMKernel() {}

  ~PolyKernel() {}

  /**
   * \brief polynomial kernel value between two points.
   * @param x1 first point
   * @param x2 second point
   * @return (x1^T x2 + c)^d
   */
  double K(const dVec &x1, const dVec &x2)
  {
    const double shifted = x1.transpose()*x2 + c;
    return pow(shifted,d);
  }
};


/**
 * \brief Radial Basis Function kernel.
 *
 * K(x1,x2) = exp(-gamma * ||x1-x2||^2). The bandwidth gamma is derived from
 * the data by init(): sigma = _sigma_a * avgdist^_sigma_pow and
 * gamma = 1 / (2 sigma^2), where avgdist is the mean Euclidean distance
 * over all pairs of columns of the data matrix.
 */
class RBFKernel : public SVMKernel
{
 public:
  RBFKernel()
    :SVMKernel()
  {}

  ~RBFKernel() {}

  /**
   * \brief RBF kernel value between two points.
   * @param x1 first point
   * @param x2 second point
   * @return exp(-_gamma * ||x1-x2||^2)
   */
  double K(const dVec &x1, const dVec &x2)
  {
    return std::exp(-_gamma*((x1-x2).squaredNorm()));
  }

  /**
   * \brief sets _gamma from the average pairwise distance between points.
   *
   * When the bandwidth cannot be estimated (fewer than two columns, or a
   * degenerate set of points yielding a non-finite gamma), _gamma is left
   * at its current value instead of becoming NaN or infinite.
   *
   * @param x data matrix, one point per column
   */
  void init(const dMat &x)
  {
    const auto npoints = x.cols();
    if (npoints < 2)
      return; // no pair of points: the average distance would be 0/0.

    double avgdist = 0.0;
    for (int i=0;i<npoints;i++)
      {
        for (int j=i+1;j<npoints;j++)
          avgdist += (x.col(i)-x.col(j)).norm();
      }
    avgdist /= 0.5*(npoints*(npoints-1.0)); // number of distinct pairs.

    const double sigma = _sigma_a * std::pow(avgdist,_sigma_pow);
    const double gamma = 1.0/(2.0*sigma*sigma);
    if (!std::isfinite(gamma))
      return; // e.g. all points identical (sigma == 0): keep previous gamma.
    _gamma = gamma;

    //debug
    //std::cout << "avgdist=" << avgdist << " / sigma=" << sigma << " / gamma=" << _gamma << std::endl;
    //debug
  }

  double _gamma = 1.0;     /**< kernel bandwidth, overwritten by init(). */
  double _sigma_a = 1.0;   /**< multiplicative factor applied to avgdist^_sigma_pow. */
  double _sigma_pow = 1.0; /**< exponent applied to the average distance. */
};


template<class TKernel=RBFKernel>


class RankingSVM

{

 public:

  RankingSVM()

  {

    _udist = std::uniform_real_distribution<>(0,1);

  }


  ~RankingSVM()

  {

  }


  void train(dMat &x,

         const int &niter,

         const dMat &covinv,

         const dVec &xmean)

  {

    //debug

    //std::cout << "Learning RSVM with niter=" << niter << std::endl;

    //debug


    // init structures.

    int nalphas = x.cols()-1;

    _C = dMat::Constant(nalphas,1,_Cval);

    for (int i=0;i<nalphas;i++)

      _C(nalphas-1-i) = _Cval*pow(nalphas-i,2);

    _dKij = dMat::Zero(nalphas,nalphas);

    _alpha = dVec::Zero(nalphas);


    if (_encode)

      encode(x,covinv,xmean);

    compute_training_kernel(x);

    optimize(x,niter);


    //debug

    //std::cout << "alpha=" << _alpha.transpose() << std::endl;

    //debug

  }


  void predict(dVec &fit,

           dMat &x_test,

           dMat &x_train,

           const dMat &covinv,

           const dVec &xmean)

  {

    if (_alpha.size() == 0)

      return; // model is not yet trained.

    fit = dVec::Zero(x_test.cols());

    if (_encode)

      {

    encode(x_train,covinv,xmean);

    encode(x_test,covinv,xmean);

      }

#pragma omp parallel for

    for (int i=0;i<x_test.cols();i++)

      {

    dVec Kvals(x_train.cols());

    for (int j=0;j<x_train.cols();j++)

      Kvals(j) = _kernel.K(x_test.col(i),x_train.col(j));

    double curfit = 0.0;

    for (int j=0;j<x_train.cols()-1;j++)

      curfit += _alpha(j) * (Kvals(j)-Kvals(j+1));

    fit(i) = curfit;

      }


    //debug

    //std::cout << "fit=" << fit.transpose() << std::endl;

    //debug

  }


  void encode(dMat &x,

          const dMat &covinv,

          const dVec &xmean)

  {

    for (int i=0;i<x.cols();i++)

      x.col(i) -= xmean;

    if (covinv.cols() > 1)

      x = covinv * x;

    else

      {

    for (int i=0;i<x.cols();i++)

      x.col(i) = covinv.cwiseProduct(x.col(i));

      }

  }


  void compute_training_kernel(dMat &x)

  {

    _kernel.init(x);

    _K = dMat::Zero(x.cols(),x.cols());

#pragma omp parallel for

      for (int i=0;i<_K.rows();i++)

    for (int j=i;j<_K.cols();j++)

      _K(i,j)=_K(j,i)=_kernel.K(x.col(i),x.col(j));


    //debug

    //std::cout << "K=" << _K << std::endl;

    //debug

  }


  void optimize(const dMat &x,

        const int &niter)

  {

    // initialization of temporary variables

    dVec sum_alphas = dVec::Zero(_dKij.cols());

    dMat div_dKij = dMat::Zero(_dKij.rows(),_dKij.cols());

#pragma omp parallel

    {

#pragma omp for

      for (int i=0;i<_dKij.rows();i++)

    {

      for (int j=0;j<_dKij.cols();j++)

        {

          _dKij(i,j) = _K(i,j) - _K(i,j+1) - _K(i+1,j) + _K(i+1,j+1);

        }

      double fact = _udist(_rng);

      _alpha(i) = _C(i) * (0.95 + 0.05*fact);

    }

#pragma omp for

      for (int i=0;i<_dKij.rows();i++)

    {

      double sum_alpha = 0.0;

      for (int j=0;j<_dKij.cols();j++)

        {

          sum_alpha += _alpha(j) * _dKij(i,j);

          div_dKij(i,j) = _dKij(i,j) / _dKij(j,j);

        }

      sum_alphas(i) = (_epsilon - sum_alpha) / _dKij(i,i);

    }

    }


    // optimize for niter

    double L=0.0;

    int i1 = 0;

    double old_alpha = 0.0, new_alpha = 0.0, delta_alpha = 0.0;

    for (int i=0;i<niter;i++)

      {

    i1 = i % _dKij.cols();

    old_alpha = _alpha(i1);

    new_alpha = old_alpha + sum_alphas(i1);

    new_alpha = std::max(std::min(new_alpha,_C(i1)),0.0);

    delta_alpha = new_alpha - old_alpha;

    double dL = delta_alpha * _dKij(i1,i1) * (sum_alphas(i1) - 0.5*delta_alpha + _epsilon);

    if (dL > 0)

      {

        sum_alphas -= delta_alpha * div_dKij.row(i1);

        _alpha(i1) = new_alpha;

      }

    L += dL;

      }

  }


  double error(dMat &x_test,

           dMat &x_train,

           const dVec &ref_fit,

           const dMat &covinv,

           const dVec &xmean)

  {

    dVec fit;

    predict(fit,x_test,x_train,covinv,xmean);

    if (fit.size() == 0)

      return 1.0;

    double err = 0.0;

    double sum = 0.0;

    for (int i=0;i<ref_fit.size();i++)

      {

    for (int j=0;j<ref_fit.size();j++)

      {

        if (i != j)

          {

        err += ((ref_fit(i) > ref_fit(j) && fit(i) < fit(j)) || (ref_fit(i) < ref_fit(j) && fit(i) > fit(j))) ? 1 : 0;

        sum++;

          }

      }

      }

    err /= static_cast<double>((ref_fit.size()*ref_fit.size())-ref_fit.size());

    return err;

  }


 public:

  bool _encode = false;

  dMat _K;

  dVec _alpha;

  dMat _dKij;

  dMat _C;

  double _Cval = 1e6;

  double _epsilon = 1.0;


  TKernel _kernel;

  std::mt19937 _rng;

  std::uniform_real_distribution<> _udist;

};


#endif

LinearKernel
linear kernel
Definition rankingsvm.hpp:56

PolyKernel
Polynomial kernel.
Definition rankingsvm.hpp:72

RBFKernel
Radial Basis Function kernel.
Definition rankingsvm.hpp:87

RankingSVM
Ranking SVM algorithm with support for custom kernels.
Definition rankingsvm.hpp:122

RankingSVM::_Cval
double _Cval
Definition rankingsvm.hpp:352

RankingSVM::_kernel
TKernel _kernel
Definition rankingsvm.hpp:355

RankingSVM::error
double error(dMat &x_test, dMat &x_train, const dVec &ref_fit, const dMat &covinv, const dVec &xmean)
computes the ranker's error over a dataset
Definition rankingsvm.hpp:318

RankingSVM::train
void train(dMat &x, const int &niter, const dMat &covinv, const dVec &xmean)
trains a ranker from a set of points
Definition rankingsvm.hpp:142

RankingSVM::predict
void predict(dVec &fit, dMat &x_test, dMat &x_train, const dMat &covinv, const dVec &xmean)
predicts a ranking from a learnt ranker
Definition rankingsvm.hpp:180

RankingSVM::compute_training_kernel
void compute_training_kernel(dMat &x)
pre-computation of the kernel values for all pairs of examples
Definition rankingsvm.hpp:236

RankingSVM::_C
dMat _C
Definition rankingsvm.hpp:351

RankingSVM::_K
dMat _K
Definition rankingsvm.hpp:348

RankingSVM::optimize
void optimize(const dMat &x, const int &niter)
optimizes a ranker's model given a training set x
Definition rankingsvm.hpp:255

RankingSVM::_alpha
dVec _alpha
Definition rankingsvm.hpp:349

RankingSVM::encode
void encode(dMat &x, const dMat &covinv, const dVec &xmean)
encodes a set of points into a transformed space
Definition rankingsvm.hpp:217

RankingSVM::_encode
bool _encode
Definition rankingsvm.hpp:346

SVMKernel
Kernel base class.
Definition rankingsvm.hpp:43