refman/html/test__working___fitting_gradient_i_g_soft_8cpp_source.html

 #include <iostream>

 #include <Pds/Ra>

 #include <Pds/Ml>

 #include <Pds/Sp>


 namespace Pds{
 namespace LogisticModel{

 /// Experimental iterative fit: starts at W0, steps along the direction given by
 /// GradientCostInformationGainSoft2() and returns the weights with the highest
 /// CostInformationGain() seen. Reads its settings from Conf and writes
 /// LastError/LastIter back into it.
 Pds::Vector FittingGradientIGSoft(Pds::IterationConf &Conf,
                                   const Pds::Matrix &X,
                                   const Pds::Vector &Y,
                                   const Pds::Vector &W0);

 /// Numerical gradient of CostInformationGainSoft() with respect to W,
 /// using central differences of half-width h on every element of W.
 /// Returns an empty vector on invalid input or when h is zero.
 Pds::Vector GradientCostInformationGainSoft(const Pds::Vector &W,
                                             const Pds::Matrix &X,
                                             const Pds::Vector &Y,
                                             double h);

 /// Closed-form gradient expression built from Pds::Sigmoid(R*W), Pds::Hb and
 /// Pds::Logit2. Also prints its intermediate values to std::cout.
 /// Returns an empty vector on invalid input.
 Pds::Vector GradientCostInformationGainSoft2(const Pds::Vector &W,
                                              const Pds::Matrix &X,
                                              const Pds::Vector &Y);

 /// Entropy-difference cost of the split that Classify(W,X) induces on the
 /// labels Y (thresholded at 0.5). Returns Pds::Ra::Nan on invalid input.
 double CostInformationGainSoft(const Pds::Vector &W,
                                const Pds::Matrix &X,
                                const Pds::Vector &Y);

 }//LogisticModel
 }//Pds


 /**
  * Entropy-difference ("information gain" style) cost of the split produced by
  * the classifier W over the samples X with labels Y.
  *
  * The labels are thresholded with Y.Geq(0.5) and the classifier output is
  * taken from Pds::LogisticModel::Classify(W,X). With
  *   L  = number of samples,
  *   Nt = sum of thresholded labels,
  *   Na = sum of classifier outputs,
  *   N1 = dot product of thresholded labels and classifier outputs,
  * the result is  Et - (Na/L)*E1 - ((L-Na)/L)*E0, where every E is
  * Pds::qHbn(ratio,q)/Pds::qHbn(0.5,q) with q=2.
  *
  * \param W  Weight vector; must have X.Ncol()+1 rows.
  * \param X  Sample matrix, one sample per row.
  * \param Y  Label vector with X.Nlin() rows.
  * \return   The cost, or Pds::Ra::Nan if any input is empty or the sizes
  *           do not match.
  */
 double Pds::LogisticModel::CostInformationGainSoft( const Pds::Vector &W,
                                                     const Pds::Matrix &X,
                                                     const Pds::Vector &Y)
 {
     if(W.IsEmpty())             return Pds::Ra::Nan;
     if(X.IsEmpty())             return Pds::Ra::Nan;
     if(Y.IsEmpty())             return Pds::Ra::Nan;

     if(X.Nlin()!=Y.Nlin())      return Pds::Ra::Nan;
     if(X.Ncol()!=(W.Nlin()-1))  return Pds::Ra::Nan;

     Pds::Vector Yh=Y.Geq(0.5);
     Pds::Vector z=Pds::LogisticModel::Classify(W,X);

     const double L=Yh.Nlin();

     const double Nt=Yh.Sum();
     const double Na=z.Sum();
     const double N1=Yh.Dot(z);

     /*
     // Information gain (alternative kept for reference)
     double Et=Pds::Hb(Nt/L);
     double E1=Pds::Hb(N1/Na);
     double val=(Nt-N1)/(L-Na);
     if(val>1.0) val=1.0;
     if(val<0)   val=0;
     if(L==Na)   val=1;
     double E0=Pds::Hb(val);
     */

     // Gini index
     const double q=2.0;
     const double F=Pds::qHbn(0.5,q);   // normalisation uses the same q as the terms below

     const double Et=Pds::qHbn(Nt/L,q)/F;

     // Ratio on the "classified as 1" side. When Na==0 the division N1/Na is
     // not finite and would poison the whole result, although this term is
     // weighted by Na/L==0. Use the same placeholder (1) the code already uses
     // for the mirror case L==Na below.
     // NOTE(review): assumes Pds::qHbn(1,q) is finite, as the L==Na branch does.
     double p1=1.0;
     if(Na!=0)   p1=N1/Na;
     const double E1=Pds::qHbn(p1,q)/F;

     // Ratio on the "classified as 0" side, clamped to [0,1].
     double val=(Nt-N1)/(L-Na);
     if(val>1.0) val=1.0;
     if(val<0)   val=0;
     if(L==Na)   val=1;     // empty side: its weight (L-Na)/L is 0
     const double E0=Pds::qHbn(val,q)/F;

     return Et-(Na/L)*E1-((L-Na)/L)*E0;
 }


 /**
  * Numerical gradient of CostInformationGainSoft() with respect to W.
  *
  * Each element n of the result is the central difference
  *   ( Cost(W + h*e_n) - Cost(W - h*e_n) ) / (2*h),
  * where e_n perturbs only element n of W.
  *
  * \param W  Weight vector; must have X.Ncol()+1 rows.
  * \param X  Sample matrix.
  * \param Y  Label vector with X.Nlin() rows.
  * \param h  Perturbation half-width; must be non-zero.
  * \return   Vector with W.Nel() elements, or an empty vector when an input
  *           is empty, the sizes do not match, or h is zero.
  */
 Pds::Vector Pds::LogisticModel::GradientCostInformationGainSoft(const Pds::Vector &W,
                                                                 const Pds::Matrix &X,
                                                                 const Pds::Vector &Y,
                                                                 double h)
 {
     // Input validation (same checks, same order, as the cost function).
     if(W.IsEmpty() || X.IsEmpty() || Y.IsEmpty())
         return Pds::Vector();
     if((X.Nlin()!=Y.Nlin()) || (X.Ncol()!=(W.Nlin()-1)))
         return Pds::Vector();
     if(h==0.0)
         return Pds::Vector();

     unsigned int Nw=W.Nel();

     Pds::Vector Grad(Nw);
     Pds::Vector Wplus(Nw);
     Pds::Vector Wminus(Nw);

     Wplus.Copy(W);
     Wminus.Copy(W);

     for(unsigned int k=0;k<Nw;k++)
     {
         // Perturb only element k in both working copies.
         Wplus.SetRaw(k,W.GetRaw(k)+h);
         Wminus.SetRaw(k,W.GetRaw(k)-h);

         const double slope=( Pds::LogisticModel::CostInformationGainSoft(Wplus,X,Y)
                             -Pds::LogisticModel::CostInformationGainSoft(Wminus,X,Y) )/(2*h);
         Grad.SetRaw(k,slope);

         // Put element k back so the next iteration starts from W again.
         Wplus.SetRaw(k,W.GetRaw(k));
         Wminus.SetRaw(k,W.GetRaw(k));
     }

     return Grad;
 }


 /**
  * Closed-form gradient expression for the soft information-gain cost.
  *
  * Builds the regressor matrix R from X, evaluates z=Sigmoid(R*W) and its
  * element-wise derivative term z*(1-z), forms the two ratios
  *   p1 = N1/Na              and   p2 = (N-N1)/(L-Na)
  * and combines Pds::Hb / Pds::Logit2 of those ratios into two scalar factors
  * that weight R^T*Dz and R^T*(Dz.*Yt).
  *
  * Side effect: prints every intermediate value, both cost functions and the
  * resulting vector to std::cout.
  *
  * NOTE(review): p1 and p2 are not guarded against Na==0 or L==Na.
  *
  * \param W  Weight vector; must have X.Ncol()+1 rows.
  * \param X  Sample matrix.
  * \param Y  Label vector with X.Nlin() rows (thresholded at 0.5).
  * \return   The gradient vector, or an empty vector on invalid input.
  */
 Pds::Vector Pds::LogisticModel::GradientCostInformationGainSoft2(const Pds::Vector &W,
                                                                 const Pds::Matrix &X,
                                                                 const Pds::Vector &Y)
 {
     if(W.IsEmpty() || X.IsEmpty() || Y.IsEmpty())
         return Pds::Vector();
     if((X.Nlin()!=Y.Nlin()) || (X.Ncol()!=(W.Nlin()-1)))
         return Pds::Vector();

     Pds::Vector Labels=Y.Geq(0.5);
     unsigned int Npos=Labels.Sum();     // sum of thresholded labels
     unsigned int Ntot=Labels.Nel();     // number of samples

     Pds::Matrix Reg=Pds::RegressorMatrix(X);
     Pds::Vector Soft=Pds::Sigmoid(Reg*W);
     Pds::Vector dSoft=Soft.Product(1.0-Soft);

     const double Na=Soft.Sum();
     const double N1=Labels.Dot(Soft);
     const double p1=N1/Na;
     const double p2=(Npos-N1)/(Ntot-Na);

     const double h1=Pds::Hb(p1);
     const double h2=Pds::Hb(p2);
     const double Dh1=-Pds::Logit2(p1);
     const double Dh2=-Pds::Logit2(p2);
     /*
     // q-entropy variant (kept for reference)
     double q=4.0;
     double K=Pds::qHbn(0.5,q);
     double h1=Pds::qHbn(p1,q)/K;
     double h2=Pds::qHbn(p2,q)/K;
     double Dh1=Pds::qDHbn(p1,q)/K;
     double Dh2=Pds::qDHbn(p2,q)/K;
     */

     const double factor1=(-h1+h2+p1*Dh1-p2*Dh2)/Ntot;
     const double factor2=(-Dh1+Dh2)/Ntot;

     Pds::Vector DIG=  factor1*Reg.TMul(dSoft)+factor2*Reg.TMul(dSoft.Product(Labels));

     // Diagnostic dump of the intermediate quantities.
     std::cout<<"\n"
              <<"N:"<<Npos<<"\n"
              <<"L:"<<Ntot<<"\n"
              <<"N1:"<<N1<<"\t N1<Na True positive in Na side\n"
              <<"Na:"<<Na<<"\t elems. classify as 1\n"
              <<"p1:"<<p1<<"\n"
              <<"p2:"<<p2<<"\n"
              <<"factor1:"<<factor1<<"\n"
              <<"factor2:"<<factor2<<"\n";
     std::cout<<"IGs:"<<Pds::LogisticModel::CostInformationGainSoft(W,X,Y)<<"\n";
     std::cout<<"IGh:"<<Pds::LogisticModel::CostInformationGain(W,X,Y)<<"\n";
     DIG.T().Print("DIG: ");

     return DIG;
 }


 /**
  * Prints a boxed summary of the initial iteration settings to std::cout.
  *
  * Shows the title str followed by Alpha, MinError (scientific notation) and
  * MaxIter read from Conf. The format flags AND the precision of std::cout
  * are restored before returning: precision is not part of fmtflags, so it
  * has to be saved separately.
  *
  * \param Conf  Configuration whose Alpha, MinError and MaxIter are shown.
  * \param str   Title printed in the first row of the box.
  */
 void print_IterationConf_IG_soft_init_data(Pds::IterationConf Conf,std::string str="")
 {
     const double       Alpha   = Conf.GetAlpha();
     const double       MinError= Conf.GetMinError();
     // Kept as an integer so that large counts are not shown as e.g. 1.234e+04.
     const unsigned int MaxIter = Conf.GetMaxIter();

     const std::ios_base::fmtflags saved_flags( std::cout.flags() );
     const std::streamsize saved_precision = std::cout.precision(4);

     std::cout<<"┌──────────────────────────────┐"<<std::endl;
     std::cout<<"│    "<<std::left<<std::setw(22)<<str<<"    │"<<std::endl;
     std::cout<<"│    IterationConf init data   │"<<std::endl;
     std::cout<<"├──────────────────────────────┤"<<std::endl;
     std::cout<<"│           Alpha: "<<std::setw(10)<<Alpha  <<"  │"<<std::endl;
     std::cout<<"│       MinErrorΔ: "<<std::setw(10)<<std::scientific<<MinError<<std::defaultfloat<<"  │"<<std::endl;
     std::cout<<"│         MaxIter: "<<std::setw(10)<<MaxIter<<"  │"<<std::endl;
     std::cout<<"└──────────────────────────────┘"<<std::endl;

     std::cout.flags( saved_flags );
     std::cout.precision( saved_precision );
 }


 /**
  * Prints a boxed summary of the final iteration state to std::cout.
  *
  * Shows the title str followed by Alpha, Conf.LastError (scientific
  * notation) and Conf.LastIter. The format flags AND the precision of
  * std::cout are restored before returning: precision is not part of
  * fmtflags, so it has to be saved separately.
  *
  * \param Conf  Configuration whose Alpha, LastError and LastIter are shown.
  * \param str   Title printed in the first row of the box.
  */
 void print_IterationConf_IG_soft_end_data(Pds::IterationConf Conf,std::string str="")
 {
     const std::ios_base::fmtflags saved_flags( std::cout.flags() );
     const std::streamsize saved_precision = std::cout.precision(3);

     const double Alpha  = Conf.GetAlpha();

     std::cout<<"┌──────────────────────────────┐"<<std::endl;
     std::cout<<"│    "<<std::left<<std::setw(22)<<str<<"    │"<<std::endl;
     std::cout<<"│    IterationConf end data    │"<<std::endl;
     std::cout<<"├──────────────────────────────┤"<<std::endl;
     std::cout<<"│           Alpha: "<<std::setw(10)<<Alpha<<"  │"<<std::endl;
     std::cout<<"│          ErrorΔ: "<<std::setw(10)<<std::scientific<<Conf.LastError<<std::defaultfloat<<"  │"<<std::endl;
     std::cout<<"│        LastIter: "<<std::setw(10)<<Conf.LastIter<<"  │"<<std::endl;
     std::cout<<"└──────────────────────────────┘"<<std::endl;

     std::cout.flags( saved_flags );
     std::cout.precision( saved_precision );
 }

 /**
  * Prints a six-line boxed progress report for one iteration to std::cout.
  *
  * When END is false the cursor is moved back up over the six printed lines
  * (ANSI "cursor up" followed by carriage return), so the next report
  * overwrites this one. The format flags AND the precision of std::cout are
  * restored before returning: precision is not part of fmtflags, so it has
  * to be saved separately.
  *
  * \param iter        Iteration counter to display.
  * \param Alpha       Step factor to display.
  * \param last_error  Error variation, shown in scientific notation.
  * \param cost_error  Cost ("IG") value, shown in scientific notation.
  * \param END         true for the final report (cursor is left below the box).
  */
 void print_iterative_IG_soft_data(unsigned int iter,double Alpha,double last_error,double cost_error,bool END)
 {
     const std::ios_base::fmtflags saved_flags( std::cout.flags() );
     const std::streamsize saved_precision = std::cout.precision(3);

     std::cout<<std::left
              <<"┌──────────────────────────────┐"<<std::endl
              <<"│            Iter: "<<std::setw(10)<<iter<<"  │"<<std::endl
              <<"│           Alpha: "<<std::setw(10)<<Alpha<<"  │"<<std::endl
              <<"│          ErrorΔ: "<<std::setw(10)<<std::scientific<<last_error<<"  │"<<std::endl
              <<"│              IG: "<<std::setw(10)<<cost_error<<std::defaultfloat<<"  │"<<std::endl
              <<"└──────────────────────────────┘"<<std::endl;

     // One cursor-up per printed line (six lines in the box above).
     if(END==false)
     {
         for(int line=0;line<6;line++) std::cout<<"\x1b[A\r";
     }

     std::cout.flags( saved_flags );
     std::cout.precision( saved_precision );
 }


 /**
  * Experimental iterative fit of a weight vector using the direction given by
  * GradientCostInformationGainSoft2().
  *
  * Starting from W0, every iteration rescales the direction by A/DW.Norm()
  * (A is computed once from W0), updates W, evaluates
  * CostInformationGain(W,X,Y) and remembers the W with the highest cost seen.
  * The loop ends when delta_error <= MinError or iter >= MaxIter.
  *
  * Side effects visible in this function:
  *  - emits a message through pds_print_error_message (the Spanish text says
  *    the function does not work well yet because it is too abrupt);
  *  - prints DW and W on every iteration, plus the boxed reports when Conf.Show;
  *  - calls Pds::Octave::Plot::PointsX2DY on every iteration with the names
  *    "testando.m" and "test_<iter>.png";
  *  - saves the cost and error histories to "ig.txt" and "err.txt";
  *  - writes Alpha (unchanged), LastError and LastIter back into Conf.
  *
  * \param Conf  Iteration settings (Alpha, MinError, MaxIter, Show are read).
  * \param X     Sample matrix.
  * \param Y     Label vector with X.Nlin() rows (thresholded at 0.5).
  * \param W0    Initial weights; must have X.Ncol()+1 rows.
  * \return      Wopt*alpha with alpha fixed at 1.0, or an empty object when an
  *              input is empty or the sizes do not match.
  */
 Pds::Vector Pds::LogisticModel::FittingGradientIGSoft(  Pds::IterationConf &Conf,

                                                         const Pds::Matrix &X,

                                                         const Pds::Vector &Y,

                                                         const Pds::Vector &W0)

 {

     // NOTE(review): these early exits return Pds::Matrix() from a function
     // declared to return Pds::Vector; presumably this relies on a
     // Matrix-to-Vector conversion. The sibling functions return Pds::Vector().
     if(W0.IsEmpty())            return Pds::Matrix();

     if(X.IsEmpty())             return Pds::Matrix();

     if(Y.IsEmpty())             return Pds::Matrix();


     if(X.Nlin()!=Y.Nlin())      return Pds::Matrix();

     if(X.Ncol()!=(W0.Nlin()-1)) return Pds::Matrix();


     // Degenerate label sets: every label >= 0.5, or none. No iteration is
     // run; the result comes straight from GetW0CornerMeanMethod (negated in
     // the second case).
     unsigned int YSUM=Y.Geq(0.5).Sum();

     if(YSUM==Y.Nel())   return Pds::LogisticModel::GetW0CornerMeanMethod(X);

     if(YSUM==0)         return -Pds::LogisticModel::GetW0CornerMeanMethod(X);


     double Alpha=Conf.GetAlpha();

     //double Gamma=Conf.GetGamma();

     //double Lambda=Conf.GetLambda();

     double MinError=Conf.GetMinError();

     // NOTE(review): GetMaxIter is documented as returning unsigned int; it
     // is held as double here and compared against the unsigned iter below.
     double MaxIter=Conf.GetMaxIter();


     pds_print_error_message("Esta función aun no trabaja bien, es demasiado abrupta");


     if(Conf.Show)   print_IterationConf_IG_soft_init_data(Conf,"Gradient IG");


     Pds::Vector W=W0;

     // Best weights seen so far and their cost.
     Pds::Vector Wopt=W;

     // NOTE(review): DIG and DCE are declared but not used by the active code.
     Pds::Vector DIG,DCE;

     double Costmax=-1;

     double Cost;


     // Built from a 5-element vector of 1/5 — presumably a 5-tap moving
     // average applied to last_error below.
     Pds::Fir FIR5(Pds::Vector(5,1.0)/5);

     //double fir5;

     //Pds::Fir FIR10(Pds::Vector(10,1.0)/10);

     //double fir10;


     double last_error=1000, before_error=0,delta_error=1;;

     unsigned int iter=0;


     Pds::Matrix R=Pds::RegressorMatrix(X);

     // NOTE(review): DY, I and Yt are not used by the active code (Yt appears
     // only inside the commented-out scaling block at the end).
     Pds::Vector DY,DW;

     Pds::Matrix I=Pds::Eye(W.Nel());I.SetRaw(0,0,0);

     Pds::Vector Yt;


     // Per-iteration histories, saved to ig.txt / err.txt after the loop.
     std::vector<double> ig;

     std::vector<double> err;


     // Step length, fixed once from the initial weights.
     double A=W.Norm()*0.1+0.01;


     do{

         //double h;

         //h=W.RMS()*0.5;

         //DIG=Pds::LogisticModel::GradientCostInformationGainSoft(W,X,Y,h);

         // DW is the NEGATED gradient; combined with "W=W-Alpha*DW" below the
         // net update is W + Alpha*(A/|grad|)*grad.
         DW=-Pds::LogisticModel::GradientCostInformationGainSoft2(W,X,Y);

         DW.T().Print("DW: ");

         // NOTE(review): no guard for DW.Norm()==0 before this division.
         DW=(A/DW.Norm())*DW;

         DW.T().Print("DW: ");


         W=W-Alpha*DW;


         W.T().Print(" W: ");


         // One plot request per iteration, named after the iteration index.
         Pds::Octave::Plot::PointsX2DY(X,Pds::Sigmoid(R*W),"testando.m","test_"+std::to_string(iter)+".png");


         // Progress is scored with CostInformationGain, not the soft cost.
         Cost=Pds::LogisticModel::CostInformationGain(W,X,Y);


         before_error=last_error;


         last_error  = 1.0-Cost;

         //last_error += (Lambda*0.5/W.Nel())*(W.Dot(W)-W[0]*W[0]);


         // Compares the FIR5 output for the new error with the previous,
         // unfiltered error.
         delta_error=fabs(FIR5.Evaluate(last_error)-before_error);


         if(Cost>Costmax)

         {

             Costmax=Cost;

             Wopt=W;

         }


         ig.push_back(Cost);

         err.push_back(last_error);


         iter++;


         //if(Conf.Show)   print_iterative_IG_soft_data(iter,Alpha,delta_error,Cost,true);


     }while( (delta_error>MinError)&&(iter<MaxIter) );


     if(Conf.Show)   print_iterative_IG_soft_data(iter,Alpha,delta_error,Cost,true);


     // Report the final state back to the caller through Conf.
     Conf.SetAlpha(Alpha);

     Conf.LastError=delta_error;

     Conf.LastIter=iter;


     Pds::Ra::SaveStdVector(ig,"ig.txt");

     Pds::Ra::SaveStdVector(err,"err.txt");


     if(Conf.Show)   print_IterationConf_IG_soft_end_data(Conf,"Gradient IG");


     // Output scale; stays 1.0 because the rescaling block below is disabled.
     double alpha=1.0;

     /*

     double s2;

     Yt=R*Wopt;

     double Delta=0.001;

     Pds::Matrix Yo=Y.Geq(0.5)*(1.0-2*Delta)+Delta;

     s2=Yt.SumSquare();

     if(s2>0)    alpha=Yt.Dot(Pds::Logit(Yo))/s2;

     else        alpha=1;

     */

     return Wopt*alpha;

 }


 /**
  * Rough per-sample spacing estimate for the rows of X.
  *
  * Multiplies the non-zero column ranges (max - min of each column) into a
  * bounding volume S and returns (S / X.Nlin())^(1 / X.Ncol()).
  * Columns whose range is zero are left out of the product, but the exponent
  * still uses the full column count.
  *
  * \param X  Sample matrix, one sample per row.
  * \return   The estimate, or Pds::Ra::Nan when X is empty.
  */
 double average_distance_between_samples(const Pds::Matrix &X)
 {
     if(X.IsEmpty()) return Pds::Ra::Nan;

     Pds::Vector ColMin=X.MinInCols();
     Pds::Vector ColMax=X.MaxInCols();

     unsigned int Ndim=X.Ncol();
     unsigned int Nsamples=X.Nlin();

     double Volume=1;
     for(unsigned int k=0;k<Ndim;k++)
     {
         const double range=fabs(ColMax[k]-ColMin[k]);
         if(range==0) continue;      // a flat column would zero the volume
         Volume*=range;
     }

     return pow(Volume/Nsamples,1.0/Ndim);
 }


 #include "extra_newhb.h"


 // ./test/test_working_FittingGradientIGSoft

 /**
  * Test driver: loads the "band" classification data set, plots it, and then
  * evaluates CostInformationGain and CostXqEntropy over a 128x128 grid of
  * weights (bias fixed at 0.5) to draw both cost surfaces.
  */
 int main(void)
 {
     // Iteration settings. Only the commented-out fitting experiments below
     // consume Conf.
     Pds::IterationConf Conf;
     Conf.Show=true;
     Conf.SetMaxIter(100);
     Conf.SetMinError(1e-07);
     Conf.SetAlpha(0.5);
     Conf.SetLambda(0.0);
     Conf.SetGamma(0.1);
     Pds::Ra::Randomize();

     // Generating data
     /* // Data 1
     Pds::Matrix X(Pds::Ra::TextFormat,"../test/hard-data-x.txt");
     Pds::Vector Y(Pds::Ra::TextFormat,"../test/hard-data-y.txt");
     X=X-X.MeanInCols();
     */
     // Data 2
     unsigned int Nsamples=1000;
     Pds::Matrix X;
     Pds::Vector Y;
     Pds::DataSet::Classification::LoadDataBand(Nsamples,X,Y);

     Pds::Octave::XLabel="x_1";
     Pds::Octave::YLabel="x_2";
     Pds::Octave::Plot::PointsX2DY(X,Y,"testando.m","test_working_FittingGradientIGSoft.png");

     /*
     // Experiment: compare the numerical and the closed-form gradients.
     Pds::Vector W,DW;
     for(unsigned int n=0;n<10;n++)
     {
         W=Pds::LogisticModel::GetW0MeanMethod(X);
         double h=W.RMS()*0.001;
         DW=Pds::LogisticModel::GradientCostInformationGainSoft(W,X,Y,h);
         DW.Normalize();
         DW.T().Print("\nDW1: ");
         DW=Pds::LogisticModel::GradientCostInformationGainSoft2(W,X,Y);
         DW.Normalize();
         DW.T().Print("DW2: ");
         //W=Pds::LogisticModel::FittingGradientIGSoft(Conf,X,Y,W);
     }
     */

     /*
     // Experiment: run the fit from a scaled initial guess.
     Pds::Vector W;
     W=10*Pds::LogisticModel::GetW0MeanMethod(X);
     W=Pds::LogisticModel::FittingGradientIGSoft(Conf,X,Y,W);
     */

     // Weight grid: GridSize points in [-HalfWidth, HalfWidth] on each axis.
     unsigned int GridSize=128;
     double HalfWidth=4;
     Pds::Vector w1=Pds::LinSpace(-HalfWidth,HalfWidth,GridSize);
     Pds::Vector w2=Pds::LinSpace(-HalfWidth,HalfWidth,GridSize);
     Pds::Matrix W1,W2;
     Pds::Matrix IG(GridSize,GridSize);
     Pds::Matrix IGsoft(GridSize,GridSize);

     std::cout<<"avr: "<<average_distance_between_samples(X)<<"\n";

     Pds::Meshgrid (w1,w2,W1,W2);

     for(unsigned int row=0;row<GridSize;row++)
     {
         for(unsigned int col=0;col<GridSize;col++)
         {
             Pds::Vector w({0.5,w1[row],w2[col]});

             const double hard_cost=Pds::LogisticModel::CostInformationGain( w,X,Y);
             IG.SetRaw(row,col,hard_cost);

             const double soft_cost=Pds::LogisticModel::CostXqEntropy( w,X,Y,q_factor_val); //w*(100/w.Norm())
             IGsoft.SetRaw(row,col,soft_cost);
         }
     }

     // Do not train the bias
     // Add ||W-w_i|| and start from the best orthogonal

     Pds::Octave::Plot::SurfC(W1,W2,(1-IG),"testando.m","ig_matrix.png");
     Pds::Octave::Plot::SurfC(W1,W2,IGsoft,"testando_soft.m","ig_soft_matrix.png");

     return 0;
 }

Pds::IterationConf
La clase tipo Pds::IterationConf. Esta clase genera una matriz de Nlin líneas y 1 columna...
Definition: IterationConf.hpp:57

Pds::IterationConf::Show
bool Show
Definition: IterationConf.hpp:86

Pds::IterationConf::LastError
double LastError
Definition: IterationConf.hpp:89

Pds::IterationConf::LastIter
double LastIter
Definition: IterationConf.hpp:92

Pds::IterationConf::SetLambda
bool SetLambda(double Lambda)
Coloca el valor lambda.

Pds::IterationConf::SetAlpha
bool SetAlpha(double Alpha)
Coloca el valor alpha.

Pds::IterationConf::GetMinError
double GetMinError(void) const
Devuelve el valor MinError.

Pds::IterationConf::GetAlpha
double GetAlpha(void) const
Devuelve el valor alpha.

Pds::IterationConf::SetMaxIter
bool SetMaxIter(unsigned int MaxIter)
Coloca el valor MaxIter.

Pds::IterationConf::SetMinError
bool SetMinError(double MinError)
Coloca el valor MinError.

Pds::IterationConf::SetGamma
bool SetGamma(double Lambda)
Coloca el valor gamma.

Pds::IterationConf::GetMaxIter
unsigned int GetMaxIter(void) const
Devuelve el valor MaxIter.

Pds::DataSet::Classification::LoadDataBand
void LoadDataBand(unsigned int L, Pds::Matrix &X, Pds::Vector &Y)
Clasificación de datos separados por más de una curva.

Pds::LogisticModel::GetW0CornerMeanMethod
Pds::Vector GetW0CornerMeanMethod(const Pds::Matrix &X, double Delta=0.001)
Obtiene de forma rápida un vector inicial para usar en regresión logística.

Pds::LogisticModel::CostInformationGain
double CostInformationGain(const Pds::Vector &W, const Pds::Matrix &X, const Pds::Vector &Y)
Calculo de costo.

Pds::LogisticModel::Classify
Pds::Vector Classify(const Pds::Vector &W, const Pds::Matrix &X)
Calculo del resultado del clasificador.

Pds::LogisticModel::CostInformationGainSoft
double CostInformationGainSoft(const Pds::Vector &W, const Pds::Matrix &X, const Pds::Vector &Y)
Definition: test_working_FittingGradientIGSoft.cpp:51

Pds::LogisticModel::FittingGradientIGSoft
Pds::Vector FittingGradientIGSoft(Pds::IterationConf &Conf, const Pds::Matrix &X, const Pds::Vector &Y, const Pds::Vector &W0)
Definition: test_working_FittingGradientIGSoft.cpp:254

Pds::LogisticModel::GradientCostInformationGainSoft2
Pds::Vector GradientCostInformationGainSoft2(const Pds::Vector &W, const Pds::Matrix &X, const Pds::Vector &Y)
Definition: test_working_FittingGradientIGSoft.cpp:141

Pds::LogisticModel::CostXqEntropy
double CostXqEntropy(const Pds::Vector &W, const Pds::Matrix &X, const Pds::Vector &Y, double q)
Definition: extra_newhb.h:32

Pds::LogisticModel::GradientCostInformationGainSoft
Pds::Vector GradientCostInformationGainSoft(const Pds::Vector &W, const Pds::Matrix &X, const Pds::Vector &Y, double h)
Definition: test_working_FittingGradientIGSoft.cpp:101

Pds
Nombre de espacio para Pds (Procesamiento Digital de Senales)
Definition: ClassificationMetrics.hpp:42