en/latest/sfa_8cpp_source.html

 /*   This program is free software: you can redistribute it and/or modify

  *   it under the terms of the GNU General Public License as published by

  *   the Free Software Foundation, either version 3 of the License, or

  *   (at your option) any later version.

  *

  *   This program is distributed in the hope that it will be useful,

  *   but WITHOUT ANY WARRANTY; without even the implied warranty of

  *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

  *   GNU General Public License for more details.

  *

  *   You should have received a copy of the GNU General Public License

  *   along with this program.  If not, see <http://www.gnu.org/licenses/>.

  *

  *   Copyright (C) 2009 - 2012 Jun Liu and Jieping Ye

  */


 #include <shogun/lib/slep/flsa/sfa.h>

 #ifdef USE_GPL_SHOGUN


 #include <stdlib.h>

 #include <stdio.h>

 #include <time.h>

 #include <math.h>


 #define delta 1e-10


 /*

    Revision History


    First Version available on October 10, 2009


    A runnable version on October 15, 2009


    Major revision on October 29, 2009

    (Some functions appearing in a previous version have deleted, please refer to the previous version for the old functions.

    Some new functions have been added as well)


 */


 /*


    Files contained in this header file sfa.h:


    1. Algorithms for solving the linear system A A^T z0 = Av (see the description of A from the following context)


    void Thomas(double *zMax, double *z0,

    double * Av, int nn)


    void Rose(double *zMax, double *z0,

    double * Av, int nn)


    int supportSet(double *x, double *v, double *z,

    double *g, int * S, double lambda, int nn)


    void dualityGap(double *gap, double *z,

    double *g, double *s, double *Av,

    double lambda, int nn)


    void dualityGap2(double *gap, double *z,

    double *g, double *s, double *Av,

    double lambda, int nn)


    2. The Subgraident Finding Algorithm (SFA) for solving problem (4) (refer to the description of the problem for detail)


    int sfa(double *x,     double *gap,

    double *z,     double *z0,   double * v,   double * Av,

    double lambda, int nn,       int maxStep,

    double *s,     double *g,

    double tol,    int tau,       int flag)


    int sfa_special(double *x,     double *gap,

    double *z,     double * v,   double * Av,

    double lambda, int nn,       int maxStep,

    double *s,     double *g,

    double tol,    int tau)


    int sfa_one(double *x,     double *gap,

    double *z,     double * v,   double * Av,

    double lambda, int nn,       int maxStep,

    double *s,     double *g,

    double tol,    int tau)


 */


 /*


    Some mathematical background.


    In this file, we discuss how to solve the following subproblem,


    min_x  1/2 \|x-v\|^2  + lambda \|A x\|_1,                 (1)


    which is a key problem used in the Fused Lasso Signal Approximator (FLSA).


    Also, note that, FLSA is a building block for solving the optimation problmes with fused Lasso penalty.


    In (1), x and v are n-dimensional vectors,

    and A is a matrix with size (n-1) x n, and is defined as follows (e.g., n=4):

    A= [ -1  1  0  0;

    0  -1 1  0;

    0  0  -1 1]


    The above problem can be reformulated as the following equivalent min-max optimization problem


    min_x  max_z  1/2 \|x-v\|^2  + <A x, z>

    subject to   \|z\|_{infty} \leq lambda                     (2)


    It is easy to get that, at the optimal point


    x = v - AT z,                             (3)


    where z is the optimal solution to the following optimization problem


    min_z  1/2  z^T A AT z - < z, A v>,

    subject to  \|z\|_{infty} \leq lambda                      (4)


    Let B=A A^T. It is easy to get that B is a (n-1) x (n-1) tridiagonal matrix.

    When n=5, B is defined as:

    B= [ 2  -1   0    0;

    -1  2   -1   0;

    0  -1   2    -1;

    0   0   -1   2]


    Let z0 be the solution to the linear system:


    A A^T * z0 = A * v                  (5)


    The problem (5) can be solve by the Thomas Algorithm, in about 5n multiplications and 4n additions.


    It can also be solved by the Rose's Algorithm, in about 2n multiplications and 2n additions.


    Moreover, considering the special structure of the matrix A (and B),

    it can be solved in about n multiplications and 3n additions


    If lambda \geq \|z0\|_{infty}, x_i= mean(v), for all i,

    the problem (1) admits near analytical solution


    We have also added the restart technique, please refer to our paper for detail!


 */


 /*

 */


 void Thomas(double *zMax, double *z0, double * Av, int nn){


     /*


        We apply the Tomas algorithm for solving the following linear system

        B * z0 = Av

        Thomas algorithm is also called the tridiagonal matrix algorithm


        B=[ 2  -1   0    0;

        -1  2   -1   0;

        0  -1   2    -1;

        0   0   -1   2]


        z0 is the result,  Av is unchanged after the computation


        c is a precomputed nn dimensional vector

        c=[-1/2, -2/3, -3/4, -4/5, ..., -nn/(nn+1)]


        c[i]=- (i+1) / (i+2)

        c[i-1]=- i / (i+1)


        z0 is an nn dimensional vector


 */


     int i;

     double tt, z_max;


     /*

        Modify the coefficients in Av (copy to z0)

        */

     z0[0]=Av[0]/2;

     for (i=1;i < nn; i++){

         tt=Av[i] + z0[i-1];

         z0[i]=tt - tt / (i+2);

     }


     /*z0[i]=(Av[i] + z0[i-1]) * (i+1) / (i+2);*/


     /*z0[i]=(Av[i] + z0[i-1])/ ( 2 - i / (i+1));*/


     /*

        Back substitute (obtain the result in z0)

        */

     z_max= fabs(z0[nn-1]);


     for (i=nn-2; i>=0; i--){


         z0[i]+=  z0[i+1] -  z0[i+1]/ (i+2);


         /*z0[i]+=  z0[i+1] * (i+1) / (i+2);*/


         tt=fabs(z0[i]);


         if (tt > z_max)

             z_max=tt;


     }

     *zMax=z_max;


 }


 /*

 */


 void Rose(double *zMax, double *z0, double * Av, int nn){


     /*

        We use the Rose algorithm for solving the following linear system

        B * z0 = Av


        B=[ 2  -1   0    0;

        -1  2   -1   0;

        0  -1   2    -1;

        0   0   -1   2]


        z0 is the result,  Av is unchanged after the computation


        z0 is an nn dimensional vector


 */


     int i, m;

     double s=0, z_max;


     /*

        We follow the style in CLAPACK

        */

     m= nn % 5;

     if (m!=0){

         for (i=0;i<m; i++)

             s+=Av[i] * (i+1);

     }

     for(i=m;i<nn;i+=5)

         s+=   Av[i]   * (i+1)

             + Av[i+1] * (i+2)

             + Av[i+2] * (i+3)

             + Av[i+3] * (i+4)

             + Av[i+4] * (i+5);

     s/=(nn+1);


     /*

        from nn-1 to 0

        */

     z0[nn-1]=Av[nn-1]- s;

     for (i=nn-2;i >=0; i--){

         z0[i]=Av[i] + z0[i+1];

     }


     /*

        from 0 to nn-1

        */

     z_max= fabs(z0[0]);

     for (i=0; i<nn; i++){


         z0[i]+=  z0[i-1];


         s=fabs(z0[i]);


         if (s > z_max)

             z_max=s;


     }

     *zMax=z_max;


 }


 /*


 x=omega(z)


 v: the vector to be projected

 z: the approximate solution

 g: the gradient at z (g should be computed before calling this function


 nn: the length of z, g, and S (maximal length for S)


 n:  the length of x and v


 S: records the indices of the elements in the support set

 */


 int supportSet(double *x, double *v, double *z, double *g, int * S, double lambda, int nn){


     int i, j, n=nn+1, numS=0;

     double temp;


     /*

        we first scan z and g to obtain the support set S

        */


     /*numS: number of the elements in the support set S*/

     for(i=0;i<nn; i++){

         if ( ( (z[i]==lambda) && (g[i] < delta) ) || ( (z[i]==-lambda) && (g[i] >delta) )){

             S[numS]=i;

             numS++;

         }

     }


     /*

        printf("\n %d",numS);

        */


     if (numS==0){ /*this shows that S is empty*/

         temp=0;

         for (i=0;i<n;i++)

             temp+=v[i];


         temp=temp/n;

         for(i=0;i<n;i++)

             x[i]=temp;


         return numS;

     }


     /*

        Next, we deal with numS >=1

        */


     /*process the first block


       j=0

       */

     temp=0;

     for (i=0;i<=S[0]; i++)

         temp+=v[i];

     /*temp =sum (v [0: s[0] ]*/

     temp=( temp + z[ S[0] ] ) / (S[0] +1);

     for (i=0;i<=S[0]; i++)

         x[i]=temp;


     /*process the middle blocks


       If numS=1, it belongs the last block

       */

     for (j=1; j < numS; j++){

         temp=0;

         for (i= S[j-1] +1; i<= S[j]; i++){

             temp+=v[i];

         }


         /*temp =sum (v [ S[j-1] +1: s[j] ]*/


         temp=(temp - z[ S[j-1] ] + z[ S[j] ])/ (S[j]- S[j-1]);


         for (i= S[j-1] +1; i<= S[j]; i++){

             x[i]=temp;

         }

     }


     /*process the last block

       j=numS-1;

       */

     temp=0;

     for (i=S[numS-1] +1 ;i< n; i++)

         temp+=v[i];

     /*temp =sum (v [  (S[numS-1] +1): (n-1) ]*/


     temp=( temp - z[ S[numS-1] ] ) / (nn - S[numS-1]); /*S[numS-1] <= nn-1*/


     for (i=S[numS-1] +1 ;i< n; i++)

         x[i]=temp;


     return numS;


 }


 /*


 we compute the duality corresponding the solution z


 z: the approximate solution

 g: the gradient at z (we recompute the gradient)

 s: an auxiliary variable

 Av: A*v


 nn: the lenght for z, g, s, and Av


 The variables g and s shall be revised.


 The variables z and Av remain unchanged.

 */


 void dualityGap(double *gap, double *z, double *g, double *s, double *Av, double lambda, int nn){


     int i, m;

     double temp;


     g[0]=z[0] + z[0] - z[1] - Av[0];

     for (i=1;i<nn-1;i++){

         g[i]= - z[i-1] + z[i] + z[i] - z[i+1] - Av[i];

     }

     g[nn-1]= -z[nn-2] + z[nn-1] + z[nn-1] - Av[nn-1];


     for (i=0;i<nn;i++)

         if (g[i]>0)

             s[i]=lambda + z[i];

         else

             s[i]=-lambda + z[i];


     temp=0;

     m=nn%5;


     if (m!=0){

         for(i=0;i<m;i++)

             temp+=s[i]*g[i];

     }


     for(i=m;i<nn;i+=5)

         temp=temp + s[i]  *g[i]

             + s[i+1]*g[i+1]

             + s[i+2]*g[i+2]

             + s[i+3]*g[i+3]

             + s[i+4]*g[i+4];

     *gap=temp;

 }


 /*

    Similar to dualityGap,


    The difference is that, we assume that g has been computed.

    */


 void dualityGap2(double *gap, double *z, double *g, double *s, double *Av, double lambda, int nn){


     int i, m;

     double temp;


     /*

        g[0]=z[0] + z[0] - z[1] - Av[0];

        for (i=1;i<nn-1;i++){

        g[i]= - z[i-1] + z[i] + z[i] - z[i+1] - Av[i];

        }

        g[nn-1]= -z[nn-2] + z[nn-1] + z[nn-1] - Av[nn-1];


 */


     for (i=0;i<nn;i++)

         if (g[i]>0)

             s[i]=lambda + z[i];

         else

             s[i]=-lambda + z[i];


     temp=0;

     m=nn%5;


     if (m!=0){

         for(i=0;i<m;i++)

             temp+=s[i]*g[i];

     }


     for(i=m;i<nn;i+=5)

         temp=temp + s[i]  *g[i]

             + s[i+1]*g[i+1]

             + s[i+2]*g[i+2]

             + s[i+3]*g[i+3]

             + s[i+4]*g[i+4];

     *gap=temp;

 }


 /*

 generateSolution:


 generate the solution x based on the information of z and g

 (!!!!we assume that g has been computed as the gradient of z!!!!)


 */


 int generateSolution(double *x, double *z, double *gap,

         double *v, double *Av,

         double *g, double *s, int *S,

         double lambda, int nn){


     int i, m, numS, n=nn+1;

     double temp, funVal1, funVal2;


     /*

        z is the appropriate solution,

        and g contains its gradient

        */


     /*

        We assume that n>=3, and thus nn>=2


        We have two ways for recovering x.

        The first way is x = v - A^T z

        The second way is x =omega(z)

        */


     temp=0;

     m=nn%5;

     if (m!=0){

         for (i=0;i<m;i++)

             temp+=z[i]*(g[i] + Av[i]);

     }

     for (i=m;i<nn;i+=5)

         temp=temp + z[i]  *(g[i]   + Av[i])

             + z[i+1]*(g[i+1] + Av[i+1])

             + z[i+2]*(g[i+2] + Av[i+2])

             + z[i+3]*(g[i+3] + Av[i+3])

             + z[i+4]*(g[i+4] + Av[i+4]);

     funVal1=temp /2;


     temp=0;

     m=nn%5;

     if (m!=0){

         for (i=0;i<m;i++)

             temp+=fabs(g[i]);

     }

     for (i=m;i<nn;i+=5)

         temp=temp + fabs(g[i])

             + fabs(g[i+1])

             + fabs(g[i+2])

             + fabs(g[i+3])

             + fabs(g[i+4]);

     funVal1=funVal1+ temp*lambda;


     /*

        we compute the solution by the second way

        */


     numS= supportSet(x, v, z, g, S, lambda, nn);


     /*

        we compute the objective function of x computed in the second way

        */


     temp=0;

     m=n%5;

     if (m!=0){

         for (i=0;i<m;i++)

             temp+=(x[i]-v[i]) * (x[i]-v[i]);

     }

     for (i=m;i<n;i+=5)

         temp=temp + (x[i]-  v[i]) * (  x[i]-  v[i])

             + (x[i+1]-v[i+1]) * (x[i+1]-v[i+1])

             + (x[i+2]-v[i+2]) * (x[i+2]-v[i+2])

             + (x[i+3]-v[i+3]) * (x[i+3]-v[i+3])

             + (x[i+4]-v[i+4]) * (x[i+4]-v[i+4]);

     funVal2=temp/2;


     temp=0;

     m=nn%5;

     if (m!=0){

         for (i=0;i<m;i++)

             temp+=fabs( x[i+1]-x[i] );

     }

     for (i=m;i<nn;i+=5)

         temp=temp + fabs( x[i+1]-x[i] )

             + fabs( x[i+2]-x[i+1] )

             + fabs( x[i+3]-x[i+2] )

             + fabs( x[i+4]-x[i+3] )

             + fabs( x[i+5]-x[i+4] );

     funVal2=funVal2 + lambda * temp;


     /*

        printf("\n    funVal1=%e, funVal2=%e, diff=%e\n", funVal1, funVal2, funVal1-funVal2);

        */


     if (funVal2 > funVal1){  /*

                                 we compute the solution by the first way

                                 */

         x[0]=v[0] + z[0];

         for(i=1;i<n-1;i++)

             x[i]= v[i] - z[i-1] + z[i];

         x[n-1]=v[n-1] - z[n-2];

     }

     else{


         /*

            the solution x is computed in the second way

            the gap can be further reduced

            (note that, there might be numerical error)

            */


         *gap=*gap - (funVal1- funVal2);

         if (*gap <0)

             *gap=0;

     }


     return (numS);

 }


 void restartMapping(double *g, double *z,  double * v,

         double lambda, int nn)

 {


     int i, n=nn+1;

     double temp;

     int* S=(int *) malloc(sizeof(int)*nn);

     double *x=(double *)malloc(sizeof(double)*n);

     double *s=(double *)malloc(sizeof(double)*nn);

     double *Av=(double *)malloc(sizeof(double)*nn);

     //int numS=-1;


     /*

        for a given input z,

        we compute the z0 after restarting


        The elements in z lie in [-lambda, lambda]


        The returned value is g

        */


     for (i=0;i<nn; i++)

         Av[i]=v[i+1]-v[i];


     g[0]=z[0] + z[0] - z[1] - Av[0];

     for (i=1;i<nn-1;i++){

         g[i]= - z[i-1] + z[i] + z[i] - z[i+1] - Av[i];

     }

     g[nn-1]= -z[nn-2] + z[nn-1] + z[nn-1] - Av[nn-1];


     //numS = supportSet(x, v, z, g, S, lambda, nn);


     /*With x, we compute z via

       AA^T z = Av - Ax

       */


     /*

        compute s= Av -Ax

        */


     for (i=0;i<nn; i++)

         s[i]=Av[i] - x[i+1] + x[i];


     /*

        Apply Rose Algorithm for solving z

        */


     Thomas(&temp, g, s, nn);


     /*

        Rose(&temp, g, s, nn);

        */


     /*

        project g to [-lambda, lambda]

        */


     for(i=0;i<nn;i++){

         if (g[i]>lambda)

             g[i]=lambda;

         else

             if (g[i]<-lambda)

                 g[i]=-lambda;

     }


     free (S);

     free (x);

     free (s);

     free (Av);


 }


 /*


 Our objective is to solve the fused Lasso signal approximator (flsa) problem:


 min_x  g(x) 1/2 \|x-v\|^2  + lambda \|A x\|_1,                      (1)


 Let x* be the solution (which is unique), it satisfies


 0 in  x* - v +  A^T * lambda *SGN(Ax*)                     (2)


 To solve x*, it suffices to find


 y*  in A^T * lambda *SGN(Ax*)                              (3)

 that satisfies


 x* - v + y* =0                                             (4)

 which leads to

 x*= v - y*                                                 (5)


 Due to the uniqueness of x*, we conclude that y* is unique.


 As y* is a subgradient of lambda \|A x*\|_1,

 we name our method as Subgradient Finding Algorithm (sfa).


 y* in (3) can be further written as


 y*= A^T * z*                                               (6)

 where


 z* in lambda* SGN (Ax*)                                    (7)


 From (6), we have

 z* = (A A^T)^{-1} A * y*                                   (8)


 Therefore, from the uqniueness of y*, we conclude that z* is also unique.

 Next, we discuss how to solve this unique z*.


 The problem (1) can reformulated as the following equivalent problem:


 min_x  max_z  f(x, z)= 1/2 \|x-v\|^2  + <A x, z>

 subject to   \|z\|_{infty} \leq lambda                                  (9)


 At the saddle point, we have


 x = v - AT z,                                            (10)


 which somehow concides with (5) and (6)


 Plugging (10) into (9), we obtain the problem


 min_z  1/2  z^T A AT z - < z, A v>,

 subject to  \|z\|_{infty} \leq lambda,                             (11)


 In this program, we apply the Nesterov's method for solving (11).


 Duality gap:


 At a given point z0, we compute x0= v - A^T z0.

 It is easy to show that

 min_x f(x, z0) = f(x0, z0) <= max_z f(x0, z)               (12)


 Moreover, we have

 max_z f(x0, z) - min_x f(x, z0)

 <= lambda * \|A x0\|_1 - < z0, Av - A A^T z0>           (13)


 It is also to get that


 f(x0, z0) <= f(x*, z*) <= max_z f(x0, z)                   (14)


 g(x*)=f(x*, z*)                                            (15)


 g(x0)=max_z f(x0, z)                                       (17)


     Therefore, we have


 g(x0)-g(x*) <= lambda * \|A x0\|_1 - < z0, Av - A A^T z0>  (18)


     We have applied a restarting technique, which is quite involved; and thus, we do not explain here.


         */


         /*


         For sfa, the stepsize of the Nesterov's method is fixed to 1/4, so that no line search is needed.


         Explanation of the parameters:


         Output parameters

         x:    the solution to the primal problem

         gap:  the duality gap (pointer)


         Input parameters

         z:    the solution to the dual problem (before calling this function, z contains a starting point)

         !!!!we assume that the starting point has been successfully initialized in z !!!!

         z0:   a variable used for multiple purposes:

         1) the previous solution z0

         2) the difference between z and z0, i.e., z0=z- z0


         lambda:   the regularization parameter (and the radius of the infity ball, see (11)).

         nn:       the length of z, z0, Av, g, and s

         maxStep:  the maximal number of iterations


         v:    the point to be projected (not changed after the program)

         Av:   A*v (not changed after the program)


         s:        the search point (used for multiple purposes)

         g:        the gradient at g (and it is also used for multiple purposes)


         tol:      the tolerance of the gap

         tau:  the duality gap or the restarting technique is done every tau steps

         flag: if flag=1,  we apply the resart technique

         flag=2,  just run the SFA algorithm, terminate it when the absolution change is less than tol

         flag=3,  just run the SFA algorithm, terminate it when the duality gap is less than tol

         flag=4,  just run the SFA algorithm, terminate it when the relative duality gap is less than tol


         We would like to emphasis that the following assumptions

         have been checked in the functions that call this function:

         1) 0< lambda < z_max

         2) nn >=2

         3) z has been initialized with a starting point

         4) z0 has been initialized with all zeros


         The termination condition is checked every tau iterations.


         For the duality gap, please refer to (12-18)

         */


         int sfa(double *x,     double *gap, int * activeS,

                 double *z,     double *z0,   double * v,   double * Av,

                 double lambda, int nn,       int maxStep,

                 double *s,     double *g,

                 double tol,    int tau,       int flag){


             int i, iterStep, m, tFlag=0, n=nn+1;

             double alphap=0, alpha=1, beta=0, temp;

             int* S=(int *) malloc(sizeof(int)*nn);

             double gapp=-1, gappp=-1;   /*gapp denotes the previous gap*/

             int numS=-1, numSp=-2, numSpp=-3;;

             /*

                numS denotes the number of elements in the Support Set S

                numSp denotes the number of elements in the previous Support Set S

                */


             *gap=-1; /*initial a value -1*/


             /*

                The main algorithm by Nesterov's method


                B is an nn x nn tridiagonal matrix.


                The nn eigenvalues of B are 2- 2 cos (i * PI/ n), i=1, 2, ..., nn

                */


             for (iterStep=1; iterStep<=maxStep; iterStep++){


                 /*-------------   Step 1 ---------------------*/


                 beta=(alphap -1 ) / alpha;

                 /*

                    compute search point


                    s= z + beta * z0


                    We follow the style of CLAPACK

                    */

                 m=nn % 5;

                 if (m!=0){

                     for (i=0;i<m; i++)

                         s[i]=z[i]+ beta* z0[i];

                 }

                 for (i=m;i<nn;i+=5){

                     s[i]   =z[i]   + beta* z0[i];

                     s[i+1] =z[i+1] + beta* z0[i+1];

                     s[i+2] =z[i+2] + beta* z0[i+2];

                     s[i+3] =z[i+3] + beta* z0[i+3];

                     s[i+4] =z[i+4] + beta* z0[i+4];

                 }


                 /*

                    s and g are of size nn x 1


                    compute the gradient at s


                    g= B * s - Av,


                    where B is an nn x nn tridiagonal matrix. and is defined as


                    B= [ 2  -1   0    0;

                    -1  2   -1   0;

                    0  -1   2    -1;

                    0   0   -1   2]


                    We assume n>=3, which leads to nn>=2

                    */

                 g[0]=s[0] + s[0] - s[1] - Av[0];

                 for (i=1;i<nn-1;i++){

                     g[i]= - s[i-1] + s[i] + s[i] - s[i+1] - Av[i];

                 }

                 g[nn-1]= -s[nn-2] + s[nn-1] + s[nn-1] - Av[nn-1];


                 /*

                    z0 stores the previous -z

                    */

                 m=nn%7;

                 if (m!=0){

                     for (i=0;i<m;i++)

                         z0[i]=-z[i];

                 }

                 for (i=m; i <nn; i+=7){

                     z0[i]   = - z[i];

                     z0[i+1] = - z[i+1];

                     z0[i+2] = - z[i+2];

                     z0[i+3] = - z[i+3];

                     z0[i+4] = - z[i+4];

                     z0[i+5] = - z[i+5];

                     z0[i+6] = - z[i+6];

                 }


                 /*

                    do a gradient step based on s to get z

                    */

                 m=nn%5;

                 if (m!=0){

                     for(i=0;i<m; i++)

                         z[i]=s[i] - g[i]/4;

                 }

                 for (i=m;i<nn; i+=5){

                     z[i]   = s[i]   -  g[i]  /4;

                     z[i+1] = s[i+1] -  g[i+1]/4;

                     z[i+2] = s[i+2] -  g[i+2]/4;

                     z[i+3] = s[i+3] -  g[i+3]/4;

                     z[i+4] = s[i+4] -  g[i+4]/4;

                 }


                 /*

                    project z onto the L_{infty} ball with radius lambda


                    z is the new approximate solution

                    */

                 for (i=0;i<nn; i++){

                     if (z[i]>lambda)

                         z[i]=lambda;

                     else

                         if (z[i]<-lambda)

                             z[i]=-lambda;

                 }


                 /*

                    compute the difference between the new solution

                    and the previous solution (stored in z0=-z_p)


                    the difference is written to z0

                    */


                 m=nn%5;

                 if (m!=0){

                     for (i=0;i<m;i++)

                         z0[i]+=z[i];

                 }

                 for(i=m;i<nn; i+=5){

                     z0[i]  +=z[i];

                     z0[i+1]+=z[i+1];

                     z0[i+2]+=z[i+2];

                     z0[i+3]+=z[i+3];

                     z0[i+4]+=z[i+4];

                 }


                 alphap=alpha;

                 alpha=(1+sqrt(4*alpha*alpha+1))/2;


                 /*

                    check the termination condition

                    */

                 if (iterStep%tau==0){


                     /*

                        The variables g and s can be modified


                        The variables x, z0 and z can be revised for case 0, but not for the rest

                        */

                     switch (flag){

                         case 1:


                             /*


                                terminate the program once the "duality gap" is smaller than tol


                                compute the duality gap:


                                x= v - A^T z

                                Ax = Av - A A^T z = -g,

                                where

                                g = A A^T z - A v


                                the duality gap= lambda * \|Ax\|-1 - <z, Ax>

                                = lambda * \|g\|_1 + <z, g>


                                In fact, gap=0 indicates that,

                                if g_i >0, then z_i=-lambda

                                if g_i <0, then z_i=lambda

                                */


                             gappp=gapp;

                             gapp=*gap;  /*record the previous gap*/

                             numSpp=numSp;

                             numSp=numS; /*record the previous numS*/


                             dualityGap(gap, z, g, s, Av, lambda, nn);

                             /*g is computed as the gradient of z in this function*/


                             /*

                                printf("\n Iteration: %d, gap=%e, numS=%d", iterStep, *gap, numS);

                                */


                             /*

                                If *gap <=tol, we terminate the iteration

                                Otherwise, we restart the algorithm

                                */


                             if (*gap <=tol){

                                 tFlag=1;

                                 break;


                             } /* end of *gap <=tol */

                             else{


                                 /* we apply the restarting technique*/


                                 /*

                                    we compute the solution by the second way

                                    */

                                 numS = supportSet(x, v, z, g, S, lambda, nn);

                                 /*g, the gradient of z should be computed before calling this function*/


                                 /*With x, we compute z via

                                   AA^T z = Av - Ax

                                   */


                                 /*

                                    printf("\n iterStep=%d, numS=%d, gap=%e",iterStep, numS, *gap);

                                    */


                                 m=1;

                                 if (nn > 1000000)

                                     m=10;

                                 else

                                     if (nn > 100000)

                                         m=5;


                                 if ( abs(numS-numSp) < m){


                                     numS=generateSolution(x, z, gap, v, Av,

                                             g, s, S, lambda, nn);

                                     /*g, the gradient of z should be computed before calling this function*/


                                     if (*gap <tol){

                                         tFlag=2;     /*tFlag =2 shows that the result is already optimal

                                                        There is no need to call generateSolution for recomputing the best solution

                                                        */

                                         break;

                                     }


                                     if ( (*gap ==gappp) && (numS==numSpp) ){


                                         tFlag=2;

                                         break;


                                     }


                                     /*we terminate the program is *gap <1

                                       numS==numSP

                                       and gapp==*gap

                                       */

                                 }


                                 /*

                                    compute s= Av -Ax

                                    */

                                 for (i=0;i<nn; i++)

                                     s[i]=Av[i] - x[i+1] + x[i];


                                 /*

                                    apply Rose Algorithm for solving z

                                    */


                                 Thomas(&temp, z, s, nn);


                                 /*

                                    Rose(&temp, z, s, nn);

                                    */


                                 /*

                                    printf("\n Iteration: %d, %e", iterStep, temp);

                                    */


                                 /*

                                    project z to [-lambda2, lambda2]

                                    */

                                 for(i=0;i<nn;i++){

                                     if (z[i]>lambda)

                                         z[i]=lambda;

                                     else

                                         if (z[i]<-lambda)

                                             z[i]=-lambda;

                                 }


                                 m=nn%7;

                                 if (m!=0){

                                     for (i=0;i<m;i++)

                                         z0[i]=0;

                                 }

                                 for (i=m; i<nn; i+=7){

                                     z0[i]   = z0[i+1]

                                         = z0[i+2]

                                         = z0[i+3]

                                         = z0[i+4]

                                         = z0[i+5]

                                         = z0[i+6]

                                         =0;

                                 }


                                 alphap=0; alpha=1;


                                 /*

                                    we restart the algorithm

                                    */


                             }


                             break; /*break case 1*/


                         case 2:


                             /*

                                The program is terminated either the summation of the absolution change (denoted by z0)

                                of z (from the previous zp) is less than tol * nn,

                                or the maximal number of iteration (maxStep) is achieved

 Note: tol indeed measures the averaged per element change.

 */

                             temp=0;

                             m=nn%5;

                             if (m!=0){

                                 for(i=0;i<m;i++)

                                     temp+=fabs(z0[i]);

                             }

                             for(i=m;i<nn;i+=5)

                                 temp=temp + fabs(z0[i])

                                     + fabs(z0[i+1])

                                     + fabs(z0[i+2])

                                     + fabs(z0[i+3])

                                     + fabs(z0[i+4]);

                             *gap=temp / nn;


                             if (*gap <=tol){


                                 tFlag=1;

                             }


                             break;


                         case 3:


                             /*


                                terminate the program once the "duality gap" is smaller than tol


                                compute the duality gap:


                                x= v - A^T z

                                Ax = Av - A A^T z = -g,

                                where

                                g = A A^T z - A v


                                the duality gap= lambda * \|Ax\|-1 - <z, Ax>

                                = lambda * \|g\|_1 + <z, g>


                                In fact, gap=0 indicates that,

                                if g_i >0, then z_i=-lambda

                                if g_i <0, then z_i=lambda

                                */


                             g[0]=z[0] + z[0] - z[1] - Av[0];

                             for (i=1;i<nn-1;i++){

                                 g[i]= - z[i-1] + z[i] + z[i] - z[i+1] - Av[i];

                             }


                             g[nn-1]= -z[nn-2] + z[nn-1] + z[nn-1] - Av[nn-1];


                             for (i=0;i<nn;i++)

                                 if (g[i]>0)

                                     s[i]=lambda + z[i];

                                 else

                                     s[i]=-lambda + z[i];


                             temp=0;

                             m=nn%5;

                             if (m!=0){

                                 for(i=0;i<m;i++)

                                     temp+=s[i]*g[i];

                             }

                             for(i=m;i<nn;i+=5)

                                 temp=temp + s[i]  *g[i]

                                     + s[i+1]*g[i+1]

                                     + s[i+2]*g[i+2]

                                     + s[i+3]*g[i+3]

                                     + s[i+4]*g[i+4];

                             *gap=temp;


                             /*

                                printf("\n %e", *gap);

                                */


                             if (*gap <=tol)

                                 tFlag=1;


                             break;


                         case 4:


                             /*


                                terminate the program once the "relative duality gap" is smaller than tol


                                compute the duality gap:


                                x= v - A^T z

                                Ax = Av - A A^T z = -g,

                                where

                                g = A A^T z - A v


                                the duality gap= lambda * \|Ax\|-1 - <z, Ax>

                                = lambda * \|g\|_1 + <z, g>


                                In fact, gap=0 indicates that,

                                if g_i >0, then z_i=-lambda

                                if g_i <0, then z_i=lambda


                                Here, the "relative duality gap" is defined as:

                                duality gap / - 1/2 \|A^T z\|^2 + < z, Av>


                                We efficiently compute - 1/2 \|A^T z\|^2 + < z, Av> using the following relationship


                                - 1/2 \|A^T z\|^2 + < z, Av>

                                = -1/2 <z, A A^T z - Av -Av>

                                = -1/2 <z, g - Av>

                                */


                             g[0]=z[0] + z[0] - z[1] - Av[0];

                             for (i=1;i<nn-1;i++){

                                 g[i]= - z[i-1] + z[i] + z[i] - z[i+1] - Av[i];

                             }


                             g[nn-1]= -z[nn-2] + z[nn-1] + z[nn-1] - Av[nn-1];


                             for (i=0;i<nn;i++)

                                 if (g[i]>0)

                                     s[i]=lambda + z[i];

                                 else

                                     s[i]=-lambda + z[i];


                             temp=0;

                             m=nn%5;

                             if (m!=0){

                                 for(i=0;i<m;i++)

                                     temp+=s[i]*g[i];

                             }

                             for(i=m;i<nn;i+=5)

                                 temp=temp + s[i]  *g[i]

                                     + s[i+1]*g[i+1]

                                     + s[i+2]*g[i+2]

                                     + s[i+3]*g[i+3]

                                     + s[i+4]*g[i+4];

                             *gap=temp;

                             /*

                                Now, *gap contains the duality gap

                                Next, we compute

                                - 1/2 \|A^T z\|^2 + < z, Av>

                                =-1/2 <z, g - Av>

                                */


                             temp=0;

                             m=nn%5;

                             if (m!=0){

                                 for(i=0;i<m;i++)

                                     temp+=z[i] * (g[i] - Av[i]);

                             }

                             for(i=m;i<nn;i+=5)

                                 temp=temp + z[i]  * (g[i] -  Av[i])

                                     + z[i+1]* (g[i+1]- Av[i+1])

                                     + z[i+2]* (g[i+2]- Av[i+2])

                                     + z[i+3]* (g[i+3]- Av[i+3])

                                     + z[i+4]* (g[i+4]- Av[i+4]);

                             temp=fabs(temp) /2;


                             if (temp <1)

                                 temp=1;


                             *gap/=temp;

                             /*

                              *gap now contains the relative gap

                              */


                             if (*gap <=tol){

                                 tFlag=1;

                             }


                             break;


                         default:


                             /*

                                The program is terminated either the summation of the absolution change (denoted by z0)

                                of z (from the previous zp) is less than tol * nn,

                                or the maximal number of iteration (maxStep) is achieved

 Note: tol indeed measures the averaged per element change.

 */

                             temp=0;

                             m=nn%5;

                             if (m!=0){

                                 for(i=0;i<m;i++)

                                     temp+=fabs(z0[i]);

                             }

                             for(i=m;i<nn;i+=5)

                                 temp=temp + fabs(z0[i])

                                     + fabs(z0[i+1])

                                     + fabs(z0[i+2])

                                     + fabs(z0[i+3])

                                     + fabs(z0[i+4]);

                             *gap=temp / nn;


                             if (*gap <=tol){


                                 tFlag=1;

                             }


                             break;


                     }/*end of switch*/


                     if (tFlag)

                         break;


                 }/* end of the if for checking the termination condition */


                 /*-------------- Step 3 --------------------*/


             }


             /*

                for the other cases, except flag=1, compute the solution x according the first way (the primal-dual way)

                */


             if ( (flag !=1) || (tFlag==0) ){

                 x[0]=v[0] + z[0];

                 for(i=1;i<n-1;i++)

                     x[i]= v[i] - z[i-1] + z[i];

                 x[n-1]=v[n-1] - z[n-2];

             }


             if ( (flag==1) && (tFlag==1)){


                 /*

                    We assume that n>=3, and thus nn>=2


                    We have two ways for recovering x.

                    The first way is x = v - A^T z

                    The second way is x =omega(z)

                    */


                 /*

                    We first compute the objective function value of the first choice in terms f(x), see our paper

                    */


                 /*

                    for numerical reason, we do a gradient descent step

                    */


                 /*

                    ---------------------------------------------------

                    A gradient step  begins

                    */

                 g[0]=z[0] + z[0] - z[1] - Av[0];

                 for (i=1;i<nn-1;i++){

                     g[i]= - z[i-1] + z[i] + z[i] - z[i+1] - Av[i];

                 }

                 g[nn-1]= -z[nn-2] + z[nn-1] + z[nn-1] - Av[nn-1];


                 /*

                    do a gradient step based on z to get the new z

                    */

                 m=nn%5;

                 if (m!=0){

                     for(i=0;i<m; i++)

                         z[i]=z[i] - g[i]/4;

                 }

                 for (i=m;i<nn; i+=5){

                     z[i]   = z[i]   -  g[i]  /4;

                     z[i+1] = z[i+1] -  g[i+1]/4;

                     z[i+2] = z[i+2] -  g[i+2]/4;

                     z[i+3] = z[i+3] -  g[i+3]/4;

                     z[i+4] = z[i+4] -  g[i+4]/4;

                 }


                 /*

                    project z onto the L_{infty} ball with radius lambda


                    z is the new approximate solution

                    */

                 for (i=0;i<nn; i++){

                     if (z[i]>lambda)

                         z[i]=lambda;

                     else

                         if (z[i]<-lambda)

                             z[i]=-lambda;

                 }


                 /*

                    ---------------------------------------------------

                    A gradient descent step ends

                    */


                 /*compute the gradient at z*/


                 g[0]=z[0] + z[0] - z[1] - Av[0];

                 for (i=1;i<nn-1;i++){

                     g[i]= - z[i-1] + z[i] + z[i] - z[i+1] - Av[i];

                 }

                 g[nn-1]= -z[nn-2] + z[nn-1] + z[nn-1] - Av[nn-1];


                 numS=generateSolution(x, z, gap, v, Av,

                         g, s, S, lambda, nn);

                 /*g, the gradient of z should be computed before calling this function*/


             }


             free (S);

             /*

                free the variables S

                */


             *activeS=numS;

             return (iterStep);


         }


 /*


    Refer to sfa for the defintions of the variables


    In this file, we restart the program every step, and neglect the gradient step.


    It seems that, this program does not converge.


    This function shows that the gradient step is necessary.

    */


 int sfa_special(double *x,     double *gap,  int * activeS,

         double *z,     double * v,   double * Av,

         double lambda, int nn,       int maxStep,

         double *s,     double *g,

         double tol,    int tau){


     int i, iterStep;

     //int tFlag=0;

     //int n=nn+1;

     double temp;

     int* S=(int *) malloc(sizeof(int)*nn);

     double gapp=-1; /*gapp denotes the previous gap*/

     int numS=-1, numSp=-1;

     /*

        numS denotes the number of elements in the Support Set S

        numSp denotes the number of elements in the previous Support Set S

        */


     *gap=-1; /*initialize *gap a value*/


     for (iterStep=1; iterStep<=maxStep; iterStep++){


         g[0]=z[0] + z[0] - z[1] - Av[0];

         for (i=1;i<nn-1;i++){

             g[i]= - z[i-1] + z[i] + z[i] - z[i+1] - Av[i];

         }

         g[nn-1]= -z[nn-2] + z[nn-1] + z[nn-1] - Av[nn-1];


         numSp=numS; /*record the previous numS*/

         numS = supportSet(x, v, z, g, S, lambda, nn);


         /*With x, we compute z via

           AA^T z = Av - Ax

           */


         /*

            compute s= Av -Ax

            */


         for (i=0;i<nn; i++)

             s[i]=Av[i] - x[i+1] + x[i];


         /*

            Apply Rose Algorithm for solving z

            */


         Thomas(&temp, z, s, nn);


         /*

            Rose(&temp, z, s, nn);

            */


         /*

            project z to [-lambda, lambda]

            */


         for(i=0;i<nn;i++){

             if (z[i]>lambda)

                 z[i]=lambda;

             else

                 if (z[i]<-lambda)

                     z[i]=-lambda;

         }


         if (iterStep%tau==0){

             gapp=*gap;  /*record the previous gap*/


             dualityGap(gap, z, g, s, Av, lambda, nn);


             /*

                printf("\n iterStep=%d, numS=%d, gap=%e, diff=%e",iterStep, numS, *gap, *gap -gapp);


 */


             if (*gap <=tol){

                 //tFlag=1;

                 break;

             }


             if ( (*gap <1) && (numS==numSp) && (gapp == *gap) ){

                 //tFlag=1;

                 break;

                 /*we terminate the program is *gap <1

                   numS==numSP

                   and gapp==*gap

                   */

             }


         }/*end of if tau*/


     }/*end for */


     free (S);


     * activeS=numS;

     return(iterStep);


 }


 /*


    We do one gradient descent, and then restart the program

    */


 int sfa_one(double *x,     double *gap, int * activeS,

         double *z,     double * v,   double * Av,

         double lambda, int nn,       int maxStep,

         double *s,     double *g,

         double tol,    int tau){


     int i, iterStep, m;

     int tFlag=0;

     //int n=nn+1;

     double temp;

     int* S=(int *) malloc(sizeof(int)*nn);

     double gapp=-1, gappp=-2;   /*gapp denotes the previous gap*/

     int numS=-100, numSp=-200, numSpp=-300;

     /*

        numS denotes the number of elements in the Support Set S

        numSp denotes the number of elements in the previous Support Set S

        */


     *gap=-1; /*initialize *gap a value*/


     /*

        The main algorithm by Nesterov's method


        B is an nn x nn tridiagonal matrix.


        The nn eigenvalues of B are 2- 2 cos (i * PI/ n), i=1, 2, ..., nn

        */


     /*

        we first do a gradient step based on z

        */


     /*

        ---------------------------------------------------

        A gradient step  begins

        */

     g[0]=z[0] + z[0] - z[1] - Av[0];

     for (i=1;i<nn-1;i++){

         g[i]= - z[i-1] + z[i] + z[i] - z[i+1] - Av[i];

     }

     g[nn-1]= -z[nn-2] + z[nn-1] + z[nn-1] - Av[nn-1];


     /*

        do a gradient step based on z to get the new z

        */

     m=nn%5;

     if (m!=0){

         for(i=0;i<m; i++)

             z[i]=z[i] - g[i]/4;

     }

     for (i=m;i<nn; i+=5){

         z[i]   = z[i]   -  g[i]  /4;

         z[i+1] = z[i+1] -  g[i+1]/4;

         z[i+2] = z[i+2] -  g[i+2]/4;

         z[i+3] = z[i+3] -  g[i+3]/4;

         z[i+4] = z[i+4] -  g[i+4]/4;

     }


     /*

        project z onto the L_{infty} ball with radius lambda


        z is the new approximate solution

        */

     for (i=0;i<nn; i++){

         if (z[i]>lambda)

             z[i]=lambda;

         else

             if (z[i]<-lambda)

                 z[i]=-lambda;

     }


     /*

        ---------------------------------------------------

        A gradient descent step ends

        */


     /*compute the gradient at z*/


     g[0]=z[0] + z[0] - z[1] - Av[0];

     for (i=1;i<nn-1;i++){

         g[i]= - z[i-1] + z[i] + z[i] - z[i+1] - Av[i];

     }

     g[nn-1]= -z[nn-2] + z[nn-1] + z[nn-1] - Av[nn-1];


     for (iterStep=1; iterStep<=maxStep; iterStep++){


         /*

            ---------------------------------------------------

            restart the algorithm with x=omega(z)

            */


         numSpp=numSp;

         numSp=numS; /*record the previous numS*/

         numS = supportSet(x, v, z, g, S, lambda, nn);


         /*With x, we compute z via

           AA^T z = Av - Ax

           */


         /*

            compute s= Av -Ax

            */


         for (i=0;i<nn; i++)

             s[i]=Av[i] - x[i+1] + x[i];


         /*

            Apply Rose Algorithm for solving z

            */


         Thomas(&temp, z, s, nn);


         /*

            Rose(&temp, z, s, nn);

            */


         /*

            project z to [-lambda, lambda]

            */


         for(i=0;i<nn;i++){

             if (z[i]>lambda)

                 z[i]=lambda;

             else

                 if (z[i]<-lambda)

                     z[i]=-lambda;

         }


         /*

            ---------------------------------------------------

            restart the algorithm with x=omega(z)


            we have computed a new z, based on the above relationship

            */


         /*

            ---------------------------------------------------

            A gradient step  begins

            */

         g[0]=z[0] + z[0] - z[1] - Av[0];

         for (i=1;i<nn-1;i++){

             g[i]= - z[i-1] + z[i] + z[i] - z[i+1] - Av[i];

         }

         g[nn-1]= -z[nn-2] + z[nn-1] + z[nn-1] - Av[nn-1];


         /*

            do a gradient step based on z to get the new z

            */

         m=nn%5;

         if (m!=0){

             for(i=0;i<m; i++)

                 z[i]=z[i] - g[i]/4;

         }

         for (i=m;i<nn; i+=5){

             z[i]   = z[i]   -  g[i]  /4;

             z[i+1] = z[i+1] -  g[i+1]/4;

             z[i+2] = z[i+2] -  g[i+2]/4;

             z[i+3] = z[i+3] -  g[i+3]/4;

             z[i+4] = z[i+4] -  g[i+4]/4;

         }


         /*

            project z onto the L_{infty} ball with radius lambda


            z is the new approximate solution

            */

         for (i=0;i<nn; i++){

             if (z[i]>lambda)

                 z[i]=lambda;

             else

                 if (z[i]<-lambda)

                     z[i]=-lambda;

         }


         /*

            ---------------------------------------------------

            A gradient descent step ends

            */


         /*compute the gradient at z*/


         g[0]=z[0] + z[0] - z[1] - Av[0];

         for (i=1;i<nn-1;i++){

             g[i]= - z[i-1] + z[i] + z[i] - z[i+1] - Av[i];

         }

         g[nn-1]= -z[nn-2] + z[nn-1] + z[nn-1] - Av[nn-1];


         if (iterStep % tau==0){

             gappp=gapp;

             gapp=*gap;  /*record the previous gap*/


             dualityGap2(gap, z, g, s, Av, lambda, nn);

             /*g, the gradient of z should be computed before calling this function*/


             /*

                printf("\n iterStep=%d, numS=%d, gap=%e",iterStep, numS, *gap);

                */


             /*

                printf("\n  %d  & %d   &  %2.0e \\\\ \n \\hline ",iterStep, numS, *gap);

                */


             /*

                printf("\n %e",*gap);

                */


             /*


                     printf("\n %d",numS);


 */


             if (*gap <=tol){

                 //tFlag=1;

                 break;

             }


             m=1;

             if (nn > 1000000)

                 m=5;

             else

                 if (nn > 100000)

                     m=3;


             if ( abs( numS-numSp) <m ){


                 /*

                    printf("\n numS=%d, numSp=%d",numS,numSp);

                    */


                 m=generateSolution(x, z, gap, v, Av,

                         g, s, S, lambda, nn);

                 /*g, the gradient of z should be computed before calling this function*/


                 if (*gap < tol){


                     numS=m;

                     tFlag=2;

                     break;

                 }


                 if ( (*gap ==gappp) && (numS==numSpp) ){


                     tFlag=2;

                     break;


                 }


             } /*end of if*/


         }/*end of if tau*/


     } /*end of for*/


     if (tFlag!=2){

         numS=generateSolution(x, z, gap, v, Av, g, s, S, lambda, nn);

         /*g, the gradient of z should be computed before calling this function*/

     }


     free(S);


     *activeS=numS;

     return(iterStep);

 }


 #endif //USE_GPL_SHOGUN

sfa.h