svm.cpp
上传用户:xgw_05
上传日期:2014-12-08
资源大小:2726k
文件大小:42k
- #include <math.h>
- #include <stdio.h>
- #include <stdlib.h>
- #include <ctype.h>
- #include <float.h>
- #include <string.h>
- #include <stdarg.h>
- #include "svm.h"
- typedef float Qfloat;
- typedef signed char schar;
- #ifndef min
- template <class T> inline T min(T x,T y) { return (x<y)?x:y; }
- #endif
- #ifndef max
- template <class T> inline T max(T x,T y) { return (x>y)?x:y; }
- #endif
- template <class T> inline void swap(T& x, T& y) { T t=x; x=y; y=t; }
- template <class S, class T> inline void clone(T*& dst, S* src, int n)
- {
- dst = new T[n];
- memcpy((void *)dst,(void *)src,sizeof(T)*n);
- }
- #define INF HUGE_VAL
- #define Malloc(type,n) (type *)malloc((n)*sizeof(type))
- #if 1
- void info(char *fmt,...)
- {
- va_list ap;
- va_start(ap,fmt);
- vprintf(fmt,ap);
- va_end(ap);
- }
- void info_flush()
- {
- fflush(stdout);
- }
- #else
- void info(char *fmt,...) {}
- void info_flush() {}
- #endif
- //
- // Kernel Cache
- //
- // l is the number of total data items
- // size is the cache size limit in bytes
- //
- class Cache
- {
- public:
- Cache(int l,int size);
- ~Cache();
- // request data [0,len)
- // return some position p where [p,len) need to be filled
- // (p >= len if nothing needs to be filled)
- int get_data(const int index, Qfloat **data, int len);
- void swap_index(int i, int j); // future_option
- private:
- int l;
- int size;
- struct head_t
- {
- head_t *prev, *next; // a cicular list
- Qfloat *data;
- int len; // data[0,len) is cached in this entry
- };
- head_t* head;
- head_t lru_head;
- void lru_delete(head_t *h);
- void lru_insert(head_t *h);
- };
- Cache::Cache(int l_,int size_):l(l_),size(size_)
- {
- head = (head_t *)calloc(l,sizeof(head_t)); // initialized to 0
- size /= sizeof(Qfloat);
- size -= l * sizeof(head_t) / sizeof(Qfloat);
- lru_head.next = lru_head.prev = &lru_head;
- }
- Cache::~Cache()
- {
- for(head_t *h = lru_head.next; h != &lru_head; h=h->next)
- free(h->data);
- free(head);
- }
- void Cache::lru_delete(head_t *h)
- {
- // delete from current location
- h->prev->next = h->next;
- h->next->prev = h->prev;
- }
- void Cache::lru_insert(head_t *h)
- {
- // insert to last position
- h->next = &lru_head;
- h->prev = lru_head.prev;
- h->prev->next = h;
- h->next->prev = h;
- }
- int Cache::get_data(const int index, Qfloat **data, int len)
- {
- head_t *h = &head[index];
- if(h->len) lru_delete(h);
- int more = len - h->len;
- if(more > 0)
- {
- // free old space
- while(size < more)
- {
- head_t *old = lru_head.next;
- lru_delete(old);
- free(old->data);
- size += old->len;
- old->data = 0;
- old->len = 0;
- }
- // allocate new space
- h->data = (Qfloat *)realloc(h->data,sizeof(Qfloat)*len);
- size -= more;
- swap(h->len,len);
- }
- lru_insert(h);
- *data = h->data;
- return len;
- }
- void Cache::swap_index(int i, int j)
- {
- if(i==j) return;
- if(head[i].len) lru_delete(&head[i]);
- if(head[j].len) lru_delete(&head[j]);
- swap(head[i].data,head[j].data);
- swap(head[i].len,head[j].len);
- if(head[i].len) lru_insert(&head[i]);
- if(head[j].len) lru_insert(&head[j]);
- if(i>j) swap(i,j);
- for(head_t *h = lru_head.next; h!=&lru_head; h=h->next)
- {
- if(h->len > i)
- {
- if(h->len > j)
- swap(h->data[i],h->data[j]);
- else
- {
- // give up
- lru_delete(h);
- free(h->data);
- size += h->len;
- h->data = 0;
- h->len = 0;
- }
- }
- }
- }
- //
- // Kernel evaluation
- //
- // the static method k_function is for doing single kernel evaluation
- // the constructor of Kernel prepares to calculate the l*l kernel matrix
- // the member function get_Q is for getting one column from the Q Matrix
- //
- class Kernel {
- public:
- Kernel(int l, svm_node * const * x, const svm_parameter& param);
- virtual ~Kernel();
- static double k_function(const svm_node *x, const svm_node *y,
- const svm_parameter& param);
- virtual Qfloat *get_Q(int column, int len) const = 0;
- virtual void swap_index(int i, int j) const // no so const...
- {
- swap(x[i],x[j]);
- if(x_square) swap(x_square[i],x_square[j]);
- }
- protected:
- double (Kernel::*kernel_function)(int i, int j) const;
- private:
- const svm_node **x;
- double *x_square;
- // svm_parameter
- const int kernel_type;
- const double degree;
- const double gamma;
- const double coef0;
- static double dot(const svm_node *px, const svm_node *py);
- double kernel_linear(int i, int j) const
- {
- return dot(x[i],x[j]);
- }
- double kernel_poly(int i, int j) const
- {
- return pow(gamma*dot(x[i],x[j])+coef0,degree);
- }
- double kernel_rbf(int i, int j) const
- {
- return exp(-gamma*(x_square[i]+x_square[j]-2*dot(x[i],x[j])));
- }
- double kernel_sigmoid(int i, int j) const
- {
- return tanh(gamma*dot(x[i],x[j])+coef0);
- }
- };
- Kernel::Kernel(int l, svm_node * const * x_, const svm_parameter& param)
- :kernel_type(param.kernel_type), degree(param.degree),
- gamma(param.gamma), coef0(param.coef0)
- {
- switch(kernel_type)
- {
- case LINEAR:
- kernel_function = &Kernel::kernel_linear;
- break;
- case POLY:
- kernel_function = &Kernel::kernel_poly;
- break;
- case RBF:
- kernel_function = &Kernel::kernel_rbf;
- break;
- case SIGMOID:
- kernel_function = &Kernel::kernel_sigmoid;
- break;
- default:
- fprintf(stderr,"unknown kernel function.n");
- exit(1);
- }
- clone(x,x_,l);
- if(kernel_type == RBF)
- {
- x_square = new double[l];
- for(int i=0;i<l;i++)
- x_square[i] = dot(x[i],x[i]);
- }
- else
- x_square = 0;
- }
- Kernel::~Kernel()
- {
- delete[] x;
- delete[] x_square;
- }
- double Kernel::dot(const svm_node *px, const svm_node *py)
- {
- double sum = 0;
- while(px->index != -1 && py->index != -1)
- {
- if(px->index == py->index)
- {
- sum += px->value * py->value;
- ++px;
- ++py;
- }
- else
- {
- if(px->index > py->index)
- ++py;
- else
- ++px;
- }
- }
- return sum;
- }
- double Kernel::k_function(const svm_node *x, const svm_node *y,
- const svm_parameter& param)
- {
- switch(param.kernel_type)
- {
- case LINEAR:
- return dot(x,y);
- case POLY:
- return pow(param.gamma*dot(x,y)+param.coef0,param.degree);
- case RBF:
- {
- double sum = 0;
- while(x->index != -1 && y->index !=-1)
- {
- if(x->index == y->index)
- {
- double d = x->value - y->value;
- sum += d*d;
- ++x;
- ++y;
- }
- else
- {
- if(x->index > y->index)
- {
- sum += y->value * y->value;
- ++y;
- }
- else
- {
- sum += x->value * x->value;
- ++x;
- }
- }
- }
- while(x->index != -1)
- {
- sum += x->value * x->value;
- ++x;
- }
- while(y->index != -1)
- {
- sum += y->value * y->value;
- ++y;
- }
-
- return exp(-param.gamma*sum);
- }
- case SIGMOID:
- return tanh(param.gamma*dot(x,y)+param.coef0);
- default:
- break;
- }
- fprintf(stderr,"unknown kernel function.n");
- exit(1);
- }
- // Generalized SMO+SVMlight algorithm
- // Solves:
- //
- // min 0.5(alpha^T Q alpha) + b^T alpha
- //
- // y^T alpha = delta
- // y_i = +1 or -1
- // 0 <= alpha_i <= Cp for y_i = 1
- // 0 <= alpha_i <= Cn for y_i = -1
- //
- // Given:
- //
- // Q, b, y, Cp, Cn, and an initial feasible point alpha
- // l is the size of vectors and matrices
- // eps is the stopping criterion
- //
- // solution will be put in alpha, objective value will be put in obj
- //
- class Solver {
- public:
- Solver() {};
- virtual ~Solver() {};
- struct SolutionInfo {
- double obj;
- double rho;
- double upper_bound_p;
- double upper_bound_n;
- double r; // for Solver_NU
- };
- void Solve(int l, const Kernel& Q, const double *b_, const schar *y_,
- double *alpha_, double Cp, double Cn, double eps,
- SolutionInfo* si, int shrinking);
- protected:
- int active_size;
- schar *y;
- double *G; // gradient of objective function
- enum { LOWER_BOUND, UPPER_BOUND, FREE };
- char *alpha_status; // LOWER_BOUND, UPPER_BOUND, FREE
- double *alpha;
- const Kernel *Q;
- double eps;
- double Cp,Cn;
- double *b;
- int *active_set;
- double *G_bar; // gradient, if we treat free variables as 0
- int l;
- bool unshrinked; // XXX
- double get_C(int i)
- {
- return (y[i] > 0)? Cp : Cn;
- }
- void update_alpha_status(int i)
- {
- if(alpha[i] >= get_C(i))
- alpha_status[i] = UPPER_BOUND;
- else if(alpha[i] <= 0)
- alpha_status[i] = LOWER_BOUND;
- else alpha_status[i] = FREE;
- }
- bool is_upper_bound(int i) { return alpha_status[i] == UPPER_BOUND; }
- bool is_lower_bound(int i) { return alpha_status[i] == LOWER_BOUND; }
- bool is_free(int i) { return alpha_status[i] == FREE; }
- void swap_index(int i, int j);
- void reconstruct_gradient();
- virtual int select_working_set(int &i, int &j);
- virtual double calculate_rho();
- virtual void do_shrinking();
- };
- void Solver::swap_index(int i, int j)
- {
- Q->swap_index(i,j);
- swap(y[i],y[j]);
- swap(G[i],G[j]);
- swap(alpha_status[i],alpha_status[j]);
- swap(alpha[i],alpha[j]);
- swap(b[i],b[j]);
- swap(active_set[i],active_set[j]);
- swap(G_bar[i],G_bar[j]);
- }
- void Solver::reconstruct_gradient()
- {
- // reconstruct inactive elements of G from G_bar and free variables
- if(active_size == l) return;
- int i;
- for(i=active_size;i<l;i++)
- G[i] = G_bar[i] + b[i];
-
- for(i=0;i<active_size;i++)
- if(is_free(i))
- {
- const Qfloat *Q_i = Q->get_Q(i,l);
- double alpha_i = alpha[i];
- for(int j=active_size;j<l;j++)
- G[j] += alpha_i * Q_i[j];
- }
- }
- void Solver::Solve(int l, const Kernel& Q, const double *b_, const schar *y_,
- double *alpha_, double Cp, double Cn, double eps,
- SolutionInfo* si, int shrinking)
- {
- this->l = l;
- this->Q = &Q;
- clone(b, b_,l);
- clone(y, y_,l);
- clone(alpha,alpha_,l);
- this->Cp = Cp;
- this->Cn = Cn;
- this->eps = eps;
- unshrinked = false;
- // initialize alpha_status
- {
- alpha_status = new char[l];
- for(int i=0;i<l;i++)
- update_alpha_status(i);
- }
- // initialize active set (for shrinking)
- {
- active_set = new int[l];
- for(int i=0;i<l;i++)
- active_set[i] = i;
- active_size = l;
- }
- // initialize gradient
- {
- G = new double[l];
- G_bar = new double[l];
- int i;
- for(i=0;i<l;i++)
- {
- G[i] = b[i];
- G_bar[i] = 0;
- }
- for(i=0;i<l;i++)
- if(!is_lower_bound(i))
- {
- Qfloat *Q_i = Q.get_Q(i,l);
- double alpha_i = alpha[i];
- int j;
- for(j=0;j<l;j++)
- G[j] += alpha_i*Q_i[j];
- if(is_upper_bound(i))
- for(j=0;j<l;j++)
- G_bar[j] += get_C(i) * Q_i[j];
- }
- }
- // optimization step
- int iter = 0;
- int counter = min(l,1000)+1;
- while(1)
- {
- // show progress and do shrinking
- if(--counter == 0)
- {
- counter = min(l,1000);
- if(shrinking) do_shrinking();
- info("."); info_flush();
- }
- int i,j;
- if(select_working_set(i,j)!=0)
- {
- // reconstruct the whole gradient
- reconstruct_gradient();
- // reset active set size and check
- active_size = l;
- info("*"); info_flush();
- if(select_working_set(i,j)!=0)
- break;
- else
- counter = 1; // do shrinking next iteration
- }
-
- ++iter;
- // update alpha[i] and alpha[j], handle bounds carefully
-
- const Qfloat *Q_i = Q.get_Q(i,active_size);
- const Qfloat *Q_j = Q.get_Q(j,active_size);
- double C_i = get_C(i);
- double C_j = get_C(j);
- double old_alpha_i = alpha[i];
- double old_alpha_j = alpha[j];
- if(y[i]!=y[j])
- {
- double delta = (-G[i]-G[j])/(Q_i[i]+Q_j[j]+2*Q_i[j]);
- double diff = alpha[i] - alpha[j];
- alpha[i] += delta;
- alpha[j] += delta;
-
- if(diff > 0)
- {
- if(alpha[j] < 0)
- {
- alpha[j] = 0;
- alpha[i] = diff;
- }
- }
- else
- {
- if(alpha[i] < 0)
- {
- alpha[i] = 0;
- alpha[j] = -diff;
- }
- }
- if(diff > C_i - C_j)
- {
- if(alpha[i] > C_i)
- {
- alpha[i] = C_i;
- alpha[j] = C_i - diff;
- }
- }
- else
- {
- if(alpha[j] > C_j)
- {
- alpha[j] = C_j;
- alpha[i] = C_j + diff;
- }
- }
- }
- else
- {
- double delta = (G[i]-G[j])/(Q_i[i]+Q_j[j]-2*Q_i[j]);
- double sum = alpha[i] + alpha[j];
- alpha[i] -= delta;
- alpha[j] += delta;
- if(sum > C_i)
- {
- if(alpha[i] > C_i)
- {
- alpha[i] = C_i;
- alpha[j] = sum - C_i;
- }
- }
- else
- {
- if(alpha[j] < 0)
- {
- alpha[j] = 0;
- alpha[i] = sum;
- }
- }
- if(sum > C_j)
- {
- if(alpha[j] > C_j)
- {
- alpha[j] = C_j;
- alpha[i] = sum - C_j;
- }
- }
- else
- {
- if(alpha[i] < 0)
- {
- alpha[i] = 0;
- alpha[j] = sum;
- }
- }
- }
- // update G
- double delta_alpha_i = alpha[i] - old_alpha_i;
- double delta_alpha_j = alpha[j] - old_alpha_j;
-
- for(int k=0;k<active_size;k++)
- {
- G[k] += Q_i[k]*delta_alpha_i + Q_j[k]*delta_alpha_j;
- }
- // update alpha_status and G_bar
- {
- bool ui = is_upper_bound(i);
- bool uj = is_upper_bound(j);
- update_alpha_status(i);
- update_alpha_status(j);
- int k;
- if(ui != is_upper_bound(i))
- {
- Q_i = Q.get_Q(i,l);
- if(ui)
- for(k=0;k<l;k++)
- G_bar[k] -= C_i * Q_i[k];
- else
- for(k=0;k<l;k++)
- G_bar[k] += C_i * Q_i[k];
- }
- if(uj != is_upper_bound(j))
- {
- Q_j = Q.get_Q(j,l);
- if(uj)
- for(k=0;k<l;k++)
- G_bar[k] -= C_j * Q_j[k];
- else
- for(k=0;k<l;k++)
- G_bar[k] += C_j * Q_j[k];
- }
- }
- }
- // calculate rho
- si->rho = calculate_rho();
- // calculate objective value
- {
- double v = 0;
- int i;
- for(i=0;i<l;i++)
- v += alpha[i] * (G[i] + b[i]);
- si->obj = v/2;
- }
- // put back the solution
- {
- for(int i=0;i<l;i++)
- alpha_[active_set[i]] = alpha[i];
- }
- // juggle everything back
- /*{
- for(int i=0;i<l;i++)
- while(active_set[i] != i)
- swap_index(i,active_set[i]);
- // or Q.swap_index(i,active_set[i]);
- }*/
- si->upper_bound_p = Cp;
- si->upper_bound_n = Cn;
- info("noptimization finished, #iter = %dn",iter);
- delete[] b;
- delete[] y;
- delete[] alpha;
- delete[] alpha_status;
- delete[] active_set;
- delete[] G;
- delete[] G_bar;
- }
- // return 1 if already optimal, return 0 otherwise
- int Solver::select_working_set(int &out_i, int &out_j)
- {
- // return i,j which maximize -grad(f)^T d , under constraint
- // if alpha_i == C, d != +1
- // if alpha_i == 0, d != -1
- double Gmax1 = -INF; // max { -grad(f)_i * d | y_i*d = +1 }
- int Gmax1_idx = -1;
- double Gmax2 = -INF; // max { -grad(f)_i * d | y_i*d = -1 }
- int Gmax2_idx = -1;
- for(int i=0;i<active_size;i++)
- {
- if(y[i]==+1) // y = +1
- {
- if(!is_upper_bound(i)) // d = +1
- {
- if(-G[i] > Gmax1)
- {
- Gmax1 = -G[i];
- Gmax1_idx = i;
- }
- }
- if(!is_lower_bound(i)) // d = -1
- {
- if(G[i] > Gmax2)
- {
- Gmax2 = G[i];
- Gmax2_idx = i;
- }
- }
- }
- else // y = -1
- {
- if(!is_upper_bound(i)) // d = +1
- {
- if(-G[i] > Gmax2)
- {
- Gmax2 = -G[i];
- Gmax2_idx = i;
- }
- }
- if(!is_lower_bound(i)) // d = -1
- {
- if(G[i] > Gmax1)
- {
- Gmax1 = G[i];
- Gmax1_idx = i;
- }
- }
- }
- }
- if(Gmax1+Gmax2 < eps)
- return 1;
- out_i = Gmax1_idx;
- out_j = Gmax2_idx;
- return 0;
- }
- void Solver::do_shrinking()
- {
- int i,j,k;
- if(select_working_set(i,j)!=0) return;
- double Gm1 = -y[j]*G[j];
- double Gm2 = y[i]*G[i];
- // shrink
-
- for(k=0;k<active_size;k++)
- {
- if(is_lower_bound(k))
- {
- if(y[k]==+1)
- {
- if(-G[k] >= Gm1) continue;
- }
- else if(-G[k] >= Gm2) continue;
- }
- else if(is_upper_bound(k))
- {
- if(y[k]==+1)
- {
- if(G[k] >= Gm2) continue;
- }
- else if(G[k] >= Gm1) continue;
- }
- else continue;
- --active_size;
- swap_index(k,active_size);
- --k; // look at the newcomer
- }
- // unshrink, check all variables again before final iterations
- if(unshrinked || -(Gm1 + Gm2) > eps*10) return;
-
- unshrinked = true;
- reconstruct_gradient();
- for(k=l-1;k>=active_size;k--)
- {
- if(is_lower_bound(k))
- {
- if(y[k]==+1)
- {
- if(-G[k] < Gm1) continue;
- }
- else if(-G[k] < Gm2) continue;
- }
- else if(is_upper_bound(k))
- {
- if(y[k]==+1)
- {
- if(G[k] < Gm2) continue;
- }
- else if(G[k] < Gm1) continue;
- }
- else continue;
- swap_index(k,active_size);
- active_size++;
- ++k; // look at the newcomer
- }
- }
- double Solver::calculate_rho()
- {
- double r;
- int nr_free = 0;
- double ub = INF, lb = -INF, sum_free = 0;
- for(int i=0;i<active_size;i++)
- {
- double yG = y[i]*G[i];
- if(is_lower_bound(i))
- {
- if(y[i] > 0)
- ub = min(ub,yG);
- else
- lb = max(lb,yG);
- }
- else if(is_upper_bound(i))
- {
- if(y[i] < 0)
- ub = min(ub,yG);
- else
- lb = max(lb,yG);
- }
- else
- {
- ++nr_free;
- sum_free += yG;
- }
- }
- if(nr_free>0)
- r = sum_free/nr_free;
- else
- r = (ub+lb)/2;
- return r;
- }
- //
- // Solver for nu-svm classification and regression
- //
- // additional constraint: e^T alpha = constant
- //
- class Solver_NU : public Solver
- {
- public:
- Solver_NU() {}
- void Solve(int l, const Kernel& Q, const double *b, const schar *y,
- double *alpha, double Cp, double Cn, double eps,
- SolutionInfo* si, int shrinking)
- {
- this->si = si;
- Solver::Solve(l,Q,b,y,alpha,Cp,Cn,eps,si,shrinking);
- }
- private:
- SolutionInfo *si;
- int select_working_set(int &i, int &j);
- double calculate_rho();
- void do_shrinking();
- };
- int Solver_NU::select_working_set(int &out_i, int &out_j)
- {
- // return i,j which maximize -grad(f)^T d , under constraint
- // if alpha_i == C, d != +1
- // if alpha_i == 0, d != -1
- double Gmax1 = -INF; // max { -grad(f)_i * d | y_i = +1, d = +1 }
- int Gmax1_idx = -1;
- double Gmax2 = -INF; // max { -grad(f)_i * d | y_i = +1, d = -1 }
- int Gmax2_idx = -1;
- double Gmax3 = -INF; // max { -grad(f)_i * d | y_i = -1, d = +1 }
- int Gmax3_idx = -1;
- double Gmax4 = -INF; // max { -grad(f)_i * d | y_i = -1, d = -1 }
- int Gmax4_idx = -1;
- for(int i=0;i<active_size;i++)
- {
- if(y[i]==+1) // y == +1
- {
- if(!is_upper_bound(i)) // d = +1
- {
- if(-G[i] > Gmax1)
- {
- Gmax1 = -G[i];
- Gmax1_idx = i;
- }
- }
- if(!is_lower_bound(i)) // d = -1
- {
- if(G[i] > Gmax2)
- {
- Gmax2 = G[i];
- Gmax2_idx = i;
- }
- }
- }
- else // y == -1
- {
- if(!is_upper_bound(i)) // d = +1
- {
- if(-G[i] > Gmax3)
- {
- Gmax3 = -G[i];
- Gmax3_idx = i;
- }
- }
- if(!is_lower_bound(i)) // d = -1
- {
- if(G[i] > Gmax4)
- {
- Gmax4 = G[i];
- Gmax4_idx = i;
- }
- }
- }
- }
- if(max(Gmax1+Gmax2,Gmax3+Gmax4) < eps)
- return 1;
- if(Gmax1+Gmax2 > Gmax3+Gmax4)
- {
- out_i = Gmax1_idx;
- out_j = Gmax2_idx;
- }
- else
- {
- out_i = Gmax3_idx;
- out_j = Gmax4_idx;
- }
- return 0;
- }
- void Solver_NU::do_shrinking()
- {
- double Gmax1 = -INF; // max { -grad(f)_i * d | y_i = +1, d = +1 }
- double Gmax2 = -INF; // max { -grad(f)_i * d | y_i = +1, d = -1 }
- double Gmax3 = -INF; // max { -grad(f)_i * d | y_i = -1, d = +1 }
- double Gmax4 = -INF; // max { -grad(f)_i * d | y_i = -1, d = -1 }
- int k;
- for(k=0;k<active_size;k++)
- {
- if(!is_upper_bound(k))
- {
- if(y[k]==+1)
- {
- if(-G[k] > Gmax1) Gmax1 = -G[k];
- }
- else if(-G[k] > Gmax3) Gmax3 = -G[k];
- }
- if(!is_lower_bound(k))
- {
- if(y[k]==+1)
- {
- if(G[k] > Gmax2) Gmax2 = G[k];
- }
- else if(G[k] > Gmax4) Gmax4 = G[k];
- }
- }
- double Gm1 = -Gmax2;
- double Gm2 = -Gmax1;
- double Gm3 = -Gmax4;
- double Gm4 = -Gmax3;
- for(k=0;k<active_size;k++)
- {
- if(is_lower_bound(k))
- {
- if(y[k]==+1)
- {
- if(-G[k] >= Gm1) continue;
- }
- else if(-G[k] >= Gm3) continue;
- }
- else if(is_upper_bound(k))
- {
- if(y[k]==+1)
- {
- if(G[k] >= Gm2) continue;
- }
- else if(G[k] >= Gm4) continue;
- }
- else continue;
- --active_size;
- swap_index(k,active_size);
- --k; // look at the newcomer
- }
- // unshrink, check all variables again before final iterations
- if(unshrinked || max(-(Gm1+Gm2),-(Gm3+Gm4)) > eps*10) return;
-
- unshrinked = true;
- reconstruct_gradient();
- for(k=l-1;k>=active_size;k--)
- {
- if(is_lower_bound(k))
- {
- if(y[k]==+1)
- {
- if(-G[k] < Gm1) continue;
- }
- else if(-G[k] < Gm3) continue;
- }
- else if(is_upper_bound(k))
- {
- if(y[k]==+1)
- {
- if(G[k] < Gm2) continue;
- }
- else if(G[k] < Gm4) continue;
- }
- else continue;
- swap_index(k,active_size);
- active_size++;
- ++k; // look at the newcomer
- }
- }
- double Solver_NU::calculate_rho()
- {
- int nr_free1 = 0,nr_free2 = 0;
- double ub1 = INF, ub2 = INF;
- double lb1 = -INF, lb2 = -INF;
- double sum_free1 = 0, sum_free2 = 0;
- for(int i=0;i<active_size;i++)
- {
- if(y[i]==+1)
- {
- if(is_lower_bound(i))
- ub1 = min(ub1,G[i]);
- else if(is_upper_bound(i))
- lb1 = max(lb1,G[i]);
- else
- {
- ++nr_free1;
- sum_free1 += G[i];
- }
- }
- else
- {
- if(is_lower_bound(i))
- ub2 = min(ub2,G[i]);
- else if(is_upper_bound(i))
- lb2 = max(lb2,G[i]);
- else
- {
- ++nr_free2;
- sum_free2 += G[i];
- }
- }
- }
- double r1,r2;
- if(nr_free1 > 0)
- r1 = sum_free1/nr_free1;
- else
- r1 = (ub1+lb1)/2;
-
- if(nr_free2 > 0)
- r2 = sum_free2/nr_free2;
- else
- r2 = (ub2+lb2)/2;
-
- si->r = (r1+r2)/2;
- return (r1-r2)/2;
- }
- //
- // Q matrices for various formulations
- //
- class SVC_Q: public Kernel
- {
- public:
- SVC_Q(const svm_problem& prob, const svm_parameter& param, const schar *y_)
- :Kernel(prob.l, prob.x, param)
- {
- clone(y,y_,prob.l);
- cache = new Cache(prob.l,(int)(param.cache_size*(1<<20)));
- }
-
- Qfloat *get_Q(int i, int len) const
- {
- Qfloat *data;
- int start;
- if((start = cache->get_data(i,&data,len)) < len)
- {
- for(int j=start;j<len;j++)
- data[j] = (Qfloat)(y[i]*y[j]*(this->*kernel_function)(i,j));
- }
- return data;
- }
- void swap_index(int i, int j) const
- {
- cache->swap_index(i,j);
- Kernel::swap_index(i,j);
- swap(y[i],y[j]);
- }
- ~SVC_Q()
- {
- delete[] y;
- delete cache;
- }
- private:
- schar *y;
- Cache *cache;
- };
- class ONE_CLASS_Q: public Kernel
- {
- public:
- ONE_CLASS_Q(const svm_problem& prob, const svm_parameter& param)
- :Kernel(prob.l, prob.x, param)
- {
- cache = new Cache(prob.l,(int)(param.cache_size*(1<<20)));
- }
-
- Qfloat *get_Q(int i, int len) const
- {
- Qfloat *data;
- int start;
- if((start = cache->get_data(i,&data,len)) < len)
- {
- for(int j=start;j<len;j++)
- data[j] = (Qfloat)(this->*kernel_function)(i,j);
- }
- return data;
- }
- void swap_index(int i, int j) const
- {
- cache->swap_index(i,j);
- Kernel::swap_index(i,j);
- }
- ~ONE_CLASS_Q()
- {
- delete cache;
- }
- private:
- Cache *cache;
- };
- class SVR_Q: public Kernel
- {
- public:
- SVR_Q(const svm_problem& prob, const svm_parameter& param)
- :Kernel(prob.l, prob.x, param)
- {
- l = prob.l;
- cache = new Cache(l,(int)(param.cache_size*(1<<20)));
- sign = new schar[2*l];
- index = new int[2*l];
- for(int k=0;k<l;k++)
- {
- sign[k] = 1;
- sign[k+l] = -1;
- index[k] = k;
- index[k+l] = k;
- }
- buffer[0] = new Qfloat[2*l];
- buffer[1] = new Qfloat[2*l];
- next_buffer = 0;
- }
- void swap_index(int i, int j) const
- {
- swap(sign[i],sign[j]);
- swap(index[i],index[j]);
- }
-
- Qfloat *get_Q(int i, int len) const
- {
- Qfloat *data;
- int real_i = index[i];
- if(cache->get_data(real_i,&data,l) < l)
- {
- for(int j=0;j<l;j++)
- data[j] = (Qfloat)(this->*kernel_function)(real_i,j);
- }
- // reorder and copy
- Qfloat *buf = buffer[next_buffer];
- next_buffer = 1 - next_buffer;
- schar si = sign[i];
- for(int j=0;j<len;j++)
- buf[j] = si * sign[j] * data[index[j]];
- return buf;
- }
- ~SVR_Q()
- {
- delete cache;
- delete[] sign;
- delete[] index;
- delete[] buffer[0];
- delete[] buffer[1];
- }
- private:
- int l;
- Cache *cache;
- schar *sign;
- int *index;
- mutable int next_buffer;
- Qfloat* buffer[2];
- };
- //
- // construct and solve various formulations
- //
- static void solve_c_svc(
- const svm_problem *prob, const svm_parameter* param,
- double *alpha, Solver::SolutionInfo* si, double Cp, double Cn)
- {
- int l = prob->l;
- double *minus_ones = new double[l];
- schar *y = new schar[l];
- int i;
- for(i=0;i<l;i++)
- {
- alpha[i] = 0;
- minus_ones[i] = -1;
- if(prob->y[i] > 0) y[i] = +1; else y[i]=-1;
- }
- Solver s;
- s.Solve(l, SVC_Q(*prob,*param,y), minus_ones, y,
- alpha, Cp, Cn, param->eps, si, param->shrinking);
- double sum_alpha=0;
- for(i=0;i<l;i++)
- sum_alpha += alpha[i];
- info("nu = %fn", sum_alpha/(param->C*prob->l));
- for(i=0;i<l;i++)
- alpha[i] *= y[i];
- delete[] minus_ones;
- delete[] y;
- }
- static void solve_nu_svc(
- const svm_problem *prob, const svm_parameter *param,
- double *alpha, Solver::SolutionInfo* si)
- {
- int i;
- int l = prob->l;
- double nu = param->nu;
- int y_pos = 0;
- int y_neg = 0;
- schar *y = new schar[l];
- for(i=0;i<l;i++)
- if(prob->y[i]>0)
- {
- y[i] = +1;
- ++y_pos;
- }
- else
- {
- y[i] = -1;
- ++y_neg;
- }
- if(nu < 0 || nu*l/2 > min(y_pos,y_neg))
- {
- fprintf(stderr,"specified nu is infeasiblen");
- exit(1);
- }
- double sum_pos = nu*l/2;
- double sum_neg = nu*l/2;
- for(i=0;i<l;i++)
- if(y[i] == +1)
- {
- alpha[i] = min(1.0,sum_pos);
- sum_pos -= alpha[i];
- }
- else
- {
- alpha[i] = min(1.0,sum_neg);
- sum_neg -= alpha[i];
- }
- double *zeros = new double[l];
- for(i=0;i<l;i++)
- zeros[i] = 0;
- Solver_NU s;
- s.Solve(l, SVC_Q(*prob,*param,y), zeros, y,
- alpha, 1.0, 1.0, param->eps, si, param->shrinking);
- double r = si->r;
- info("C = %fn",1/r);
- for(i=0;i<l;i++)
- alpha[i] *= y[i]/r;
- si->rho /= r;
- si->obj /= (r*r);
- si->upper_bound_p = 1/r;
- si->upper_bound_n = 1/r;
- delete[] y;
- delete[] zeros;
- }
- static void solve_one_class(
- const svm_problem *prob, const svm_parameter *param,
- double *alpha, Solver::SolutionInfo* si)
- {
- int l = prob->l;
- double *zeros = new double[l];
- schar *ones = new schar[l];
- int i;
- int n = (int)(param->nu*prob->l); // # of alpha's at upper bound
- if(n>=prob->l)
- {
- fprintf(stderr,"nu must be in (0,1)n");
- exit(1);
- }
- for(i=0;i<n;i++)
- alpha[i] = 1;
- alpha[n] = param->nu * prob->l - n;
- for(i=n+1;i<l;i++)
- alpha[i] = 0;
- for(i=0;i<l;i++)
- {
- zeros[i] = 0;
- ones[i] = 1;
- }
- Solver s;
- s.Solve(l, ONE_CLASS_Q(*prob,*param), zeros, ones,
- alpha, 1.0, 1.0, param->eps, si, param->shrinking);
- delete[] zeros;
- delete[] ones;
- }
- static void solve_epsilon_svr(
- const svm_problem *prob, const svm_parameter *param,
- double *alpha, Solver::SolutionInfo* si)
- {
- int l = prob->l;
- double *alpha2 = new double[2*l];
- double *linear_term = new double[2*l];
- schar *y = new schar[2*l];
- int i;
- for(i=0;i<l;i++)
- {
- alpha2[i] = 0;
- linear_term[i] = param->p - prob->y[i];
- y[i] = 1;
- alpha2[i+l] = 0;
- linear_term[i+l] = param->p + prob->y[i];
- y[i+l] = -1;
- }
- Solver s;
- s.Solve(2*l, SVR_Q(*prob,*param), linear_term, y,
- alpha2, param->C, param->C, param->eps, si, param->shrinking);
- double sum_alpha = 0;
- for(i=0;i<l;i++)
- {
- alpha[i] = alpha2[i] - alpha2[i+l];
- sum_alpha += fabs(alpha[i]);
- }
- info("nu = %fn",sum_alpha/(param->C*l));
- delete[] alpha2;
- delete[] linear_term;
- delete[] y;
- }
- static void solve_nu_svr(
- const svm_problem *prob, const svm_parameter *param,
- double *alpha, Solver::SolutionInfo* si)
- {
- if(param->nu < 0 || param->nu > 1)
- {
- fprintf(stderr,"specified nu is out of rangen");
- exit(1);
- }
- int l = prob->l;
- double C = param->C;
- double *alpha2 = new double[2*l];
- double *linear_term = new double[2*l];
- schar *y = new schar[2*l];
- int i;
- double sum = C * param->nu * l / 2;
- for(i=0;i<l;i++)
- {
- alpha2[i] = alpha2[i+l] = min(sum,C);
- sum -= alpha2[i];
- linear_term[i] = - prob->y[i];
- y[i] = 1;
- linear_term[i+l] = prob->y[i];
- y[i+l] = -1;
- }
- Solver_NU s;
- s.Solve(2*l, SVR_Q(*prob,*param), linear_term, y,
- alpha2, C, C, param->eps, si, param->shrinking);
- info("epsilon = %fn",-si->r);
- for(i=0;i<l;i++)
- alpha[i] = alpha2[i] - alpha2[i+l];
- delete[] alpha2;
- delete[] linear_term;
- delete[] y;
- }
- //
- // decision_function
- //
- struct decision_function
- {
- double *alpha;
- double rho;
- };
- decision_function svm_train_one(
- const svm_problem *prob, const svm_parameter *param,
- double Cp, double Cn)
- {
- double *alpha = Malloc(double,prob->l);
- Solver::SolutionInfo si;
- switch(param->svm_type)
- {
- case C_SVC:
- solve_c_svc(prob,param,alpha,&si,Cp,Cn);
- break;
- case NU_SVC:
- solve_nu_svc(prob,param,alpha,&si);
- break;
- case ONE_CLASS:
- solve_one_class(prob,param,alpha,&si);
- break;
- case EPSILON_SVR:
- solve_epsilon_svr(prob,param,alpha,&si);
- break;
- case NU_SVR:
- solve_nu_svr(prob,param,alpha,&si);
- break;
- }
- info("obj = %f, rho = %fn",si.obj,si.rho);
- // output SVs
- int nSV = 0;
- int nBSV = 0;
- for(int i=0;i<prob->l;i++)
- {
- if(fabs(alpha[i]) > 0)
- {
- ++nSV;
- if(prob->y[i] > 0)
- {
- if(fabs(alpha[i]) >= si.upper_bound_p)
- ++nBSV;
- }
- else
- {
- if(fabs(alpha[i]) >= si.upper_bound_n)
- ++nBSV;
- }
- }
- }
- info("nSV = %d, nBSV = %dn",nSV,nBSV);
- decision_function f;
- f.alpha = alpha;
- f.rho = si.rho;
- return f;
- }
- //
- // svm_model
- //
- struct svm_model
- {
- svm_parameter param; // parameter
- int nr_class; // number of classes, = 2 in regression/one class svm
- int l; // total #SV
- svm_node **SV; // SVs (SV[l])
- double **sv_coef; // coefficients for SVs in decision functions (sv_coef[n-1][l])
- double *rho; // constants in decision functions (rho[n*(n-1)/2])
- // for classification only
- int *label; // label of each class (label[n])
- int *nSV; // number of SVs for each class (nSV[n])
- // nSV[0] + nSV[1] + ... + nSV[n-1] = l
- // XXX
- int free_sv; // 1 if svm_model is created by svm_load_model
- // 0 if svm_model is created by svm_train
- };
- //
- // Interface functions
- //
- svm_model *svm_train(const svm_problem *prob, const svm_parameter *param)
- {
- svm_model *model = Malloc(svm_model,1);
- model->param = *param;
- model->free_sv = 0; // XXX
- if(param->svm_type == ONE_CLASS ||
- param->svm_type == EPSILON_SVR ||
- param->svm_type == NU_SVR)
- {
- // regression or one-class-svm
- model->nr_class = 2;
- model->label = NULL;
- model->nSV = NULL;
- model->sv_coef = Malloc(double *,1);
- decision_function f = svm_train_one(prob,param,0,0);
- model->rho = Malloc(double,1);
- model->rho[0] = f.rho;
- int nSV = 0;
- int i;
- for(i=0;i<prob->l;i++)
- if(fabs(f.alpha[i]) > 0) ++nSV;
- model->l = nSV;
- model->SV = Malloc(svm_node *,nSV);
- model->sv_coef[0] = Malloc(double,nSV);
- int j = 0;
- for(i=0;i<prob->l;i++)
- if(fabs(f.alpha[i]) > 0)
- {
- model->SV[j] = prob->x[i];
- model->sv_coef[0][j] = f.alpha[i];
- ++j;
- }
- free(f.alpha);
- }
- else
- {
- // classification
- // find out the number of classes
- int l = prob->l;
- int max_nr_class = 16;
- int nr_class = 0;
- int *label = Malloc(int,max_nr_class);
- int *count = Malloc(int,max_nr_class);
- int *index = Malloc(int,l);
- int i;
- for(i=0;i<l;i++)
- {
- int this_label = (int)prob->y[i];
- int j;
- for(j=0;j<nr_class;j++)
- if(this_label == label[j])
- {
- ++count[j];
- break;
- }
- index[i] = j;
- if(j == nr_class)
- {
- if(nr_class == max_nr_class)
- {
- max_nr_class *= 2;
- label = (int *)realloc(label,max_nr_class*sizeof(int));
- count = (int *)realloc(count,max_nr_class*sizeof(int));
- }
- label[nr_class] = this_label;
- count[nr_class] = 1;
- ++nr_class;
- }
- }
- // group training data of the same class
- int *start = Malloc(int,nr_class);
- start[0] = 0;
- for(i=1;i<nr_class;i++)
- start[i] = start[i-1]+count[i-1];
- svm_node **x = Malloc(svm_node *,l);
-
- for(i=0;i<l;i++)
- {
- x[start[index[i]]] = prob->x[i];
- ++start[index[i]];
- }
-
- start[0] = 0;
- for(i=1;i<nr_class;i++)
- start[i] = start[i-1]+count[i-1];
- // calculate weighted C
- double *weighted_C = Malloc(double, nr_class);
- for(i=0;i<nr_class;i++)
- weighted_C[i] = param->C;
- for(i=0;i<param->nr_weight;i++)
- {
- int j;
- for(j=0;j<nr_class;j++)
- if(param->weight_label[i] == label[j])
- break;
- if(j == nr_class)
- fprintf(stderr,"warning: class label %d specified in weight is not foundn", param->weight_label[i]);
- else
- weighted_C[j] *= param->weight[i];
- }
- // train n*(n-1)/2 models
-
- bool *nonzero = Malloc(bool,l);
- for(i=0;i<l;i++)
- nonzero[i] = false;
- decision_function *f = Malloc(decision_function,nr_class*(nr_class-1)/2);
- int p = 0;
- for(i=0;i<nr_class;i++)
- for(int j=i+1;j<nr_class;j++)
- {
- svm_problem sub_prob;
- int si = start[i], sj = start[j];
- int ci = count[i], cj = count[j];
- sub_prob.l = ci+cj;
- sub_prob.x = Malloc(svm_node *,sub_prob.l);
- sub_prob.y = Malloc(double,sub_prob.l);
- int k;
- for(k=0;k<ci;k++)
- {
- sub_prob.x[k] = x[si+k];
- sub_prob.y[k] = +1;
- }
- for(k=0;k<cj;k++)
- {
- sub_prob.x[ci+k] = x[sj+k];
- sub_prob.y[ci+k] = -1;
- }
-
- f[p] = svm_train_one(&sub_prob,param,weighted_C[i],weighted_C[j]);
- for(k=0;k<ci;k++)
- if(!nonzero[si+k] && fabs(f[p].alpha[k]) > 0)
- nonzero[si+k] = true;
- for(k=0;k<cj;k++)
- if(!nonzero[sj+k] && fabs(f[p].alpha[ci+k]) > 0)
- nonzero[sj+k] = true;
- free(sub_prob.x);
- free(sub_prob.y);
- ++p;
- }
- // build output
- model->nr_class = nr_class;
-
- model->label = Malloc(int,nr_class);
- for(i=0;i<nr_class;i++)
- model->label[i] = label[i];
-
- model->rho = Malloc(double,nr_class*(nr_class-1)/2);
- for(i=0;i<nr_class*(nr_class-1)/2;i++)
- model->rho[i] = f[i].rho;
- int total_sv = 0;
- int *nz_count = Malloc(int,nr_class);
- model->nSV = Malloc(int,nr_class);
- for(i=0;i<nr_class;i++)
- {
- int nSV = 0;
- for(int j=0;j<count[i];j++)
- if(nonzero[start[i]+j])
- {
- ++nSV;
- ++total_sv;
- }
- model->nSV[i] = nSV;
- nz_count[i] = nSV;
- }
-
- info("Total nSV = %dn",total_sv);
- model->l = total_sv;
- model->SV = Malloc(svm_node *,total_sv);
- p = 0;
- for(i=0;i<l;i++)
- if(nonzero[i]) model->SV[p++] = x[i];
- int *nz_start = Malloc(int,nr_class);
- nz_start[0] = 0;
- for(i=1;i<nr_class;i++)
- nz_start[i] = nz_start[i-1]+nz_count[i-1];
- model->sv_coef = Malloc(double *,nr_class-1);
- for(i=0;i<nr_class-1;i++)
- model->sv_coef[i] = Malloc(double,total_sv);
- p = 0;
- for(i=0;i<nr_class;i++)
- for(int j=i+1;j<nr_class;j++)
- {
- // classifier (i,j): coefficients with
- // i are in sv_coef[j-1][nz_start[i]...],
- // j are in sv_coef[i][nz_start[j]...]
- int si = start[i];
- int sj = start[j];
- int ci = count[i];
- int cj = count[j];
-
- int q = nz_start[i];
- int k;
- for(k=0;k<ci;k++)
- if(nonzero[si+k])
- model->sv_coef[j-1][q++] = f[p].alpha[k];
- q = nz_start[j];
- for(k=0;k<cj;k++)
- if(nonzero[sj+k])
- model->sv_coef[i][q++] = f[p].alpha[ci+k];
- ++p;
- }
-
- free(label);
- free(count);
- free(index);
- free(start);
- free(x);
- free(weighted_C);
- free(nonzero);
- for(i=0;i<nr_class*(nr_class-1)/2;i++)
- free(f[i].alpha);
- free(f);
- free(nz_count);
- free(nz_start);
- }
- return model;
- }
- double svm_predict(const svm_model *model, const svm_node *x)
- {
- if(model->param.svm_type == ONE_CLASS ||
- model->param.svm_type == EPSILON_SVR ||
- model->param.svm_type == NU_SVR)
- {
- double *sv_coef = model->sv_coef[0];
- double sum = 0;
- for(int i=0;i<model->l;i++)
- sum += sv_coef[i] * Kernel::k_function(x,model->SV[i],model->param);
- sum -= model->rho[0];
- if(model->param.svm_type == ONE_CLASS)
- return (sum>0)?1:-1;
- else
- return sum;
- }
- else
- {
- int i;
- int nr_class = model->nr_class;
- int l = model->l;
-
- double *kvalue = Malloc(double,l);
- for(i=0;i<l;i++)
- kvalue[i] = Kernel::k_function(x,model->SV[i],model->param);
- int *start = Malloc(int,nr_class);
- start[0] = 0;
- for(i=1;i<nr_class;i++)
- start[i] = start[i-1]+model->nSV[i-1];
- int *vote = Malloc(int,nr_class);
- for(i=0;i<nr_class;i++)
- vote[i] = 0;
- int p=0;
- for(i=0;i<nr_class;i++)
- for(int j=i+1;j<nr_class;j++)
- {
- double sum = 0;
- int si = start[i];
- int sj = start[j];
- int ci = model->nSV[i];
- int cj = model->nSV[j];
-
- int k;
- double *coef1 = model->sv_coef[j-1];
- double *coef2 = model->sv_coef[i];
- for(k=0;k<ci;k++)
- sum += coef1[si+k] * kvalue[si+k];
- for(k=0;k<cj;k++)
- sum += coef2[sj+k] * kvalue[sj+k];
- sum -= model->rho[p++];
- if(sum > 0)
- ++vote[i];
- else
- ++vote[j];
- }
- int vote_max_idx = 0;
- for(i=1;i<nr_class;i++)
- if(vote[i] > vote[vote_max_idx])
- vote_max_idx = i;
- free(kvalue);
- free(start);
- free(vote);
- return model->label[vote_max_idx];
- }
- }
- const char *svm_type_table[] =
- {
- "c_svc","nu_svc","one_class","epsilon_svr","nu_svr",NULL
- };
- const char *kernel_type_table[]=
- {
- "linear","polynomial","rbf","sigmoid",NULL
- };
- int svm_save_model(const char *model_file_name, const svm_model *model)
- {
- FILE *fp = fopen(model_file_name,"w");
- if(fp==NULL) return -1;
- const svm_parameter& param = model->param;
- fprintf(fp,"svm_type %sn", svm_type_table[param.svm_type]);
- fprintf(fp,"kernel_type %sn", kernel_type_table[param.kernel_type]);
- if(param.kernel_type == POLY)
- fprintf(fp,"degree %gn", param.degree);
- if(param.kernel_type == POLY || param.kernel_type == RBF || param.kernel_type == SIGMOID)
- fprintf(fp,"gamma %gn", param.gamma);
- if(param.kernel_type == POLY || param.kernel_type == SIGMOID)
- fprintf(fp,"coef0 %gn", param.coef0);
- int nr_class = model->nr_class;
- int l = model->l;
- fprintf(fp, "nr_class %dn", nr_class);
- fprintf(fp, "total_sv %dn",l);
-
- {
- fprintf(fp, "rho");
- for(int i=0;i<nr_class*(nr_class-1)/2;i++)
- fprintf(fp," %g",model->rho[i]);
- fprintf(fp, "n");
- }
-
- if(model->label)
- {
- fprintf(fp, "label");
- for(int i=0;i<nr_class;i++)
- fprintf(fp," %d",model->label[i]);
- fprintf(fp, "n");
- }
- if(model->nSV)
- {
- fprintf(fp, "nr_sv");
- for(int i=0;i<nr_class;i++)
- fprintf(fp," %d",model->nSV[i]);
- fprintf(fp, "n");
- }
- fprintf(fp, "SVn");
- const double * const *sv_coef = model->sv_coef;
- const svm_node * const *SV = model->SV;
- for(int i=0;i<l;i++)
- {
- for(int j=0;j<nr_class-1;j++)
- fprintf(fp, "%.16g ",sv_coef[j][i]);
- const svm_node *p = SV[i];
- while(p->index != -1)
- {
- fprintf(fp,"%d:%.8g ",p->index,p->value);
- p++;
- }
- fprintf(fp, "n");
- }
- fclose(fp);
- return 0;
- }
- svm_model *svm_load_model(const char *model_file_name)
- {
- FILE *fp = fopen(model_file_name,"rb");
- if(fp==NULL) return NULL;
-
- // read parameters
- svm_model *model = (svm_model *)malloc(sizeof(svm_model));
- svm_parameter& param = model->param;
- model->label = NULL;
- model->nSV = NULL;
- char cmd[81];
- while(1)
- {
- fscanf(fp,"%80s",cmd);
- if(strcmp(cmd,"svm_type")==0)
- {
- fscanf(fp,"%80s",cmd);
- int i;
- for(i=0;svm_type_table[i];i++)
- {
- if(strcmp(svm_type_table[i],cmd)==0)
- {
- param.svm_type=i;
- break;
- }
- }
- if(svm_type_table[i] == NULL)
- {
- fprintf(stderr,"unknown svm type.n");
- exit(1);
- }
- }
- else if(strcmp(cmd,"kernel_type")==0)
- {
- fscanf(fp,"%80s",cmd);
- int i;
- for(i=0;kernel_type_table[i];i++)
- {
- if(strcmp(kernel_type_table[i],cmd)==0)
- {
- param.kernel_type=i;
- break;
- }
- }
- if(kernel_type_table[i] == NULL)
- {
- fprintf(stderr,"unknown kernel function.n");
- exit(1);
- }
- }
- else if(strcmp(cmd,"degree")==0)
- fscanf(fp,"%lf",¶m.degree);
- else if(strcmp(cmd,"gamma")==0)
- fscanf(fp,"%lf",¶m.gamma);
- else if(strcmp(cmd,"coef0")==0)
- fscanf(fp,"%lf",¶m.coef0);
- else if(strcmp(cmd,"nr_class")==0)
- fscanf(fp,"%d",&model->nr_class);
- else if(strcmp(cmd,"total_sv")==0)
- fscanf(fp,"%d",&model->l);
- else if(strcmp(cmd,"rho")==0)
- {
- int n = model->nr_class * (model->nr_class-1)/2;
- model->rho = Malloc(double,n);
- for(int i=0;i<n;i++)
- fscanf(fp,"%lf",&model->rho[i]);
- }
- else if(strcmp(cmd,"label")==0)
- {
- int n = model->nr_class;
- model->label = Malloc(int,n);
- for(int i=0;i<n;i++)
- fscanf(fp,"%d",&model->label[i]);
- }
- else if(strcmp(cmd,"nr_sv")==0)
- {
- int n = model->nr_class;
- model->nSV = Malloc(int,n);
- for(int i=0;i<n;i++)
- fscanf(fp,"%d",&model->nSV[i]);
- }
- else if(strcmp(cmd,"SV")==0)
- {
- while(1)
- {
- int c = getc(fp);
- if(c==EOF || c=='n') break;
- }
- break;
- }
- else
- {
- fprintf(stderr,"unknown text in model filen");
- exit(1);
- }
- }
- // read sv_coef and SV
- int elements = 0;
- long pos = ftell(fp);
- while(1)
- {
- int c = fgetc(fp);
- switch(c)
- {
- case 'n':
- // count the '-1' element
- case ':':
- ++elements;
- break;
- case EOF:
- goto out;
- default:
- ;
- }
- }
- out:
- fseek(fp,pos,SEEK_SET);
- int m = model->nr_class - 1;
- int l = model->l;
- model->sv_coef = Malloc(double *,m);
- int i;
- for(i=0;i<m;i++)
- model->sv_coef[i] = Malloc(double,l);
- model->SV = Malloc(svm_node*,l);
- svm_node *x_space = Malloc(svm_node,elements);
- int j=0;
- for(i=0;i<l;i++)
- {
- model->SV[i] = &x_space[j];
- for(int k=0;k<m;k++)
- fscanf(fp,"%lf",&model->sv_coef[k][i]);
- while(1)
- {
- int c;
- do {
- c = getc(fp);
- if(c=='n') goto out2;
- } while(isspace(c));
- ungetc(c,fp);
- fscanf(fp,"%d:%lf",&(x_space[j].index),&(x_space[j].value));
- ++j;
- }
- out2:
- x_space[j++].index = -1;
- }
- fclose(fp);
- model->free_sv = 1; // XXX
- return model;
- }
- void svm_destroy_model(svm_model* model)
- {
- if(model->free_sv)
- free((void *)(model->SV[0]));
- for(int i=0;i<model->nr_class-1;i++)
- free(model->sv_coef[i]);
- free(model->SV);
- free(model->sv_coef);
- free(model->rho);
- free(model->label);
- free(model->nSV);
- free(model);
- }