📄 solver.cs
字号:
if (y[i] < 0)
ub = Math.Min(ub, yG);
else
lb = Math.Max(lb, yG);
}
else
{
++nr_free;
sum_free += yG;
}
}
if (nr_free > 0)
r = sum_free / nr_free;
else
r = (ub + lb) / 2;
return r;
}
}
//
// Solver for nu-svm classification and regression
//
// additional constraint: e^T \alpha = constant
//
sealed class Solver_NU : Solver
{
private SolutionInfo si;
public override void Solve(int l, QMatrix Q, double[] p, short[] y,
double[] alpha, double Cp, double Cn, double eps,
SolutionInfo si, bool shrinking)
{
this.si = si;
base.Solve(l, Q, p, y, alpha, Cp, Cn, eps, si, shrinking);
}
// return 1 if already optimal, return 0 otherwise
protected override int select_working_set(int[] working_set)
{
// return i,j such that y_i = y_j and
// i: maximizes -y_i * grad(f)_i, i in I_up(\alpha)
// j: minimizes the decrease of obj value
// (if quadratic coefficeint <= 0, replace it with tau)
// -y_j*grad(f)_j < -y_i*grad(f)_i, j in I_low(\alpha)
double Gmaxp = -INF;
double Gmaxp2 = -INF;
int Gmaxp_idx = -1;
double Gmaxn = -INF;
double Gmaxn2 = -INF;
int Gmaxn_idx = -1;
int Gmin_idx = -1;
double obj_diff_min = INF;
for (int t = 0; t < active_size; t++)
if (y[t] == +1)
{
if (!is_upper_bound(t))
if (-G[t] >= Gmaxp)
{
Gmaxp = -G[t];
Gmaxp_idx = t;
}
}
else
{
if (!is_lower_bound(t))
if (G[t] >= Gmaxn)
{
Gmaxn = G[t];
Gmaxn_idx = t;
}
}
int ip = Gmaxp_idx;
int iN = Gmaxn_idx;
float[] Q_ip = null;
float[] Q_in = null;
if (ip != -1) // null Q_ip not accessed: Gmaxp=-INF if ip=-1
Q_ip = Q.get_Q(ip, active_size);
if (iN != -1)
Q_in = Q.get_Q(iN, active_size);
for (int j = 0; j < active_size; j++)
{
if (y[j] == +1)
{
if (!is_lower_bound(j))
{
double grad_diff = Gmaxp + G[j];
if (G[j] >= Gmaxp2)
Gmaxp2 = G[j];
if (grad_diff > 0)
{
double obj_diff;
double quad_coef = Q_ip[ip] + QD[j] - 2 * Q_ip[j];
if (quad_coef > 0)
obj_diff = -(grad_diff * grad_diff) / quad_coef;
else
obj_diff = -(grad_diff * grad_diff) / 1e-12;
if (obj_diff <= obj_diff_min)
{
Gmin_idx = j;
obj_diff_min = obj_diff;
}
}
}
}
else
{
if (!is_upper_bound(j))
{
double grad_diff = Gmaxn - G[j];
if (-G[j] >= Gmaxn2)
Gmaxn2 = -G[j];
if (grad_diff > 0)
{
double obj_diff;
double quad_coef = Q_in[iN] + QD[j] - 2 * Q_in[j];
if (quad_coef > 0)
obj_diff = -(grad_diff * grad_diff) / quad_coef;
else
obj_diff = -(grad_diff * grad_diff) / 1e-12;
if (obj_diff <= obj_diff_min)
{
Gmin_idx = j;
obj_diff_min = obj_diff;
}
}
}
}
}
if (Math.Max(Gmaxp + Gmaxp2, Gmaxn + Gmaxn2) < eps)
return 1;
if (y[Gmin_idx] == +1)
working_set[0] = Gmaxp_idx;
else
working_set[0] = Gmaxn_idx;
working_set[1] = Gmin_idx;
return 0;
}
private bool be_shrunken(int i, double Gmax1, double Gmax2, double Gmax3, double Gmax4)
{
if (is_upper_bound(i))
{
if (y[i] == +1)
return (-G[i] > Gmax1);
else
return (-G[i] > Gmax4);
}
else if (is_lower_bound(i))
{
if (y[i] == +1)
return (G[i] > Gmax2);
else
return (G[i] > Gmax3);
}
else
return (false);
}
protected override void do_shrinking()
{
double Gmax1 = -INF; // max { -y_i * grad(f)_i | y_i = +1, i in I_up(\alpha) }
double Gmax2 = -INF; // max { y_i * grad(f)_i | y_i = +1, i in I_low(\alpha) }
double Gmax3 = -INF; // max { -y_i * grad(f)_i | y_i = -1, i in I_up(\alpha) }
double Gmax4 = -INF; // max { y_i * grad(f)_i | y_i = -1, i in I_low(\alpha) }
// find maximal violating pair first
int i;
for (i = 0; i < active_size; i++)
{
if (!is_upper_bound(i))
{
if (y[i] == +1)
{
if (-G[i] > Gmax1) Gmax1 = -G[i];
}
else if (-G[i] > Gmax4) Gmax4 = -G[i];
}
if (!is_lower_bound(i))
{
if (y[i] == +1)
{
if (G[i] > Gmax2) Gmax2 = G[i];
}
else if (G[i] > Gmax3) Gmax3 = G[i];
}
}
// shrinking
for (i = 0; i < active_size; i++)
if (be_shrunken(i, Gmax1, Gmax2, Gmax3, Gmax4))
{
active_size--;
while (active_size > i)
{
if (!be_shrunken(active_size, Gmax1, Gmax2, Gmax3, Gmax4))
{
swap_index(i, active_size);
break;
}
active_size--;
}
}
if (unshrinked || Math.Max(Gmax1 + Gmax2, Gmax3 + Gmax4) > eps * 10) return;
unshrinked = true;
reconstruct_gradient();
for (i = l - 1; i >= active_size; i--)
if (!be_shrunken(i, Gmax1, Gmax2, Gmax3, Gmax4))
{
while (active_size < i)
{
if (be_shrunken(active_size, Gmax1, Gmax2, Gmax3, Gmax4))
{
swap_index(i, active_size);
break;
}
active_size++;
}
active_size++;
}
}
protected override double calculate_rho()
{
int nr_free1 = 0, nr_free2 = 0;
double ub1 = INF, ub2 = INF;
double lb1 = -INF, lb2 = -INF;
double sum_free1 = 0, sum_free2 = 0;
for (int i = 0; i < active_size; i++)
{
if (y[i] == +1)
{
if (is_lower_bound(i))
ub1 = Math.Min(ub1, G[i]);
else if (is_upper_bound(i))
lb1 = Math.Max(lb1, G[i]);
else
{
++nr_free1;
sum_free1 += G[i];
}
}
else
{
if (is_lower_bound(i))
ub2 = Math.Min(ub2, G[i]);
else if (is_upper_bound(i))
lb2 = Math.Max(lb2, G[i]);
else
{
++nr_free2;
sum_free2 += G[i];
}
}
}
double r1, r2;
if (nr_free1 > 0)
r1 = sum_free1 / nr_free1;
else
r1 = (ub1 + lb1) / 2;
if (nr_free2 > 0)
r2 = sum_free2 / nr_free2;
else
r2 = (ub2 + lb2) / 2;
si.r = (r1 + r2) / 2;
return (r1 - r2) / 2;
}
}
//
// Q matrices for various formulations
//
class SVC_Q : Kernel
{
private short[] y;
private Cache cache;
private float[] QD;
public SVC_Q(Problem prob, Parameter param, short[] y_) : base(prob.Count, prob.X, param)
{
y = (short[])y_.Clone();
cache = new Cache(prob.Count, (long)(param.CacheSize * (1 << 20)));
QD = new float[prob.Count];
for (int i = 0; i < prob.Count; i++)
QD[i] = (float)kernel_function(i, i);
}
public override float[] get_Q(int i, int len)
{
float[][] data = new float[1][];
int start;
if ((start = cache.get_data(i, data, len)) < len)
{
for (int j = start; j < len; j++)
data[0][j] = (float)(y[i] * y[j] * kernel_function(i, j));
}
return data[0];
}
public override float[] get_QD()
{
return QD;
}
public override void swap_index(int i, int j)
{
cache.swap_index(i, j);
base.swap_index(i, j);
do { short _ = y[i]; y[i] = y[j]; y[j] = _; } while (false);
do { float _ = QD[i]; QD[i] = QD[j]; QD[j] = _; } while (false);
}
}
class ONE_CLASS_Q : Kernel
{
private Cache cache;
private float[] QD;
public ONE_CLASS_Q(Problem prob, Parameter param) : base(prob.Count, prob.X, param)
{
cache = new Cache(prob.Count, (long)(param.CacheSize * (1 << 20)));
QD = new float[prob.Count];
for (int i = 0; i < prob.Count; i++)
QD[i] = (float)kernel_function(i, i);
}
public override float[] get_Q(int i, int len)
{
float[][] data = new float[1][];
int start;
if ((start = cache.get_data(i, data, len)) < len)
{
for (int j = start; j < len; j++)
data[0][j] = (float)kernel_function(i, j);
}
return data[0];
}
public override float[] get_QD()
{
return QD;
}
public override void swap_index(int i, int j)
{
cache.swap_index(i, j);
base.swap_index(i, j);
do { float _ = QD[i]; QD[i] = QD[j]; QD[j] = _; } while (false);
}
}
class SVR_Q : Kernel
{
private int l;
private Cache cache;
private short[] sign;
private int[] index;
private int next_buffer;
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -