/// <summary>
/// Computes the raw decision value for the given example, i.e. the signed
/// distance from the separating hyperplane (a positive value indicates the True class).
/// </summary>
/// <param name="x">The feature vector to evaluate.</param>
/// <returns>The raw (unbounded) decision value.</returns>
public double PredictRaw(Vector x)
{
    var prediction = 0d;
    Preprocess(x);

    if (KernelFunction.IsLinear)
    {
        // linear kernel: use the precomputed weight vector directly
        prediction = Theta.Dot(x) + Bias;
    }
    else
    {
        // non-linear kernel: expand over the stored support vectors
        for (var j = 0; j < X.Rows; j++)
        {
            prediction = prediction + Alpha[j] * Y[j] * KernelFunction.Compute(X[j, VectorType.Row], x);
        }

        prediction += Bias;
    }

    return prediction;
}
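// Note (sketch, not part of the library API): the value computed above is the raw SVM
// decision function f(x) = sum_j Alpha[j] * Y[j] * K(X[j], x) + Bias. A caller that wants a
// boolean label, or a rough (0, 1) score, could post-process the raw value along these lines;
// "model" and "x" are hypothetical locals and the sigmoid squash is an ad-hoc choice for
// illustration, not a calibrated probability:
//
//     var raw = model.PredictRaw(x);
//     var label = raw >= 0d;                              // sign of the margin gives the class
//     var score = 1d / (1d + System.Math.Exp(-raw));      // ad-hoc squash into (0, 1)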
/// <summary>Generates an SVM model based on a set of examples.</summary>
/// <param name="X">The Matrix of training examples (one example per row).</param>
/// <param name="y">The Vector of labels; 1 is treated as the True class, everything else as False.</param>
/// <returns>The trained Model.</returns>
public override IModel Generate(Matrix X, Vector y)
{
    Preprocess(X);

    // expect truth = 1 and false = -1
    y = y.ToBinary(k => k == 1d, falseValue: -1.0);

    // initialise variables
    int m = X.Rows, n = X.Cols, i = -1, j = -1;
    var iterations = 0;

    Vector gradient = Vector.Zeros(m), alpha = Vector.Zeros(m);

    // precompute kernel matrix (using similarity function)
    var K = KernelFunction.Compute(X);

    // synchronise SVM parameters with the working set selection function
    SelectionFunction.Bias = Bias;
    SelectionFunction.C = C;
    SelectionFunction.Epsilon = Epsilon;
    SelectionFunction.K = K;
    SelectionFunction.Y = y;

    var finalise = false;

    SelectionFunction.Initialize(alpha, gradient);

    while (finalise == false && iterations < MaxIterations)
    {
        var changes = 0;

        #region Training

        for (var p = 0; p < m; p++)
        {
            // get a new working set selection using the heuristic function
            var newPair = SelectionFunction.GetWorkingSet(i, j, gradient, alpha);

            // check for a valid (i, j) pair
            if (newPair.Item1 >= 0 && newPair.Item2 >= 0 && newPair.Item1 != newPair.Item2)
            {
                i = newPair.Item1;
                j = newPair.Item2;

                // compute the new gradient (prediction error) for i
                gradient[i] = Bias + (alpha * y * K[i, VectorType.Col]).Sum() - y[i];

                // skip i if it does not violate the KKT conditions
                if ((!(y[i] * gradient[i] < -Epsilon) || !(alpha[i] < C)) &&
                    (!(y[i] * gradient[i] > Epsilon) || !(alpha[i] > 0)))
                {
                    continue;
                }

                // compute the new gradient (prediction error) for j
                gradient[j] = Bias + (alpha * y * K[j, VectorType.Col]).Sum() - y[j];

                // store temporary working copies of alpha for both indices (i, j)
                var tempAI = alpha[i];
                var tempAJ = alpha[j];

                // update the lower and upper bounds of the lagrange multipliers
                double lagHigh;
                double lagLow;
                if (y[i] == y[j])
                {
                    // pair is in the same class, don't apply the large margin
                    lagLow = System.Math.Max(0.0, alpha[j] + alpha[i] - C);
                    lagHigh = System.Math.Min(C, alpha[j] + alpha[i]);
                }
                else
                {
                    // pair is not in the same class, apply the large margin
                    lagLow = System.Math.Max(0.0, alpha[j] - alpha[i]);
                    lagHigh = System.Math.Min(C, C + alpha[j] - alpha[i]);
                }

                // if the lagrange bounds coincide there is nothing to optimise, so get a new working set
                if (lagLow == lagHigh)
                {
                    continue;
                }

                // compute the cost (the second derivative of the objective along the constraint line);
                // only a negative cost permits a valid update, otherwise skip this pair
                var cost = 2.0 * K[i, j] - K[i, i] - K[j, j];
                if (cost < 0.0)
                {
                    // update alpha of (j) w.r.t. the relative cost difference of the i-th and j-th gradients
                    alpha[j] = alpha[j] - y[j] * (gradient[i] - gradient[j]) / cost;

                    // clip alpha to the lagrange bounds
                    alpha[j] = System.Math.Min(lagHigh, alpha[j]);
                    alpha[j] = System.Math.Max(lagLow, alpha[j]);

                    // check the alpha tolerance factor
                    if (System.Math.Abs(alpha[j] - tempAJ) < Epsilon)
                    {
                        // we're optimising large margins so skip small ones
                        alpha[j] = tempAJ;
                        continue;
                    }

                    // update alpha of i if we have a large margin w.r.t. alpha of (j)
                    alpha[i] = alpha[i] + y[i] * y[j] * (tempAJ - alpha[j]);

                    // precompute i, j into the feasible region for Bias
                    var yBeta = (alpha[i] - tempAI) * K[i, j] - y[j] * (alpha[j] - tempAJ);

                    // store temporary bias candidates using the gradients of the (i, j) pair
                    var beta_i = Bias - gradient[i] - y[i] * yBeta * K[i, j];
                    var beta_j = Bias - gradient[j] - y[i] * yBeta * K[j, j];

                    // update the bias using the constrained alpha limits (0 < alpha < C)
                    if (0.0 < alpha[i] && alpha[i] < C)
                    {
                        Bias = beta_i;
                    }
                    else if (0.0 < alpha[j] && alpha[j] < C)
                    {
                        Bias = beta_j;
                    }
                    else
                    {
                        Bias = (beta_i + beta_j) / 2.0;
                    }

                    changes++;
                }
            }
            else if (newPair.Item1 == -1 || newPair.Item2 == -1)
            {
                // unable to find a suitable sub-problem (j) to optimise
                finalise = true;
                break;
            }
        }

        if (changes == 0)
        {
            iterations++;
        }
        else
        {
            iterations = 0;
        }

        #endregion
    }

    // keep only the supporting examples (support vectors),
    // i.e. those where alpha is positive
    var fitness = (alpha > 0d).ToArray();

    // return the initialised model
    return new SVMModel
    {
        Descriptor = Descriptor,
        FeatureNormalizer = FeatureNormalizer,
        FeatureProperties = FeatureProperties,
        Theta = (alpha * y * X).ToVector(),
        Alpha = alpha.Slice(fitness),
        Bias = Bias,
        X = X.Slice(fitness, VectorType.Row),
        Y = y.Slice(fitness),
        KernelFunction = KernelFunction
    };
}
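// Usage sketch (hypothetical caller code, not part of this file): shows how the generator
// above and PredictRaw might be wired together. The class name "SVMGenerator", the kernel
// type "LinearKernel" and the data variables are assumptions for illustration only.
//
//     var generator = new SVMGenerator
//     {
//         C = 1.0,
//         Epsilon = 1e-3,
//         MaxIterations = 100,
//         KernelFunction = new LinearKernel()
//     };
//
//     var model = (SVMModel)generator.Generate(trainX, trainY);  // trainY uses 1 for the True class
//     var raw = model.PredictRaw(testX[0, VectorType.Row]);      // positive raw value => True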