Merged
8 changes: 8 additions & 0 deletions CMakeLists.txt
@@ -69,6 +69,10 @@ add_executable(HierarchicalClustering tests/clustering/HierarchicalClusteringTes
target_compile_definitions(HierarchicalClustering PRIVATE TEST_HIERARCHICAL_CLUSTERING)
target_link_libraries(HierarchicalClustering cpp_ml_library)

add_executable(SupportVectorRegression tests/regression/SupportVectorRegressionTest.cpp)
target_compile_definitions(SupportVectorRegression PRIVATE TEST_SUPPORT_VECTOR_REGRESSION)
target_link_libraries(SupportVectorRegression cpp_ml_library)

# Register individual tests
add_test(NAME LogisticRegressionTest COMMAND LogisticRegressionTest)
add_test(NAME PolynomialRegressionTest COMMAND PolynomialRegressionTest)
@@ -81,6 +85,8 @@ add_test(NAME KMeansClustering COMMAND KMeansClustering)
add_test(NAME KNNClassifier COMMAND KNNClassifier)
add_test(NAME KNNRegressor COMMAND KNNRegressor)
add_test(NAME HierarchicalClustering COMMAND HierarchicalClustering)
add_test(NAME SupportVectorRegression COMMAND SupportVectorRegression)



# Add example executables if BUILD_EXAMPLES is ON
@@ -116,6 +122,8 @@ if(BUILD_EXAMPLES)
target_compile_definitions(${EXAMPLE_TARGET} PRIVATE TEST_KNN_REGRESSOR)
elseif(EXAMPLE_NAME STREQUAL "HierarchicalClusteringExample")
target_compile_definitions(${EXAMPLE_TARGET} PRIVATE TEST_HIERARCHICAL_CLUSTERING)
elseif(EXAMPLE_NAME STREQUAL "SupportVectorRegressionExample")
target_compile_definitions(${EXAMPLE_TARGET} PRIVATE TEST_SUPPORT_VECTOR_REGRESSION)
endif()
endforeach()
endif()
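With the new target and test registered above, the SVR suite can be run on its own after a standard CMake configure-and-build, e.g. ctest -R SupportVectorRegression from the build directory.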
8 changes: 4 additions & 4 deletions README.md
@@ -63,17 +63,17 @@ The following machine learning algorithms are planned, inspired by concepts and
- [x] Logistic Regression
- [x] Decision Tree Regression
- [x] Random Forest Regression
- [ ] K-Nearest Neighbors
- [x] K-Nearest Neighbors


2. **Classification**
- [x] Decision Tree Classifier
- [x] Random Forest Classifier
- [ ] K-Nearest Neighbors
- [x] K-Nearest Neighbors

3. **Clustering**
- [ ] K-Means Clustering
- [ ] Hierarchical clustering
- [x] K-Means Clustering
- [x] Hierarchical clustering

4. **Neural Networks**
- [ ] Neural Network (NN)
39 changes: 39 additions & 0 deletions examples/SupportVectorRegressionExample.cpp
@@ -0,0 +1,39 @@
#include "../ml_library_include/ml/regression/SupportVectorRegression.hpp"
#include <iostream>
#include <vector>

int testSupportVectorRegression() {
// Training data
std::vector<std::vector<double>> X_train = {
{1.0},
{2.0},
{3.0},
{4.0},
{5.0}
};
std::vector<double> y_train = {1.5, 2.0, 2.5, 3.0, 3.5};

// Test data
std::vector<std::vector<double>> X_test = {
{1.5},
{2.5},
{3.5}
};

// Create and train the model
SupportVectorRegression svr(1.0, 0.1, SupportVectorRegression::KernelType::RBF, 3, 0.1);
svr.fit(X_train, y_train);

// Make predictions
std::vector<double> predictions = svr.predict(X_test);

// Output predictions
for (size_t i = 0; i < predictions.size(); ++i) {
std::cout << "Sample " << i << " predicted value: " << predictions[i] << std::endl;
}

return 0;
}

int main() {
    return testSupportVectorRegression();
}
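When the project is configured with BUILD_EXAMPLES set to ON, this file is built by the example loop shown in the CMakeLists.txt changes above as the SupportVectorRegressionExample target, with TEST_SUPPORT_VECTOR_REGRESSION defined.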
299 changes: 299 additions & 0 deletions ml_library_include/ml/regression/SupportVectorRegression.hpp
@@ -0,0 +1,299 @@
#ifndef SUPPORT_VECTOR_REGRESSION_HPP
#define SUPPORT_VECTOR_REGRESSION_HPP

#include <vector>
#include <cmath>
#include <algorithm>
#include <functional>
#include <numeric>
#include <random>
#include <cassert>

/**
* @file SupportVectorRegression.hpp
 * @brief Implementation of Support Vector Regression (SVR) trained with a simplified SMO-style optimizer.
*/

/**
* @class SupportVectorRegression
* @brief Support Vector Regression using the ε-insensitive loss function.
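 *
 * The fitted model has the form f(x) = sum_i (alpha_i - alpha*_i) K(x_i, x) + b;
 * training minimizes the epsilon-insensitive loss max(0, |y - f(x)| - epsilon)
 * subject to the box constraints 0 <= alpha_i, alpha*_i <= C.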
*/
class SupportVectorRegression {
public:
/**
* @brief Kernel function types.
*/
enum class KernelType {
    LINEAR,      ///< K(x1, x2) = x1 . x2
    POLYNOMIAL,  ///< K(x1, x2) = (gamma * (x1 . x2) + coef0)^degree
    RBF          ///< K(x1, x2) = exp(-gamma * ||x1 - x2||^2)
};

/**
* @brief Constructs a SupportVectorRegression model.
* @param C Regularization parameter.
* @param epsilon Epsilon parameter in the ε-insensitive loss function.
* @param kernel_type Type of kernel function to use.
* @param degree Degree for polynomial kernel.
* @param gamma Gamma parameter for RBF kernel.
* @param coef0 Independent term in polynomial kernel.
*/
SupportVectorRegression(double C = 1.0, double epsilon = 0.1, KernelType kernel_type = KernelType::RBF,
int degree = 3, double gamma = 1.0, double coef0 = 0.0);

/**
* @brief Destructor for SupportVectorRegression.
*/
~SupportVectorRegression();

/**
* @brief Fits the SVR model to the training data.
* @param X A vector of feature vectors (training data).
* @param y A vector of target values (training labels).
*/
void fit(const std::vector<std::vector<double>>& X, const std::vector<double>& y);

/**
* @brief Predicts target values for the given input data.
* @param X A vector of feature vectors (test data).
* @return A vector of predicted target values.
*/
std::vector<double> predict(const std::vector<std::vector<double>>& X) const;

private:
double C; ///< Regularization parameter.
double epsilon; ///< Epsilon in the ε-insensitive loss function.
KernelType kernel_type; ///< Type of kernel function.
int degree; ///< Degree for polynomial kernel.
double gamma; ///< Gamma parameter for RBF kernel.
double coef0; ///< Independent term in polynomial kernel.

std::vector<std::vector<double>> X_train; ///< Training data features.
std::vector<double> y_train; ///< Training data target values.
std::vector<double> alpha; ///< Lagrange multipliers for positive errors.
std::vector<double> alpha_star; ///< Lagrange multipliers for negative errors.
double b; ///< Bias term.

std::function<double(const std::vector<double>&, const std::vector<double>&)> kernel; ///< Kernel function.

/**
* @brief Initializes the kernel function based on the kernel type.
*/
void initialize_kernel();

/**
* @brief Solves the dual optimization problem using SMO.
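 * This is a simplified SMO variant: pairs are optimized jointly through the
 * net coefficients alpha - alpha*, the second index is chosen at random, and
 * iteration stops after max_passes sweeps with no multiplier changes.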
*/
void solve();

/**
* @brief Computes the output for a single sample.
* @param x The feature vector of the sample.
* @return The predicted target value.
*/
double predict_sample(const std::vector<double>& x) const;

/**
* @brief Computes the kernel value between two samples.
* @param x1 The first feature vector.
* @param x2 The second feature vector.
* @return The kernel value.
*/
double compute_kernel(const std::vector<double>& x1, const std::vector<double>& x2) const;

/**
* @brief Random number generator.
*/
std::mt19937 rng;

/**
* @brief Error cache for SMO algorithm.
*/
std::vector<double> errors;

/**
* @brief Initialize error cache.
*/
void initialize_errors();

/**
* @brief Update error cache for a given index.
* @param i Index of the sample.
*/
void update_error(size_t i);

/**
* @brief Select second index j for SMO algorithm.
* @param i First index.
* @return Second index j.
*/
size_t select_second_index(size_t i);
};

SupportVectorRegression::SupportVectorRegression(double C, double epsilon, KernelType kernel_type,
int degree, double gamma, double coef0)
: C(C), epsilon(epsilon), kernel_type(kernel_type), degree(degree), gamma(gamma), coef0(coef0), b(0.0) {
initialize_kernel();
rng.seed(std::random_device{}());
}

SupportVectorRegression::~SupportVectorRegression() {}

void SupportVectorRegression::initialize_kernel() {
if (kernel_type == KernelType::LINEAR) {
kernel = [](const std::vector<double>& x1, const std::vector<double>& x2) {
return std::inner_product(x1.begin(), x1.end(), x2.begin(), 0.0);
};
} else if (kernel_type == KernelType::POLYNOMIAL) {
kernel = [this](const std::vector<double>& x1, const std::vector<double>& x2) {
return std::pow(gamma * std::inner_product(x1.begin(), x1.end(), x2.begin(), 0.0) + coef0, degree);
};
} else if (kernel_type == KernelType::RBF) {
kernel = [this](const std::vector<double>& x1, const std::vector<double>& x2) {
double sum = 0.0;
for (size_t i = 0; i < x1.size(); ++i) {
double diff = x1[i] - x2[i];
sum += diff * diff;
}
return std::exp(-gamma * sum);
};
}
}

void SupportVectorRegression::fit(const std::vector<std::vector<double>>& X, const std::vector<double>& y) {
    assert(X.size() == y.size() && "X and y must contain the same number of samples");
    X_train = X;
    y_train = y;
size_t n_samples = X_train.size();

alpha.resize(n_samples, 0.0);
alpha_star.resize(n_samples, 0.0);

initialize_errors();

solve();
}

std::vector<double> SupportVectorRegression::predict(const std::vector<std::vector<double>>& X) const {
std::vector<double> predictions;
predictions.reserve(X.size());
for (const auto& x : X) {
predictions.push_back(predict_sample(x));
}
return predictions;
}

void SupportVectorRegression::initialize_errors() {
size_t n_samples = X_train.size();
errors.resize(n_samples);
for (size_t i = 0; i < n_samples; ++i) {
errors[i] = predict_sample(X_train[i]) - y_train[i];
}
}

double SupportVectorRegression::predict_sample(const std::vector<double>& x) const {
double result = b;
size_t n_samples = X_train.size();
for (size_t i = 0; i < n_samples; ++i) {
double coeff = alpha[i] - alpha_star[i];
if (std::abs(coeff) > 1e-8) {
result += coeff * compute_kernel(X_train[i], x);
}
}
return result;
}

double SupportVectorRegression::compute_kernel(const std::vector<double>& x1, const std::vector<double>& x2) const {
return kernel(x1, x2);
}

void SupportVectorRegression::update_error(size_t i) {
errors[i] = predict_sample(X_train[i]) - y_train[i];
}

size_t SupportVectorRegression::select_second_index(size_t i) {
    size_t n_samples = X_train.size();
    if (n_samples < 2) {
        return i; // degenerate case; the caller skips pairs with zero curvature
    }
    std::uniform_int_distribution<size_t> dist(0, n_samples - 1);
    size_t j = dist(rng);
    while (j == i) {
        j = dist(rng);
    }
    return j;
}

void SupportVectorRegression::solve() {
    size_t n_samples = X_train.size();
    const size_t max_passes = 5;
    const double tol = 1e-3;
    size_t passes = 0;

    // The pair (i, j) is updated through the net coefficients
    // beta_k = alpha[k] - alpha_star[k]; keeping beta_i + beta_j constant
    // preserves the equality constraint sum_k beta_k = 0.
    auto beta = [this](size_t k) { return alpha[k] - alpha_star[k]; };
    auto set_beta = [this](size_t k, double value) {
        alpha[k] = std::max(value, 0.0);
        alpha_star[k] = std::max(-value, 0.0);
    };

    while (passes < max_passes) {
        size_t num_changed_alphas = 0;
        for (size_t i = 0; i < n_samples; ++i) {
            // Recompute the error for i directly; cached entries go stale
            // whenever b or another coefficient moves.
            double E_i = predict_sample(X_train[i]) - y_train[i];
            errors[i] = E_i;
            double beta_i = beta(i);

            // KKT violation: the sample lies outside the epsilon-tube while
            // its coefficient is not at a bound, or it lies strictly inside
            // the tube while still carrying a nonzero coefficient.
            bool violates_KKT = ((E_i < -epsilon - tol) && (beta_i < C)) ||
                                ((E_i > epsilon + tol) && (beta_i > -C)) ||
                                ((std::abs(E_i) < epsilon - tol) && (std::abs(beta_i) > 1e-12));

            if (!violates_KKT)
                continue;

            size_t j = select_second_index(i);
            double E_j = predict_sample(X_train[j]) - y_train[j];
            errors[j] = E_j;
            double beta_j = beta(j);

            // eta is the curvature of the dual objective along the update
            // direction; skip degenerate pairs (including j == i).
            double K_ii = compute_kernel(X_train[i], X_train[i]);
            double K_jj = compute_kernel(X_train[j], X_train[j]);
            double K_ij = compute_kernel(X_train[i], X_train[j]);
            double eta = K_ii + K_jj - 2 * K_ij;

            if (eta <= 0)
                continue;

            // Unconstrained optimum step for beta_i (beta_j moves by the
            // opposite amount), clipped so both coefficients stay in [-C, C].
            double step = -(E_i - E_j) / eta;
            double low = std::max(-C - beta_i, beta_j - C);
            double high = std::min(C - beta_i, beta_j + C);
            step = std::min(high, std::max(low, step));

            if (std::abs(step) < 1e-12)
                continue;

            set_beta(i, beta_i + step);
            set_beta(j, beta_j - step);

            // Update the threshold b so that whichever sample keeps an
            // interior coefficient sits exactly on the tube boundary.
            double b1 = b - E_i - step * (K_ii - K_ij);
            double b2 = b - E_j - step * (K_ij - K_jj);

            if ((alpha[i] > 0 && alpha[i] < C) || (alpha_star[i] > 0 && alpha_star[i] < C))
                b = b1;
            else if ((alpha[j] > 0 && alpha[j] < C) || (alpha_star[j] > 0 && alpha_star[j] < C))
                b = b2;
            else
                b = (b1 + b2) / 2.0;

            // Refresh the error cache for the two samples that moved.
            update_error(i);
            update_error(j);

            num_changed_alphas++;
        }

        if (num_changed_alphas == 0)
            passes++;
        else
            passes = 0;
    }
}

#endif // SUPPORT_VECTOR_REGRESSION_HPP
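
For a quick sanity check of the LINEAR kernel path, a minimal sketch along the lines of the example above (the include path is assumed relative to the repository root; the expected values are illustrative, not verified output of this code):

#include "ml_library_include/ml/regression/SupportVectorRegression.hpp"
#include <iostream>
#include <vector>

int main() {
    // Noise-free points on y = 2x; a linear kernel should track this closely.
    std::vector<std::vector<double>> X = {{1.0}, {2.0}, {3.0}, {4.0}};
    std::vector<double> y = {2.0, 4.0, 6.0, 8.0};

    // C, epsilon, kernel type; degree, gamma, and coef0 are ignored by the
    // LINEAR kernel in this implementation.
    SupportVectorRegression svr(10.0, 0.01, SupportVectorRegression::KernelType::LINEAR);
    svr.fit(X, y);

    // Predictions should land near 5.0 and 10.0 if training succeeds.
    for (double p : svr.predict({{2.5}, {5.0}}))
        std::cout << p << "\n";
    return 0;
}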