summary | refs | log | tree | commit | diff | stats
path: root/ml/KMeans.h
diff options
context:
space:
mode:
Diffstat (limited to 'ml/KMeans.h')
-rw-r--r-- ml/KMeans.h 41
1 files changed, 41 insertions, 0 deletions
diff --git a/ml/KMeans.h b/ml/KMeans.h
new file mode 100644
index 00000000..0398eeb8
--- /dev/null
+++ b/ml/KMeans.h
@@ -0,0 +1,41 @@
+// SPDX-License-Identifier: GPL-3.0-or-later
+
+#ifndef KMEANS_H
+#define KMEANS_H
+
+#include <atomic>
+#include <vector>
+#include <limits>
+#include <mutex>
+
+#include "SamplesBuffer.h"
+#include "json/single_include/nlohmann/json.hpp"
+
+/// K-means model state: a requested cluster count, the cluster centers, and
+/// a pair of distance bounds (MinDist / MaxDist).
+///
+/// Only the declarations of train() and anomalyScore() are visible in this
+/// header; their definitions live elsewhere.
+class KMeans {
+public:
+    /// Creates a model with no cluster centers.
+    ///
+    /// The distance bounds start as sentinels: MinDist at the largest
+    /// representable value and MaxDist at the most negative one. lowest() is
+    /// used rather than min() because, for floating-point types, min() is the
+    /// smallest *positive* normalized value and would never be replaced by a
+    /// maximum distance of exactly zero.
+    ///
+    /// @param NumClusters number of clusters to use (defaults to 2).
+    KMeans(size_t NumClusters = 2)
+        : NumClusters(NumClusters),
+          MinDist(std::numeric_limits<CalculatedNumber>::max()),
+          MaxDist(std::numeric_limits<CalculatedNumber>::lowest()) {}
+
+    /// Trains the model on the given samples.
+    /// NOTE(review): presumably updates ClusterCenters, MinDist and MaxDist,
+    /// and treats MaxIterations as an upper bound; confirm in the definition.
+    void train(const std::vector<DSample> &Samples, size_t MaxIterations);
+
+    /// Returns an anomaly score for a single sample without modifying the
+    /// model (const member). The scoring formula is defined elsewhere.
+    CalculatedNumber anomalyScore(const DSample &Sample) const;
+
+    /// Overwrites J with a JSON object holding the model state under the
+    /// keys "CCs" (cluster centers), "MinDist" and "MaxDist".
+    void toJson(nlohmann::json &J) const {
+        J = nlohmann::json{
+            {"CCs", ClusterCenters},
+            {"MinDist", MinDist},
+            {"MaxDist", MaxDist}
+        };
+    }
+
+private:
+    // Number of clusters requested at construction time.
+    size_t NumClusters;
+
+    // Cluster centers; empty until populated.
+    std::vector<DSample> ClusterCenters;
+
+    // Distance bounds; hold the sentinel values set by the constructor until
+    // they are overwritten.
+    CalculatedNumber MinDist;
+    CalculatedNumber MaxDist;
+};
+
+#endif /* KMEANS_H */