-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathKMeansTest.cpp
106 lines (104 loc) · 5.11 KB
/
KMeansTest.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
//
// Created by Olcay Taner YILDIZ on 10.01.2021.
//
#include "catch.hpp"
#include "../src/DataSet/DataSet.h"
#include "../src/Model/Parametric/KMeansModel.h"
#include "../src/Parameter/KMeansParameter.h"
/**
 * Checks the error rate of KMeansModel on the iris, bupa, dermatology, car, tictactoe, nursery and chess
 * data sets. Every check evaluates a model on the very instance list it was built from and compares
 * 100 * getErrorRate() with a recorded value, allowing an absolute deviation of 0.01.
 *
 * Section "train" trains a fresh model per data set; section "load" restores previously saved models from
 * the models/ directory. Catch2 re-runs the test case body once per section, so the data sets are read
 * again for each section.
 */
TEST_CASE("KMeansTest-testTrain") {
    // Reads a comma separated data file whose columns are described by attributeTypes.
    auto readDataSet = [](vector<AttributeType> attributeTypes, const char* fileName) {
        DataDefinition dataDefinition = DataDefinition(attributeTypes);
        return DataSet(dataDefinition, ",", fileName);
    };
    // 100 times the error rate that model obtains on the instances of dataSet.
    // NOTE(review): test() hands back a pointer that is never released here; ownership is not visible
    // from this file - confirm whether the caller is expected to delete it.
    auto errorPercentage = [](KMeansModel& model, DataSet& dataSet) {
        return 100 * model.test(dataSet.getInstanceList())->getErrorRate();
    };

    // Data sets are read in the same order as before: continuous ones first, then discrete, then mixed.
    DataSet iris = readDataSet(vector<AttributeType>(4, AttributeType::CONTINUOUS), "datasets/iris.data");
    DataSet bupa = readDataSet(vector<AttributeType>(6, AttributeType::CONTINUOUS), "datasets/bupa.data");
    DataSet dermatology = readDataSet(vector<AttributeType>(34, AttributeType::CONTINUOUS), "datasets/dermatology.data");
    DataSet car = readDataSet(vector<AttributeType>(6, AttributeType::DISCRETE), "datasets/car.data");
    DataSet tictactoe = readDataSet(vector<AttributeType>(9, AttributeType::DISCRETE), "datasets/tictactoe.data");
    DataSet nursery = readDataSet(vector<AttributeType>(8, AttributeType::DISCRETE), "datasets/nursery.data");
    // chess alternates attribute types: even positions are discrete, odd positions are continuous.
    vector<AttributeType> chessAttributeTypes;
    for (int i = 0; i < 6; i++) {
        chessAttributeTypes.emplace_back(i % 2 == 0 ? AttributeType::DISCRETE : AttributeType::CONTINUOUS);
    }
    DataSet chess = readDataSet(chessAttributeTypes, "datasets/chess.data");

    SECTION("train") {
        // Automatic storage instead of a never-deleted heap allocation. Declared before the model so that it
        // outlives it. The argument 1 is presumably the random seed - confirm against KMeansParameter.
        KMeansParameter kMeansParameter(1);
        KMeansModel kMeans = KMeansModel();
        // Resets the shared model, trains it on dataSet and reports its error percentage on the same data.
        auto trainedError = [&](DataSet& dataSet) {
            kMeans = KMeansModel();
            InstanceList instanceList = dataSet.getInstanceList();
            kMeans.train(instanceList, &kMeansParameter);
            return errorPercentage(kMeans, dataSet);
        };
        // Measured value first, expected value inside the matcher, so failure messages read naturally.
        REQUIRE_THAT(trainedError(iris), Catch::Matchers::WithinAbs(7.33, 0.01));
        REQUIRE_THAT(trainedError(bupa), Catch::Matchers::WithinAbs(43.77, 0.01));
        REQUIRE_THAT(trainedError(dermatology), Catch::Matchers::WithinAbs(45.08, 0.01));
        REQUIRE_THAT(trainedError(car), Catch::Matchers::WithinAbs(56.71, 0.01));
        REQUIRE_THAT(trainedError(tictactoe), Catch::Matchers::WithinAbs(31.00, 0.01));
        REQUIRE_THAT(trainedError(nursery), Catch::Matchers::WithinAbs(45.00, 0.01));
        REQUIRE_THAT(trainedError(chess), Catch::Matchers::WithinAbs(83.25, 0.01));
    }
    SECTION("load") {
        KMeansModel kMeans = KMeansModel();
        // Resets the shared model, restores it from modelFile and reports its error percentage on dataSet.
        auto loadedError = [&](DataSet& dataSet, const char* modelFile) {
            kMeans = KMeansModel();
            kMeans.loadModel(modelFile);
            return errorPercentage(kMeans, dataSet);
        };
        REQUIRE_THAT(loadedError(iris, "models/kmeans-iris.txt"), Catch::Matchers::WithinAbs(7.33, 0.01));
        REQUIRE_THAT(loadedError(bupa, "models/kmeans-bupa.txt"), Catch::Matchers::WithinAbs(43.77, 0.01));
        REQUIRE_THAT(loadedError(dermatology, "models/kmeans-dermatology.txt"), Catch::Matchers::WithinAbs(45.08, 0.01));
        REQUIRE_THAT(loadedError(car, "models/kmeans-car.txt"), Catch::Matchers::WithinAbs(56.71, 0.01));
        REQUIRE_THAT(loadedError(tictactoe, "models/kmeans-tictactoe.txt"), Catch::Matchers::WithinAbs(31.00, 0.01));
        // NOTE(review): nursery and chess are checked in "train" but have no counterpart here - confirm
        // whether saved models for them exist and should be covered.
    }
}