select "alpha", count(*) from alpha
UNION ALL
select "beta", count(*) from beta
UNION ALL
select "delta", count(*) from delta
UNION ALL
select "gamma", count(*) from gamma
dataset
count
"alpha"
"2204"
"beta"
"2204"
"delta"
"2204"
"gamma"
"2204"
Top 10 Performers, external metric
select clusteralgorithm,distancefunction,usedfields,tfidf,stopwords,lemmatized,synonyms,germanetfunction,Word2VecAdd,Word2VecAverage,F1WeightedAvg from alpha order by F1WeightedAvg desc
limit 10
alpha
clusteralgorithm
distancefunction
usedfields
tfidf
stopwords
lemmatized
synonyms
germanetfunction
Word2VecAdd
Word2VecAverage
F1WeightedAvg
FuzzyCMeans2320
CosineDistance
7
true
true
true
false
false
false
false
0.3443
FuzzyCMeans2320
CosineDistance
7
true
true
true
true
false
false
false
0.3417
KMeans2320
CosineDistance
7
true
true
true
false
false
false
true
0.3209
FuzzyCMeans2320
CosineDistance
7
true
true
true
false
false
true
false
0.3205
KMeans2320
CosineDistance
7
true
true
true
false
false
true
false
0.3165
FuzzyCMeans2320
CosineDistance
7
true
true
true
false
false
false
true
0.3134
FuzzyCMeans2320
CosineDistance
7
true
true
true
true
false
true
false
0.3002
KMeans2320
CosineDistance
7
true
true
true
true
false
false
true
0.299
KMeans2320
EuclideanDistance
7
true
true
true
false
false
false
true
0.299
KMeans2320
CosineDistance
7
true
true
true
false
false
false
false
0.2987
beta
clusteralgorithm
distancefunction
usedfields
tfidf
stopwords
lemmatized
synonyms
germanetfunction
Word2VecAdd
Word2VecAverage
F1WeightedAvg
ClusterART
Not needed
7
true
true
true
true
true
false
false
0.7506
Neural Gas
CosineDistance
7
true
true
true
true
true
true
false
0.5297
Neural Gas
CosineDistance
7
true
true
true
true
true
false
false
0.5285
Neural Gas
CosineDistance
7
true
true
true
true
true
false
true
0.5284
ClusterART
Not needed
7
true
true
true
false
true
false
false
0.5024
Neural Gas
EuclideanDistance
7
true
true
true
true
true
false
true
0.4872
FuzzyCMeans1520
EuclideanDistance
7
true
true
true
false
false
true
false
0.4618
Neural Gas
EuclideanDistance
7
true
true
true
true
false
false
true
0.4617
KMeans1520
WordEmbDistance
7
true
true
true
true
false
false
false
0.459
KMeans1520
WordEmbDistance
7
true
true
true
true
false
false
true
0.459
gamma
clusteralgorithm
distancefunction
usedfields
tfidf
stopwords
lemmatized
synonyms
germanetfunction
Word2VecAdd
Word2VecAverage
F1WeightedAvg
KMeans1720
CosineDistance
7
true
true
true
false
false
false
false
0.5184
KMeans1720
CosineDistance
7
true
true
true
true
false
false
false
0.5044
ClusterART
Not needed
7
true
true
true
true
false
false
false
0.4662
KMeans1720
EuclideanDistance
7
true
true
true
false
false
false
false
0.463
FuzzyCMeans1720
CosineDistance
7
true
true
true
false
false
false
false
0.4353
FuzzyCMeans1720
EuclideanDistance
7
true
true
true
false
false
false
false
0.4352
KMeans1720
EuclideanDistance
7
true
true
true
true
false
false
false
0.4335
FuzzyCMeans1720
CosineDistance
7
true
true
true
true
false
false
false
0.417
FuzzyCMeans1720
EuclideanDistance
7
true
true
true
true
false
false
false
0.4111
KMeans1720
EuclideanDistance
7
true
true
true
false
false
false
true
0.4097
delta
clusteralgorithm
distancefunction
usedfields
tfidf
stopwords
lemmatized
synonyms
germanetfunction
Word2VecAdd
Word2VecAverage
F1WeightedAvg
ClusterART
Not needed
7
true
true
true
true
false
false
false
0.5622
ClusterART
Not needed
7
true
true
true
false
false
false
false
0.5584
Neural Gas
CosineDistance
7
true
true
true
false
false
false
false
0.5102
Neural Gas
CosineDistance
7
true
true
true
true
false
false
false
0.5093
Neural Gas
EuclideanDistance
7
true
true
true
false
false
false
false
0.5082
Neural Gas
EuclideanDistance
7
true
true
true
true
false
false
false
0.5017
KMeans1620
CosineDistance
7
true
true
true
false
false
false
false
0.4604
Neural Gas
EuclideanDistance
7
true
true
true
true
false
false
true
0.4552
Neural Gas
EuclideanDistance
7
true
true
true
false
false
false
true
0.454
KMeans1620
CosineDistance
7
true
true
true
true
false
false
false
0.45
Top 10 Performers, internal metric
select k, clusteralgorithm, distancefunction,word2vecadd,word2vecaverage,SilhouetteAvg from alpha order by silhouetteavg desc
limit 10
alpha (Human Golden Standard: k=23)
k
clusteralgorithm
distancefunction
word2vecadd
word2vecaverage
SilhouetteAvg
2
KMeans220
EuclideanDistance
true
false
0.9084
2
KMeans220
EuclideanDistance
true
false
0.9082
2
KMeans220
EuclideanDistance
false
true
0.8006
11
FuzzyCMeans1120
EuclideanDistance
true
false
0.7854
12
FuzzyCMeans1220
EuclideanDistance
true
false
0.7803
13
FuzzyCMeans1320
EuclideanDistance
true
false
0.7681
14
FuzzyCMeans1420
EuclideanDistance
true
false
0.7644
10
FuzzyCMeans1020
EuclideanDistance
true
false
0.7643
15
FuzzyCMeans1520
EuclideanDistance
true
false
0.7584
8
FuzzyCMeans820
EuclideanDistance
true
false
0.7434
beta (Human Golden Standard: k=15)
k
clusteralgorithm
distancefunction
word2vecadd
word2vecaverage
SilhouetteAvg
14
KMeans1420
EuclideanDistance
true
false
0.6819
13
KMeans1320
EuclideanDistance
true
false
0.6794
15
KMeans1520
EuclideanDistance
true
false
0.6781
12
KMeans1220
EuclideanDistance
true
false
0.6761
11
KMeans1120
EuclideanDistance
true
false
0.6721
16
KMeans1620
EuclideanDistance
true
false
0.6716
17
KMeans1720
EuclideanDistance
true
false
0.6663
10
KMeans1020
EuclideanDistance
true
false
0.6662
18
KMeans1820
EuclideanDistance
true
false
0.6598
15
FuzzyCMeans1520
EuclideanDistance
true
false
0.6559
gamma (Human Golden Standard: k=19)
k
clusteralgorithm
distancefunction
word2vecadd
word2vecaverage
SilhouetteAvg
12
KMeans1220
EuclideanDistance
true
false
0.7102
10
KMeans1020
EuclideanDistance
true
false
0.7081
13
KMeans1320
EuclideanDistance
true
false
0.7073
11
KMeans1120
EuclideanDistance
true
false
0.7053
14
KMeans1420
EuclideanDistance
true
false
0.7039
9
KMeans920
EuclideanDistance
true
false
0.7036
15
KMeans1520
EuclideanDistance
true
false
0.6983
8
KMeans820
EuclideanDistance
true
false
0.6957
16
KMeans1620
EuclideanDistance
true
false
0.6919
11
KMeans1120
EuclideanDistance
true
false
0.6881
delta (Human Golden Standard: k=16)
k
clusteralgorithm
distancefunction
word2vecadd
word2vecaverage
SilhouetteAvg
16
FuzzyCMeans1620
EuclideanDistance
true
false
0.7195
15
FuzzyCMeans1520
EuclideanDistance
true
false
0.7181
13
FuzzyCMeans1320
EuclideanDistance
true
false
0.7169
17
FuzzyCMeans1720
EuclideanDistance
true
false
0.7149
14
FuzzyCMeans1420
EuclideanDistance
true
false
0.7142
14
KMeans1420
EuclideanDistance
true
false
0.714
12
FuzzyCMeans1220
EuclideanDistance
true
false
0.7137
13
KMeans1320
EuclideanDistance
true
false
0.7117
12
KMeans1220
EuclideanDistance
true
false
0.7104
16
KMeans1620
EuclideanDistance
true
false
0.7103
Correlation between Silhouette and F1
select SilhouetteAvg,F1WeightedAvg from alpha
where distancefunction <> "WordEmbDistance" -- Not supported distance function
select ClusterAlgorithm, DistanceFunction, Synonyms, Tfidf, Synonyms, GermaNetFunction, Word2VecAdd, Word2VecAverage, SilhouetteAvg, max(F1WeightedAvg) BestF1 from alpha
group by ClusterAlgorithm
order by BestF1 desc
alpha
ClusterAlgorithm
DistanceFunction
Synonyms
Tfidf
Synonyms
GermaNetFunction
Word2VecAdd
Word2VecAverage
SilhouetteAvg
BestF1
FuzzyCMeans2320
CosineDistance
false
true
false
false
false
false
0.0847
0.3443
KMeans2320
CosineDistance
false
true
false
false
false
true
0.0374
0.3209
Neural Gas
EuclideanDistance
false
true
false
true
false
true
0.0893
0.2475
ClusterART
Not needed
false
true
false
false
false
false
0.1943
0.2383
beta
ClusterAlgorithm
DistanceFunction
Synonyms
Tfidf
Synonyms
GermaNetFunction
Word2VecAdd
Word2VecAverage
SilhouetteAvg
BestF1
ClusterART
Not needed
true
true
true
true
false
false
0.0189
0.7506
Neural Gas
CosineDistance
true
true
true
true
true
false
-0.0464
0.5297
FuzzyCMeans1520
EuclideanDistance
false
true
false
false
true
false
0.022
0.4618
KMeans1520
WordEmbDistance
true
true
true
false
false
false
-1.0
0.459
gamma
ClusterAlgorithm
DistanceFunction
Synonyms
Tfidf
Synonyms
GermaNetFunction
Word2VecAdd
Word2VecAverage
SilhouetteAvg
BestF1
KMeans1720
CosineDistance
false
true
false
false
false
false
0.1451
0.5184
ClusterART
Not needed
true
true
true
false
false
false
0.2436
0.4662
FuzzyCMeans1720
CosineDistance
false
true
false
false
false
false
0.1041
0.4353
Neural Gas
CosineDistance
true
true
true
false
false
true
0.0701
0.4083
delta
ClusterAlgorithm
DistanceFunction
Synonyms
Tfidf
Synonyms
GermaNetFunction
Word2VecAdd
Word2VecAverage
SilhouetteAvg
BestF1
ClusterART
Not needed
true
true
true
false
false
false
0.2014
0.5622
Neural Gas
CosineDistance
false
true
false
false
false
false
0.0636
0.5102
KMeans1620
CosineDistance
false
true
false
false
false
false
0.1435
0.4604
FuzzyCMeans1620
EuclideanDistance
false
true
false
false
false
true
0.0227
0.4394
Best performances per parameter (internal)
select ClusterAlgorithm, k, DistanceFunction, Synonyms, Synonyms, GermaNetFunction, Word2VecAdd, Word2VecAverage, max(SilhouetteAvg) from alpha
group by ClusterAlgorithm
order by SilhouetteAvg desc
alpha
ClusterAlgorithm
k
DistanceFunction
Synonyms
Synonyms
GermaNetFunction
Word2VecAdd
Word2VecAverage
Best SilhouetteAvg
KMeans220
2
EuclideanDistance
true
true
false
true
false
0.9084
FuzzyCMeans1120
11
EuclideanDistance
true
true
true
true
false
0.7854
FuzzyCMeans1220
12
EuclideanDistance
true
true
true
true
false
0.7803
FuzzyCMeans1320
13
EuclideanDistance
true
true
true
true
false
0.7681
FuzzyCMeans1420
14
EuclideanDistance
true
true
true
true
false
0.7644
FuzzyCMeans1020
10
EuclideanDistance
true
true
true
true
false
0.7643
FuzzyCMeans1520
15
EuclideanDistance
true
true
true
true
false
0.7584
FuzzyCMeans820
8
EuclideanDistance
true
true
true
true
false
0.7434
FuzzyCMeans1620
16
EuclideanDistance
true
true
true
true
false
0.7376
FuzzyCMeans920
9
EuclideanDistance
true
true
true
true
false
0.7375
KMeans1020
10
EuclideanDistance
true
true
true
true
false
0.7351
KMeans920
9
EuclideanDistance
true
true
true
true
false
0.7344
KMeans1120
11
EuclideanDistance
true
true
true
true
false
0.7332
FuzzyCMeans1720
17
EuclideanDistance
true
true
true
true
false
0.7295
KMeans1220
12
EuclideanDistance
true
true
true
true
false
0.7289
KMeans1320
13
EuclideanDistance
false
false
true
true
false
0.7282
KMeans820
8
EuclideanDistance
true
true
true
true
false
0.726
KMeans1420
14
EuclideanDistance
false
false
true
true
false
0.7251
KMeans1520
15
EuclideanDistance
false
false
true
true
false
0.7196
KMeans1620
16
EuclideanDistance
false
false
true
true
false
0.7166
KMeans1720
17
EuclideanDistance
false
false
true
true
false
0.715
KMeans720
7
EuclideanDistance
true
true
true
true
false
0.713
FuzzyCMeans720
7
EuclideanDistance
true
true
true
true
false
0.7085
KMeans1820
18
EuclideanDistance
false
false
true
true
false
0.7074
FuzzyCMeans1820
18
EuclideanDistance
true
true
true
true
false
0.7062
FuzzyCMeans1920
19
EuclideanDistance
true
true
true
true
false
0.7059
KMeans1920
19
EuclideanDistance
false
false
true
true
false
0.7047
KMeans2020
20
EuclideanDistance
false
false
true
true
false
0.7005
KMeans2120
21
EuclideanDistance
false
false
true
true
false
0.6994
FuzzyCMeans2020
20
EuclideanDistance
true
true
true
true
false
0.6975
KMeans2220
22
EuclideanDistance
false
false
true
true
false
0.6967
KMeans2320
23
EuclideanDistance
false
false
true
true
false
0.689
KMeans620
6
EuclideanDistance
true
true
true
true
false
0.6854
KMeans2420
24
EuclideanDistance
false
false
true
true
false
0.683
KMeans2520
25
EuclideanDistance
false
false
true
true
false
0.6801
FuzzyCMeans2120
21
EuclideanDistance
true
true
true
true
false
0.6797
FuzzyCMeans2220
22
EuclideanDistance
true
true
true
true
false
0.6777
FuzzyCMeans620
6
EuclideanDistance
true
true
true
true
false
0.6721
KMeans2620
26
EuclideanDistance
false
false
true
true
false
0.6719
FuzzyCMeans2320
23
EuclideanDistance
true
true
true
true
false
0.6656
KMeans2720
27
EuclideanDistance
false
false
true
true
false
0.6606
KMeans2820
28
EuclideanDistance
false
false
true
true
false
0.6566
FuzzyCMeans2420
24
EuclideanDistance
true
true
true
true
false
0.6549
KMeans2920
29
EuclideanDistance
false
false
true
true
false
0.6487
KMeans3020
30
EuclideanDistance
false
false
true
true
false
0.6461
FuzzyCMeans2520
25
EuclideanDistance
true
true
true
true
false
0.6443
FuzzyCMeans2620
26
EuclideanDistance
true
true
true
true
false
0.6428
KMeans520
5
EuclideanDistance
true
true
true
true
false
0.6395
FuzzyCMeans2720
27
EuclideanDistance
true
true
true
true
false
0.6279
FuzzyCMeans2820
28
EuclideanDistance
true
true
true
true
false
0.6222
FuzzyCMeans520
5
EuclideanDistance
true
true
true
true
false
0.6151
FuzzyCMeans2920
29
EuclideanDistance
true
true
true
true
false
0.6109
KMeans420
4
EuclideanDistance
true
true
true
false
true
0.6086
FuzzyCMeans3020
30
EuclideanDistance
true
true
true
true
false
0.5966
FuzzyCMeans220
2
EuclideanDistance
false
false
true
false
true
0.5666
KMeans320
3
EuclideanDistance
true
true
true
true
false
0.5651
FuzzyCMeans420
4
EuclideanDistance
false
false
true
false
true
0.5507
Neural Gas
2
EuclideanDistance
true
true
true
false
true
0.545
FuzzyCMeans320
3
EuclideanDistance
true
true
true
false
true
0.5406
ClusterART
27
Not needed
false
false
false
false
false
0.2134
beta
ClusterAlgorithm
k
DistanceFunction
Synonyms
Synonyms
GermaNetFunction
Word2VecAdd
Word2VecAverage
Best SilhouetteAvg
KMeans1420
14
EuclideanDistance
false
false
true
true
false
0.6819
KMeans1320
13
EuclideanDistance
false
false
true
true
false
0.6794
KMeans1520
15
EuclideanDistance
false
false
true
true
false
0.6781
KMeans1220
12
EuclideanDistance
false
false
true
true
false
0.6761
KMeans1120
11
EuclideanDistance
false
false
true
true
false
0.6721
KMeans1620
16
EuclideanDistance
false
false
true
true
false
0.6716
KMeans1720
17
EuclideanDistance
false
false
true
true
false
0.6663
KMeans1020
10
EuclideanDistance
false
false
true
true
false
0.6662
KMeans1820
18
EuclideanDistance
false
false
true
true
false
0.6598
FuzzyCMeans1520
15
EuclideanDistance
true
true
true
true
false
0.6559
KMeans1920
19
EuclideanDistance
false
false
true
true
false
0.652
FuzzyCMeans1420
14
EuclideanDistance
true
true
true
true
false
0.6509
KMeans920
9
EuclideanDistance
false
false
true
true
false
0.6509
FuzzyCMeans1620
16
EuclideanDistance
true
true
true
true
false
0.6482
KMeans2020
20
EuclideanDistance
false
false
true
true
false
0.6458
FuzzyCMeans1320
13
EuclideanDistance
true
true
true
true
false
0.6435
FuzzyCMeans1720
17
EuclideanDistance
true
true
true
true
false
0.6392
FuzzyCMeans1220
12
EuclideanDistance
true
true
true
true
false
0.6362
KMeans2120
21
EuclideanDistance
false
false
true
true
false
0.6357
KMeans820
8
EuclideanDistance
true
true
true
true
false
0.6311
FuzzyCMeans1820
18
EuclideanDistance
true
true
true
true
false
0.6297
KMeans2220
22
EuclideanDistance
false
false
true
true
false
0.6278
KMeans2320
23
EuclideanDistance
false
false
true
true
false
0.6191
FuzzyCMeans1920
19
EuclideanDistance
true
true
true
true
false
0.615
FuzzyCMeans920
9
EuclideanDistance
true
true
true
true
false
0.6149
FuzzyCMeans720
7
EuclideanDistance
true
true
true
true
false
0.6127
KMeans720
7
EuclideanDistance
true
true
true
true
false
0.6117
FuzzyCMeans2020
20
EuclideanDistance
true
true
true
true
false
0.6075
KMeans2420
24
EuclideanDistance
false
false
true
true
false
0.6071
FuzzyCMeans1020
10
EuclideanDistance
true
true
true
true
false
0.6063
FuzzyCMeans1120
11
EuclideanDistance
false
false
true
true
false
0.6057
FuzzyCMeans620
6
EuclideanDistance
true
true
true
true
false
0.6057
KMeans2520
25
EuclideanDistance
false
false
true
true
false
0.6009
FuzzyCMeans820
8
EuclideanDistance
true
true
true
true
false
0.6004
FuzzyCMeans2120
21
EuclideanDistance
true
true
true
true
false
0.5949
KMeans2620
26
EuclideanDistance
false
false
true
true
false
0.5908
KMeans620
6
EuclideanDistance
true
true
true
true
false
0.5868
KMeans2720
27
EuclideanDistance
false
false
true
true
false
0.5849
FuzzyCMeans2220
22
EuclideanDistance
true
true
true
true
false
0.5811
FuzzyCMeans220
2
EuclideanDistance
false
false
true
false
true
0.579
KMeans2820
28
EuclideanDistance
false
false
true
true
false
0.5785
FuzzyCMeans2320
23
EuclideanDistance
true
true
true
true
false
0.5763
KMeans2920
29
EuclideanDistance
false
false
true
true
false
0.571
KMeans220
2
EuclideanDistance
false
false
true
false
true
0.5709
KMeans520
5
EuclideanDistance
false
false
true
false
true
0.5702
KMeans3020
30
EuclideanDistance
false
false
true
true
false
0.5654
FuzzyCMeans2420
24
EuclideanDistance
true
true
true
true
false
0.5599
Neural Gas
2
EuclideanDistance
false
false
true
false
true
0.5588
FuzzyCMeans2520
25
EuclideanDistance
true
true
true
true
false
0.5537
KMeans320
3
EuclideanDistance
false
false
true
false
true
0.5533
FuzzyCMeans2620
26
EuclideanDistance
true
true
true
true
false
0.5492
KMeans420
4
EuclideanDistance
true
true
true
true
false
0.5477
FuzzyCMeans320
3
EuclideanDistance
false
false
true
false
true
0.5346
FuzzyCMeans520
5
EuclideanDistance
false
false
true
false
true
0.5323
FuzzyCMeans2720
27
EuclideanDistance
true
true
true
true
false
0.5319
FuzzyCMeans420
4
EuclideanDistance
false
false
true
false
true
0.5243
FuzzyCMeans2820
28
EuclideanDistance
true
true
true
true
false
0.5177
FuzzyCMeans2920
29
EuclideanDistance
true
true
true
true
false
0.5044
FuzzyCMeans3020
30
EuclideanDistance
true
true
true
true
false
0.5016
ClusterART
2
Not needed
false
false
false
false
false
0.2176
gamma
ClusterAlgorithm
k
DistanceFunction
Synonyms
Synonyms
GermaNetFunction
Word2VecAdd
Word2VecAverage
Best SilhouetteAvg
KMeans1220
12
EuclideanDistance
true
true
true
true
false
0.7102
KMeans1020
10
EuclideanDistance
true
true
true
true
false
0.7081
KMeans1320
13
EuclideanDistance
true
true
true
true
false
0.7073
KMeans1120
11
EuclideanDistance
true
true
true
true
false
0.7053
KMeans1420
14
EuclideanDistance
true
true
true
true
false
0.7039
KMeans920
9
EuclideanDistance
true
true
true
true
false
0.7036
KMeans1520
15
EuclideanDistance
true
true
true
true
false
0.6983
KMeans820
8
EuclideanDistance
true
true
true
true
false
0.6957
KMeans1620
16
EuclideanDistance
true
true
true
true
false
0.6919
KMeans1720
17
EuclideanDistance
true
true
true
true
false
0.6843
KMeans1820
18
EuclideanDistance
true
true
true
true
false
0.6827
FuzzyCMeans1720
17
EuclideanDistance
true
true
true
true
false
0.6799
FuzzyCMeans1620
16
EuclideanDistance
true
true
true
true
false
0.6795
KMeans720
7
EuclideanDistance
true
true
true
true
false
0.6784
KMeans1920
19
EuclideanDistance
true
true
true
true
false
0.6755
FuzzyCMeans620
6
EuclideanDistance
true
true
true
true
false
0.6714
FuzzyCMeans1520
15
EuclideanDistance
true
true
true
true
false
0.6707
FuzzyCMeans1920
19
EuclideanDistance
true
true
true
true
false
0.667
KMeans2020
20
EuclideanDistance
true
true
true
true
false
0.6655
FuzzyCMeans1820
18
EuclideanDistance
true
true
true
true
false
0.6639
FuzzyCMeans1320
13
EuclideanDistance
true
true
true
true
false
0.66
KMeans2120
21
EuclideanDistance
true
true
true
true
false
0.6597
FuzzyCMeans1420
14
EuclideanDistance
true
true
true
true
false
0.6593
KMeans620
6
EuclideanDistance
true
true
true
true
false
0.6584
KMeans2220
22
EuclideanDistance
true
true
true
true
false
0.6569
FuzzyCMeans2020
20
EuclideanDistance
true
true
true
true
false
0.6515
KMeans2320
23
EuclideanDistance
true
true
true
true
false
0.6512
KMeans2420
24
EuclideanDistance
true
true
true
true
false
0.6496
FuzzyCMeans1220
12
EuclideanDistance
true
true
true
true
false
0.6468
FuzzyCMeans820
8
EuclideanDistance
false
false
true
true
false
0.6453
KMeans2520
25
EuclideanDistance
true
true
true
true
false
0.6411
FuzzyCMeans1020
10
EuclideanDistance
true
true
true
true
false
0.6394
FuzzyCMeans2120
21
EuclideanDistance
false
false
true
true
false
0.6392
KMeans2620
26
EuclideanDistance
true
true
true
true
false
0.6385
KMeans520
5
EuclideanDistance
true
true
true
true
false
0.6366
KMeans2720
27
EuclideanDistance
true
true
true
true
false
0.6338
FuzzyCMeans2220
22
EuclideanDistance
false
false
true
true
false
0.6312
FuzzyCMeans2320
23
EuclideanDistance
false
false
true
true
false
0.6312
KMeans2820
28
EuclideanDistance
true
true
true
true
false
0.6285
FuzzyCMeans1120
11
EuclideanDistance
true
true
true
true
false
0.6259
FuzzyCMeans520
5
EuclideanDistance
true
true
true
false
true
0.6258
FuzzyCMeans2420
24
EuclideanDistance
false
false
true
true
false
0.6253
KMeans2920
29
EuclideanDistance
true
true
true
true
false
0.6246
FuzzyCMeans920
9
EuclideanDistance
true
true
true
true
false
0.6243
FuzzyCMeans2520
25
EuclideanDistance
false
false
true
true
false
0.6213
FuzzyCMeans720
7
EuclideanDistance
true
true
true
true
false
0.6202
KMeans3020
30
EuclideanDistance
true
true
true
true
false
0.6189
FuzzyCMeans2620
26
EuclideanDistance
false
false
true
true
false
0.6027
KMeans420
4
EuclideanDistance
false
false
true
false
true
0.6004
KMeans220
2
EuclideanDistance
false
false
true
true
false
0.5975
KMeans320
3
EuclideanDistance
true
true
true
false
true
0.596
FuzzyCMeans220
2
EuclideanDistance
false
false
true
true
false
0.5943
FuzzyCMeans2720
27
EuclideanDistance
false
false
true
true
false
0.594
FuzzyCMeans2820
28
EuclideanDistance
false
false
true
true
false
0.5865
FuzzyCMeans420
4
EuclideanDistance
true
true
true
false
true
0.5813
Neural Gas
2
EuclideanDistance
true
true
true
true
false
0.5772
FuzzyCMeans2920
29
EuclideanDistance
false
false
true
true
false
0.5711
FuzzyCMeans320
3
EuclideanDistance
true
true
true
true
false
0.5697
FuzzyCMeans3020
30
EuclideanDistance
false
false
true
true
false
0.5594
ClusterART
13
Not needed
false
false
false
false
false
0.3186
delta
ClusterAlgorithm
k
DistanceFunction
Synonyms
Synonyms
GermaNetFunction
Word2VecAdd
Word2VecAverage
Best SilhouetteAvg
FuzzyCMeans1620
16
EuclideanDistance
true
true
true
true
false
0.7195
FuzzyCMeans1520
15
EuclideanDistance
true
true
true
true
false
0.7181
FuzzyCMeans1320
13
EuclideanDistance
true
true
true
true
false
0.7169
FuzzyCMeans1720
17
EuclideanDistance
true
true
true
true
false
0.7149
FuzzyCMeans1420
14
EuclideanDistance
true
true
true
true
false
0.7142
KMeans1420
14
EuclideanDistance
true
true
true
true
false
0.714
FuzzyCMeans1220
12
EuclideanDistance
true
true
true
true
false
0.7137
KMeans1320
13
EuclideanDistance
true
true
true
true
false
0.7117
KMeans1220
12
EuclideanDistance
true
true
true
true
false
0.7104
KMeans1620
16
EuclideanDistance
true
true
true
true
false
0.7103
KMeans1120
11
EuclideanDistance
true
true
true
true
false
0.7099
KMeans1520
15
EuclideanDistance
true
true
true
true
false
0.7094
FuzzyCMeans1820
18
EuclideanDistance
true
true
true
true
false
0.7093
FuzzyCMeans1920
19
EuclideanDistance
true
true
true
true
false
0.7067
KMeans1720
17
EuclideanDistance
true
true
true
true
false
0.7041
KMeans1020
10
EuclideanDistance
true
true
true
true
false
0.7031
KMeans1820
18
EuclideanDistance
true
true
true
true
false
0.7012
KMeans1920
19
EuclideanDistance
true
true
true
true
false
0.6988
KMeans2020
20
EuclideanDistance
true
true
true
true
false
0.6964
FuzzyCMeans2020
20
EuclideanDistance
true
true
true
true
false
0.6914
KMeans920
9
EuclideanDistance
true
true
true
true
false
0.6913
KMeans2120
21
EuclideanDistance
true
true
true
true
false
0.6906
FuzzyCMeans2120
21
EuclideanDistance
true
true
true
true
false
0.6866
KMeans2220
22
EuclideanDistance
true
true
true
true
false
0.6851
KMeans2320
23
EuclideanDistance
true
true
true
true
false
0.6789
KMeans820
8
EuclideanDistance
true
true
true
true
false
0.6786
FuzzyCMeans1120
11
EuclideanDistance
false
false
true
true
false
0.6782
KMeans2420
24
EuclideanDistance
true
true
true
true
false
0.6777
FuzzyCMeans2220
22
EuclideanDistance
true
true
true
true
false
0.6748
FuzzyCMeans1020
10
EuclideanDistance
false
false
true
true
false
0.6744
KMeans2520
25
EuclideanDistance
true
true
true
true
false
0.6713
KMeans2620
26
EuclideanDistance
true
true
true
true
false
0.6657
FuzzyCMeans2320
23
EuclideanDistance
true
true
true
true
false
0.6652
KMeans2720
27
EuclideanDistance
true
true
true
true
false
0.6641
KMeans2820
28
EuclideanDistance
true
true
true
true
false
0.6586
FuzzyCMeans920
9
EuclideanDistance
false
false
true
true
false
0.6577
KMeans720
7
EuclideanDistance
false
false
true
true
false
0.6571
KMeans2920
29
EuclideanDistance
true
true
true
true
false
0.6548
FuzzyCMeans620
6
EuclideanDistance
false
false
true
false
true
0.6518
FuzzyCMeans2420
24
EuclideanDistance
false
false
true
true
false
0.6507
KMeans3020
30
EuclideanDistance
true
true
true
true
false
0.6494
FuzzyCMeans820
8
EuclideanDistance
true
true
true
true
false
0.6493
FuzzyCMeans2520
25
EuclideanDistance
false
false
true
true
false
0.6477
FuzzyCMeans2620
26
EuclideanDistance
false
false
true
true
false
0.6462
FuzzyCMeans2720
27
EuclideanDistance
false
false
true
true
false
0.6413
FuzzyCMeans720
7
EuclideanDistance
false
false
true
true
false
0.6395
KMeans620
6
EuclideanDistance
true
true
true
true
false
0.6378
FuzzyCMeans2820
28
EuclideanDistance
false
false
true
true
false
0.6359
FuzzyCMeans2920
29
EuclideanDistance
false
false
true
true
false
0.6153
KMeans520
5
EuclideanDistance
false
false
true
false
true
0.6056
FuzzyCMeans3020
30
EuclideanDistance
false
false
true
true
false
0.6017
KMeans220
2
EuclideanDistance
true
true
true
true
false
0.5973
FuzzyCMeans220
2
EuclideanDistance
true
true
true
false
true
0.5849
Neural Gas
2
EuclideanDistance
false
false
true
false
true
0.5828
KMeans420
4
EuclideanDistance
true
true
true
true
false
0.569
KMeans320
3
EuclideanDistance
false
false
true
false
true
0.5522
FuzzyCMeans420
4
EuclideanDistance
false
false
true
false
true
0.5503
FuzzyCMeans320
3
EuclideanDistance
false
false
true
false
true
0.5451
FuzzyCMeans520
5
EuclideanDistance
false
false
true
false
true
0.5213
ClusterART
10
Not needed
false
false
true
false
false
0.4338
k vs. Silhouette, sorted by k
select k, max(SilhouetteAvg) from gamma group by k order by SilhouetteAvg desc
alpha
beta
gamma
delta
k vs. Silhouette, Top 15
select k, max(SilhouetteAvg) from delta group by k order by SilhouetteAvg desc
limit 15
alpha
beta
gamma
delta
Impact of Word2VecAdd, external
select *, round(("F1 with Word2VecAdd"-"F1 without Word2VecAdd")/"F1 with Word2VecAdd"*100, 2) as "Difference in %" from (
select a.ClusterAlgorithm as "Cluster Algorithm", a.DistanceFunction as "Distance Function", max(a.F1WeightedAvg) as "F1 with Word2VecAdd", max(b.F1WeightedAvg) as "F1 without Word2VecAdd" from alpha a
left outer join alpha b on (b.ClusterAlgorithm = a.ClusterAlgorithm and a.DistanceFunction = b.DistanceFunction)
where a.Word2VecAdd = "true" and b.Word2VecAdd = "false"
group by a.ClusterAlgorithm, a.DistanceFunction
order by a.F1WeightedAvg desc
)
alpha
Cluster Algorithm
Distance Function
F1 with Word2VecAdd
F1 without Word2VecAdd
Difference in %
FuzzyCMeans2320
CosineDistance
0.3205
0.3443
-7.43
KMeans2320
CosineDistance
0.3165
0.3209
-1.39
KMeans2320
WordEmbDistance
0.2465
0.2465
0.0
KMeans2320
EuclideanDistance
0.2404
0.299
-24.38
Neural Gas
CosineDistance
0.236
0.2314
1.95
Neural Gas
EuclideanDistance
0.2347
0.2475
-5.45
FuzzyCMeans2320
EuclideanDistance
0.214
0.2619
-22.38
beta
Cluster Algorithm
Distance Function
F1 with Word2VecAdd
F1 without Word2VecAdd
Difference in %
FuzzyCMeans1520
EuclideanDistance
0.4618
0.4512
2.3
KMeans1520
WordEmbDistance
0.4529
0.459
-1.35
Neural Gas
EuclideanDistance
0.4509
0.4872
-8.05
Neural Gas
CosineDistance
0.5297
0.5285
0.23
KMeans1520
EuclideanDistance
0.294
0.4282
-45.65
KMeans1520
CosineDistance
0.3252
0.4161
-27.95
FuzzyCMeans1520
CosineDistance
0.3283
0.4258
-29.7
gamma
Cluster Algorithm
Distance Function
F1 with Word2VecAdd
F1 without Word2VecAdd
Difference in %
KMeans1720
CosineDistance
0.3792
0.5184
-36.71
Neural Gas
CosineDistance
0.3831
0.4083
-6.58
KMeans1720
WordEmbDistance
0.3494
0.3497
-0.09
FuzzyCMeans1720
CosineDistance
0.292
0.4353
-49.08
KMeans1720
EuclideanDistance
0.2841
0.463
-62.97
Neural Gas
EuclideanDistance
0.2746
0.3892
-41.73
FuzzyCMeans1720
EuclideanDistance
0.2561
0.4352
-69.93
delta
Cluster Algorithm
Distance Function
F1 with Word2VecAdd
F1 without Word2VecAdd
Difference in %
Neural Gas
CosineDistance
0.4448
0.5102
-14.7
Neural Gas
EuclideanDistance
0.4139
0.5082
-22.78
KMeans1620
WordEmbDistance
0.4187
0.4187
0.0
FuzzyCMeans1620
EuclideanDistance
0.3549
0.4394
-23.81
KMeans1620
CosineDistance
0.3375
0.4604
-36.41
KMeans1620
EuclideanDistance
0.2884
0.4248
-47.3
FuzzyCMeans1620
CosineDistance
0.2856
0.3843
-34.56
Impact of Word2VecAdd, internal
#TIMM
select *, round(("Silhouette with Word2VecAdd"-"Silhouette without Word2VecAdd / Word2VecAverage")/"Silhouette with Word2VecAdd"*100, 2) as "Difference" from (
select a.ClusterAlgorithm as "Cluster Algorithm", a.k as "k", a.DistanceFunction as "Distance Function", max(a.SilhouetteAvg) as "Silhouette with Word2VecAdd", max(b.SilhouetteAvg) as "Silhouette without Word2VecAdd / Word2VecAverage" from alpha a
left outer join alpha b on (b.ClusterAlgorithm = a.ClusterAlgorithm and a.k = b.k and a.DistanceFunction = b.DistanceFunction)
where a.Word2VecAdd = "true" and b.Word2VecAdd = "false" and b.Word2VecAverage = "false"
group by a.ClusterAlgorithm, a.k, a.DistanceFunction
order by a.SilhouetteAvg desc
)
alpha
Cluster Algorithm
k
Distance Function
Silhouette with Word2VecAdd
Silhouette without Word2VecAdd
Difference
KMeans220
2
EuclideanDistance
0.9084
0.8006
11.87
KMeans320
3
EuclideanDistance
0.5651
0.5463
3.33
KMeans420
4
EuclideanDistance
0.5816
0.6086
-4.64
KMeans520
5
EuclideanDistance
0.6395
0.624
2.42
KMeans620
6
EuclideanDistance
0.6854
0.6459
5.76
Neural Gas
2
EuclideanDistance
0.491
0.545
-11.0
KMeans720
7
EuclideanDistance
0.713
0.6271
12.05
FuzzyCMeans220
2
EuclideanDistance
0.5248
0.5666
-7.96
KMeans820
8
EuclideanDistance
0.726
0.6212
14.44
KMeans3020
30
EuclideanDistance
0.6461
0.5416
16.17
KMeans920
9
EuclideanDistance
0.7344
0.6242
15.01
KMeans2920
29
EuclideanDistance
0.6487
0.5445
16.06
KMeans1020
10
EuclideanDistance
0.7351
0.6167
16.11
KMeans2820
28
EuclideanDistance
0.6566
0.5491
16.37
KMeans2720
27
EuclideanDistance
0.6606
0.5502
16.71
KMeans2520
25
EuclideanDistance
0.6801
0.5611
17.5
KMeans2620
26
EuclideanDistance
0.6719
0.5566
17.16
KMeans1120
11
EuclideanDistance
0.7332
0.6129
16.41
KMeans1220
12
EuclideanDistance
0.7289
0.6037
17.18
KMeans2420
24
EuclideanDistance
0.683
0.5644
17.36
KMeans2220
22
EuclideanDistance
0.6967
0.5704
18.13
KMeans2320
23
EuclideanDistance
0.689
0.568
17.56
KMeans2120
21
EuclideanDistance
0.6994
0.5747
17.83
KMeans2020
20
EuclideanDistance
0.7005
0.5813
17.02
KMeans1920
19
EuclideanDistance
0.7047
0.5854
16.93
KMeans1620
16
EuclideanDistance
0.7166
0.5949
16.98
KMeans1520
15
EuclideanDistance
0.7196
0.599
16.76
KMeans1420
14
EuclideanDistance
0.7251
0.6022
16.95
KMeans1320
13
EuclideanDistance
0.7282
0.6045
16.99
KMeans1720
17
EuclideanDistance
0.715
0.5901
17.47
KMeans1820
18
EuclideanDistance
0.7074
0.5852
17.27
FuzzyCMeans2820
28
EuclideanDistance
0.6222
0.4834
22.31
FuzzyCMeans2920
29
EuclideanDistance
0.6109
0.4814
21.2
FuzzyCMeans3020
30
EuclideanDistance
0.5966
0.4772
20.01
FuzzyCMeans2620
26
EuclideanDistance
0.6428
0.4974
22.62
FuzzyCMeans2720
27
EuclideanDistance
0.6279
0.4921
21.63
FuzzyCMeans2520
25
EuclideanDistance
0.6443
0.4951
23.16
FuzzyCMeans2320
23
EuclideanDistance
0.6656
0.4981
25.17
FuzzyCMeans2420
24
EuclideanDistance
0.6549
0.4977
24.0
FuzzyCMeans2220
22
EuclideanDistance
0.6777
0.4965
26.74
FuzzyCMeans2120
21
EuclideanDistance
0.6797
0.5051
25.69
FuzzyCMeans2020
20
EuclideanDistance
0.6975
0.5063
27.41
FuzzyCMeans1920
19
EuclideanDistance
0.7059
0.5064
28.26
FuzzyCMeans1820
18
EuclideanDistance
0.7062
0.5126
27.41
FuzzyCMeans1720
17
EuclideanDistance
0.7295
0.518
28.99
FuzzyCMeans1620
16
EuclideanDistance
0.7376
0.5324
27.82
FuzzyCMeans1520
15
EuclideanDistance
0.7584
0.5377
29.1
FuzzyCMeans1420
14
EuclideanDistance
0.7644
0.5425
29.03
FuzzyCMeans1320
13
EuclideanDistance
0.7681
0.5496
28.45
FuzzyCMeans1220
12
EuclideanDistance
0.7803
0.5588
28.39
FuzzyCMeans1120
11
EuclideanDistance
0.7854
0.5698
27.45
FuzzyCMeans1020
10
EuclideanDistance
0.7643
0.5811
23.97
FuzzyCMeans920
9
EuclideanDistance
0.7375
0.5927
19.63
FuzzyCMeans820
8
EuclideanDistance
0.7434
0.6116
17.73
FuzzyCMeans720
7
EuclideanDistance
0.7085
0.6654
6.08
FuzzyCMeans620
6
EuclideanDistance
0.6721
0.6167
8.24
FuzzyCMeans520
5
EuclideanDistance
0.6151
0.525
14.65
FuzzyCMeans420
4
EuclideanDistance
0.5396
0.5507
-2.06
FuzzyCMeans320
3
EuclideanDistance
0.4912
0.5406
-10.06
beta
Cluster Algorithm
k
Distance Function
Silhouette with Word2VecAdd
Silhouette without Word2VecAdd
Difference
KMeans220
2
EuclideanDistance
0.5534
0.5709
-3.16
Neural Gas
2
EuclideanDistance
0.5557
0.5588
-0.56
FuzzyCMeans220
2
EuclideanDistance
0.557
0.579
-3.95
KMeans320
3
EuclideanDistance
0.5525
0.5533
-0.14
FuzzyCMeans320
3
EuclideanDistance
0.4548
0.5346
-17.55
KMeans3020
30
EuclideanDistance
0.5654
0.503
11.04
KMeans2920
29
EuclideanDistance
0.571
0.5056
11.45
KMeans2820
28
EuclideanDistance
0.5785
0.5069
12.38
KMeans2720
27
EuclideanDistance
0.5849
0.5084
13.08
KMeans2620
26
EuclideanDistance
0.5908
0.5105
13.59
KMeans2520
25
EuclideanDistance
0.6009
0.5123
14.74
KMeans2420
24
EuclideanDistance
0.6071
0.5164
14.94
FuzzyCMeans420
4
EuclideanDistance
0.481
0.5243
-9.0
KMeans2320
23
EuclideanDistance
0.6191
0.5183
16.28
KMeans420
4
EuclideanDistance
0.5477
0.5466
0.2
KMeans2220
22
EuclideanDistance
0.6278
0.5234
16.63
KMeans2120
21
EuclideanDistance
0.6357
0.5243
17.52
KMeans2020
20
EuclideanDistance
0.6458
0.5278
18.27
KMeans1920
19
EuclideanDistance
0.652
0.5308
18.59
FuzzyCMeans520
5
EuclideanDistance
0.5089
0.5323
-4.6
KMeans1820
18
EuclideanDistance
0.6598
0.5394
18.25
KMeans1720
17
EuclideanDistance
0.6663
0.5458
18.08
FuzzyCMeans620
6
EuclideanDistance
0.6057
0.596
1.6
KMeans1620
16
EuclideanDistance
0.6716
0.5463
18.66
KMeans1520
15
EuclideanDistance
0.6781
0.5486
19.1
FuzzyCMeans720
7
EuclideanDistance
0.6127
0.5371
12.34
KMeans520
5
EuclideanDistance
0.5505
0.5702
-3.58
KMeans1420
14
EuclideanDistance
0.6819
0.5506
19.26
KMeans1320
13
EuclideanDistance
0.6794
0.5474
19.43
FuzzyCMeans820
8
EuclideanDistance
0.6004
0.5598
6.76
KMeans1220
12
EuclideanDistance
0.6761
0.548
18.95
KMeans1120
11
EuclideanDistance
0.6721
0.5492
18.29
FuzzyCMeans920
9
EuclideanDistance
0.6149
0.5729
6.83
KMeans620
6
EuclideanDistance
0.5868
0.5848
0.34
FuzzyCMeans1020
10
EuclideanDistance
0.6063
0.5596
7.7
KMeans1020
10
EuclideanDistance
0.6662
0.5509
17.31
FuzzyCMeans1120
11
EuclideanDistance
0.6057
0.5477
9.58
KMeans720
7
EuclideanDistance
0.6117
0.5772
5.64
KMeans920
9
EuclideanDistance
0.6509
0.5576
14.33
KMeans820
8
EuclideanDistance
0.6311
0.5625
10.87
FuzzyCMeans1220
12
EuclideanDistance
0.6362
0.5248
17.51
FuzzyCMeans1320
13
EuclideanDistance
0.6435
0.5036
21.74
FuzzyCMeans1420
14
EuclideanDistance
0.6509
0.4756
26.93
FuzzyCMeans1520
15
EuclideanDistance
0.6559
0.4604
29.81
FuzzyCMeans1620
16
EuclideanDistance
0.6482
0.4493
30.68
FuzzyCMeans1720
17
EuclideanDistance
0.6392
0.4315
32.49
FuzzyCMeans1820
18
EuclideanDistance
0.6297
0.4202
33.27
FuzzyCMeans1920
19
EuclideanDistance
0.615
0.4036
34.37
FuzzyCMeans2020
20
EuclideanDistance
0.6075
0.397
34.65
FuzzyCMeans2120
21
EuclideanDistance
0.5949
0.3912
34.24
FuzzyCMeans2220
22
EuclideanDistance
0.5811
0.3801
34.59
FuzzyCMeans2320
23
EuclideanDistance
0.5763
0.3741
35.09
FuzzyCMeans2420
24
EuclideanDistance
0.5599
0.3635
35.08
FuzzyCMeans2520
25
EuclideanDistance
0.5537
0.3511
36.59
FuzzyCMeans2620
26
EuclideanDistance
0.5492
0.3487
36.51
FuzzyCMeans2720
27
EuclideanDistance
0.5319
0.33
37.96
FuzzyCMeans2820
28
EuclideanDistance
0.5177
0.3264
36.95
FuzzyCMeans2920
29
EuclideanDistance
0.5044
0.3256
35.45
FuzzyCMeans3020
30
EuclideanDistance
0.5016
0.316
37.0
gamma
Cluster Algorithm
k
Distance Function
Silhouette with Word2VecAdd
Silhouette without Word2VecAdd
Difference
KMeans220
2
EuclideanDistance
0.5975
0.5666
5.17
KMeans3020
30
EuclideanDistance
0.6189
0.5606
9.42
KMeans2920
29
EuclideanDistance
0.6246
0.5617
10.07
KMeans2820
28
EuclideanDistance
0.6285
0.5645
10.18
KMeans2720
27
EuclideanDistance
0.6338
0.567
10.54
KMeans2620
26
EuclideanDistance
0.6385
0.5701
10.71
KMeans2520
25
EuclideanDistance
0.6411
0.5734
10.56
KMeans2420
24
EuclideanDistance
0.6496
0.578
11.02
KMeans2320
23
EuclideanDistance
0.6512
0.5795
11.01
KMeans2220
22
EuclideanDistance
0.6569
0.5837
11.14
KMeans2120
21
EuclideanDistance
0.6597
0.5872
10.99
KMeans2020
20
EuclideanDistance
0.6655
0.591
11.19
KMeans1920
19
EuclideanDistance
0.6755
0.5943
12.02
FuzzyCMeans220
2
EuclideanDistance
0.5943
0.5598
5.81
Neural Gas
2
EuclideanDistance
0.5772
0.5372
6.93
KMeans1820
18
EuclideanDistance
0.6827
0.5989
12.27
KMeans1720
17
EuclideanDistance
0.6843
0.6022
12.0
KMeans1620
16
EuclideanDistance
0.6919
0.6056
12.47
KMeans1520
15
EuclideanDistance
0.6983
0.6065
13.15
KMeans1420
14
EuclideanDistance
0.7039
0.6103
13.3
KMeans1320
13
EuclideanDistance
0.7073
0.6128
13.36
KMeans1220
12
EuclideanDistance
0.7102
0.6133
13.64
KMeans1120
11
EuclideanDistance
0.7053
0.6196
12.15
KMeans1020
10
EuclideanDistance
0.7081
0.6221
12.15
FuzzyCMeans320
3
EuclideanDistance
0.5697
0.5535
2.84
KMeans920
9
EuclideanDistance
0.7036
0.6237
11.36
KMeans820
8
EuclideanDistance
0.6957
0.6196
10.94
KMeans720
7
EuclideanDistance
0.6784
0.6159
9.21
KMeans320
3
EuclideanDistance
0.57
0.596
-4.56
KMeans420
4
EuclideanDistance
0.5889
0.6004
-1.95
KMeans620
6
EuclideanDistance
0.6584
0.6113
7.15
KMeans520
5
EuclideanDistance
0.6366
0.6182
2.89
FuzzyCMeans420
4
EuclideanDistance
0.5701
0.5813
-1.96
FuzzyCMeans520
5
EuclideanDistance
0.6255
0.6258
-0.05
FuzzyCMeans620
6
EuclideanDistance
0.6714
0.6434
4.17
FuzzyCMeans720
7
EuclideanDistance
0.6202
0.5812
6.29
FuzzyCMeans820
8
EuclideanDistance
0.6453
0.5536
14.21
FuzzyCMeans920
9
EuclideanDistance
0.6243
0.5386
13.73
FuzzyCMeans1020
10
EuclideanDistance
0.6394
0.5278
17.45
FuzzyCMeans1120
11
EuclideanDistance
0.6259
0.4999
20.13
FuzzyCMeans1220
12
EuclideanDistance
0.6468
0.4837
25.22
FuzzyCMeans1320
13
EuclideanDistance
0.66
0.4713
28.59
FuzzyCMeans1420
14
EuclideanDistance
0.6593
0.4631
29.76
FuzzyCMeans1520
15
EuclideanDistance
0.6707
0.4544
32.25
FuzzyCMeans1620
16
EuclideanDistance
0.6795
0.4487
33.97
FuzzyCMeans1720
17
EuclideanDistance
0.6799
0.4392
35.4
FuzzyCMeans1820
18
EuclideanDistance
0.6639
0.4363
34.28
FuzzyCMeans1920
19
EuclideanDistance
0.667
0.4351
34.77
FuzzyCMeans2020
20
EuclideanDistance
0.6515
0.427
34.46
FuzzyCMeans2120
21
EuclideanDistance
0.6392
0.4215
34.06
FuzzyCMeans2220
22
EuclideanDistance
0.6312
0.4246
32.73
FuzzyCMeans2320
23
EuclideanDistance
0.6312
0.414
34.41
FuzzyCMeans2420
24
EuclideanDistance
0.6253
0.4017
35.76
FuzzyCMeans2520
25
EuclideanDistance
0.6213
0.3977
35.99
FuzzyCMeans2620
26
EuclideanDistance
0.6027
0.3872
35.76
FuzzyCMeans2720
27
EuclideanDistance
0.594
0.3844
35.29
FuzzyCMeans2820
28
EuclideanDistance
0.5865
0.3759
35.91
FuzzyCMeans2920
29
EuclideanDistance
0.5711
0.3757
34.21
FuzzyCMeans3020
30
EuclideanDistance
0.5594
0.3566
36.25
delta
Cluster Algorithm
k
Distance Function
Silhouette with Word2VecAdd
Silhouette without Word2VecAdd
Difference
KMeans220
2
EuclideanDistance
0.5973
0.5872
1.69
FuzzyCMeans220
2
EuclideanDistance
0.5417
0.5849
-7.97
KMeans3020
30
EuclideanDistance
0.6494
0.5797
10.73
KMeans2920
29
EuclideanDistance
0.6548
0.5836
10.87
KMeans2820
28
EuclideanDistance
0.6586
0.5881
10.7
KMeans2720
27
EuclideanDistance
0.6641
0.5903
11.11
Neural Gas
2
EuclideanDistance
0.5
0.5828
-16.56
KMeans2620
26
EuclideanDistance
0.6657
0.5941
10.76
KMeans2520
25
EuclideanDistance
0.6713
0.5997
10.67
KMeans2320
23
EuclideanDistance
0.6789
0.6037
11.08
KMeans2420
24
EuclideanDistance
0.6777
0.6009
11.33
KMeans2220
22
EuclideanDistance
0.6851
0.6034
11.93
KMeans2120
21
EuclideanDistance
0.6906
0.6094
11.76
KMeans2020
20
EuclideanDistance
0.6964
0.6123
12.08
KMeans1920
19
EuclideanDistance
0.6988
0.618
11.56
KMeans1820
18
EuclideanDistance
0.7012
0.6218
11.32
KMeans1720
17
EuclideanDistance
0.7041
0.6248
11.26
KMeans1620
16
EuclideanDistance
0.7103
0.6298
11.33
KMeans1520
15
EuclideanDistance
0.7094
0.6334
10.71
KMeans1420
14
EuclideanDistance
0.714
0.6287
11.95
KMeans320
3
EuclideanDistance
0.5514
0.5522
-0.15
KMeans1320
13
EuclideanDistance
0.7117
0.6301
11.47
KMeans1220
12
EuclideanDistance
0.7104
0.6275
11.67
KMeans1120
11
EuclideanDistance
0.7099
0.6267
11.72
KMeans1020
10
EuclideanDistance
0.7031
0.6226
11.45
FuzzyCMeans320
3
EuclideanDistance
0.5086
0.5451
-7.18
KMeans920
9
EuclideanDistance
0.6913
0.6199
10.33
KMeans420
4
EuclideanDistance
0.569
0.5653
0.65
KMeans820
8
EuclideanDistance
0.6786
0.6183
8.89
FuzzyCMeans420
4
EuclideanDistance
0.4509
0.5503
-22.04
KMeans720
7
EuclideanDistance
0.6571
0.6174
6.04
KMeans520
5
EuclideanDistance
0.5931
0.6056
-2.11
FuzzyCMeans520
5
EuclideanDistance
0.5117
0.5213
-1.88
FuzzyCMeans620
6
EuclideanDistance
0.6005
0.6518
-8.54
KMeans620
6
EuclideanDistance
0.6378
0.6194
2.88
FuzzyCMeans720
7
EuclideanDistance
0.6395
0.6099
4.63
FuzzyCMeans820
8
EuclideanDistance
0.6493
0.6093
6.16
FuzzyCMeans920
9
EuclideanDistance
0.6577
0.5746
12.63
FuzzyCMeans1120
11
EuclideanDistance
0.6782
0.5508
18.79
FuzzyCMeans1020
10
EuclideanDistance
0.6744
0.5685
15.7
FuzzyCMeans1220
12
EuclideanDistance
0.7137
0.5551
22.22
FuzzyCMeans1320
13
EuclideanDistance
0.7169
0.5471
23.69
FuzzyCMeans1420
14
EuclideanDistance
0.7142
0.5256
26.41
FuzzyCMeans1520
15
EuclideanDistance
0.7181
0.5103
28.94
FuzzyCMeans1620
16
EuclideanDistance
0.7195
0.5051
29.8
FuzzyCMeans1720
17
EuclideanDistance
0.7149
0.5043
29.46
FuzzyCMeans1820
18
EuclideanDistance
0.7093
0.4949
30.23
FuzzyCMeans1920
19
EuclideanDistance
0.7067
0.4898
30.69
FuzzyCMeans2020
20
EuclideanDistance
0.6914
0.49
29.13
FuzzyCMeans2120
21
EuclideanDistance
0.6866
0.4818
29.83
FuzzyCMeans2220
22
EuclideanDistance
0.6748
0.4801
28.85
FuzzyCMeans2320
23
EuclideanDistance
0.6652
0.4737
28.79
FuzzyCMeans2420
24
EuclideanDistance
0.6507
0.4531
30.37
FuzzyCMeans2520
25
EuclideanDistance
0.6477
0.4445
31.37
FuzzyCMeans2620
26
EuclideanDistance
0.6462
0.4364
32.47
FuzzyCMeans2720
27
EuclideanDistance
0.6413
0.4279
33.28
FuzzyCMeans2820
28
EuclideanDistance
0.6359
0.4162
34.55
FuzzyCMeans2920
29
EuclideanDistance
0.6153
0.4115
33.12
FuzzyCMeans3020
30
EuclideanDistance
0.6017
0.4035
32.94
Impact of Word2VecAverage, external
select *, round(("F1 with Word2VecAverage"-"F1 without Word2VecAverage")/"F1 with Word2VecAverage"*100, 2) as "Difference in %" from (
select a.ClusterAlgorithm as "Cluster Algorithm", a.DistanceFunction as "Distance Function", max(a.F1WeightedAvg) as "F1 with Word2VecAverage", max(b.F1WeightedAvg) as "F1 without Word2VecAverage" from delta a
left outer join delta b on (b.ClusterAlgorithm = a.ClusterAlgorithm and a.DistanceFunction = b.DistanceFunction)
where a.Word2VecAverage = "true" and b.Word2VecAverage = "false"
group by a.ClusterAlgorithm, a.DistanceFunction
order by a.F1WeightedAvg desc
)
alpha
Cluster Algorithm
Distance Function
F1 with Word2VecAverage
F1 without Word2VecAverage
Difference in %
KMeans2320
CosineDistance
0.3209
0.3165
1.37
FuzzyCMeans2320
CosineDistance
0.3134
0.3443
-9.86
KMeans2320
EuclideanDistance
0.299
0.2845
4.85
KMeans2320
WordEmbDistance
0.2465
0.2465
0.0
Neural Gas
CosineDistance
0.2314
0.236
-1.99
FuzzyCMeans2320
EuclideanDistance
0.2234
0.2619
-17.23
Neural Gas
EuclideanDistance
0.2475
0.2347
5.17
beta
Cluster Algorithm
Distance Function
F1 with Word2VecAverage
F1 without Word2VecAverage
Difference in %
Neural Gas
EuclideanDistance
0.4872
0.4509
7.45
KMeans1520
WordEmbDistance
0.459
0.459
0.0
FuzzyCMeans1520
EuclideanDistance
0.381
0.4618
-21.21
Neural Gas
CosineDistance
0.5284
0.5297
-0.25
KMeans1520
EuclideanDistance
0.3252
0.4282
-31.67
KMeans1520
CosineDistance
0.3206
0.4161
-29.79
FuzzyCMeans1520
CosineDistance
0.3277
0.4258
-29.94
gamma
Cluster Algorithm
Distance Function
F1 with Word2VecAverage
F1 without Word2VecAverage
Difference in %
KMeans1720
EuclideanDistance
0.4097
0.463
-13.01
KMeans1720
CosineDistance
0.3834
0.5184
-35.21
Neural Gas
CosineDistance
0.4083
0.3831
6.17
FuzzyCMeans1720
EuclideanDistance
0.3548
0.4352
-22.66
KMeans1720
WordEmbDistance
0.3497
0.3494
0.09
Neural Gas
EuclideanDistance
0.3892
0.3764
3.29
FuzzyCMeans1720
CosineDistance
0.3048
0.4353
-42.81
delta
Cluster Algorithm
Distance Function
F1 with Word2VecAverage
F1 without Word2VecAverage
Difference in %
Neural Gas
EuclideanDistance
0.4552
0.5082
-11.64
FuzzyCMeans1620
EuclideanDistance
0.4394
0.4323
1.62
Neural Gas
CosineDistance
0.4357
0.5102
-17.1
KMeans1620
EuclideanDistance
0.3971
0.4248
-6.98
KMeans1620
WordEmbDistance
0.4187
0.4187
0.0
KMeans1620
CosineDistance
0.3478
0.4604
-32.37
FuzzyCMeans1620
CosineDistance
0.2863
0.3843
-34.23
Impact of Word2VecAverage, internal
select *, round(("Silhouette with Word2VecAverage"-"Silhouette without Word2VecAverage")/"Silhouette with Word2VecAverage"*100, 2) as "Difference" from (
select a.ClusterAlgorithm as "Cluster Algorithm", a.k as "k", a.DistanceFunction as "Distance Function", max(a.SilhouetteAvg) as "Silhouette with Word2VecAverage", max(b.SilhouetteAvg) as "Silhouette without Word2VecAverage" from gamma a
left outer join gamma b on (b.ClusterAlgorithm = a.ClusterAlgorithm and a.k = b.k and a.DistanceFunction = b.DistanceFunction)
where a.Word2VecAverage = "true" and b.Word2VecAverage = "false"
group by a.ClusterAlgorithm
order by a.SilhouetteAvg desc
)
alpha
Cluster Algorithm
k
Distance Function
Silhouette with Word2VecAverage
Silhouette without Word2VecAverage
Difference
KMeans220
2
EuclideanDistance
0.8006
0.9084
-13.46
KMeans320
3
EuclideanDistance
0.5463
0.5651
-3.44
KMeans420
4
EuclideanDistance
0.6086
0.5816
4.44
KMeans520
5
EuclideanDistance
0.624
0.6395
-2.48
KMeans620
6
EuclideanDistance
0.6459
0.6854
-6.12
KMeans720
7
EuclideanDistance
0.6271
0.713
-13.7
KMeans2920
29
EuclideanDistance
0.5445
0.6487
-19.14
KMeans3020
30
EuclideanDistance
0.5416
0.6461
-19.29
KMeans2820
28
EuclideanDistance
0.5491
0.6566
-19.58
KMeans2720
27
EuclideanDistance
0.5502
0.6606
-20.07
KMeans2620
26
EuclideanDistance
0.5566
0.6719
-20.72
KMeans820
8
EuclideanDistance
0.6212
0.726
-16.87
KMeans2520
25
EuclideanDistance
0.5611
0.6801
-21.21
KMeans2420
24
EuclideanDistance
0.5644
0.683
-21.01
KMeans920
9
EuclideanDistance
0.6242
0.7344
-17.65
KMeans2320
23
EuclideanDistance
0.568
0.689
-21.3
KMeans2220
22
EuclideanDistance
0.5704
0.6967
-22.14
KMeans2120
21
EuclideanDistance
0.5747
0.6994
-21.7
KMeans1020
10
EuclideanDistance
0.6167
0.7351
-19.2
KMeans1920
19
EuclideanDistance
0.5854
0.7047
-20.38
KMeans2020
20
EuclideanDistance
0.5813
0.7005
-20.51
KMeans1820
18
EuclideanDistance
0.5852
0.7074
-20.88
KMeans1720
17
EuclideanDistance
0.5901
0.715
-21.17
KMeans1520
15
EuclideanDistance
0.599
0.7196
-20.13
KMeans1620
16
EuclideanDistance
0.5949
0.7166
-20.46
KMeans1120
11
EuclideanDistance
0.6129
0.7332
-19.63
KMeans1220
12
EuclideanDistance
0.6037
0.7289
-20.74
KMeans1420
14
EuclideanDistance
0.6022
0.7251
-20.41
KMeans1320
13
EuclideanDistance
0.6045
0.7282
-20.46
FuzzyCMeans220
2
EuclideanDistance
0.5666
0.5248
7.38
Neural Gas
2
EuclideanDistance
0.545
0.491
9.91
FuzzyCMeans520
5
EuclideanDistance
0.525
0.6151
-17.16
FuzzyCMeans420
4
EuclideanDistance
0.5507
0.5396
2.02
FuzzyCMeans720
7
EuclideanDistance
0.6654
0.7085
-6.48
FuzzyCMeans620
6
EuclideanDistance
0.6167
0.6721
-8.98
FuzzyCMeans820
8
EuclideanDistance
0.6116
0.7434
-21.55
FuzzyCMeans1020
10
EuclideanDistance
0.5811
0.7643
-31.53
FuzzyCMeans920
9
EuclideanDistance
0.5927
0.7375
-24.43
FuzzyCMeans1120
11
EuclideanDistance
0.5698
0.7854
-37.84
FuzzyCMeans1220
12
EuclideanDistance
0.5588
0.7803
-39.64
FuzzyCMeans1320
13
EuclideanDistance
0.5496
0.7681
-39.76
FuzzyCMeans1620
16
EuclideanDistance
0.5324
0.7376
-38.54
FuzzyCMeans1420
14
EuclideanDistance
0.5425
0.7644
-40.9
FuzzyCMeans1520
15
EuclideanDistance
0.5377
0.7584
-41.05
FuzzyCMeans320
3
EuclideanDistance
0.5406
0.4912
9.14
FuzzyCMeans1720
17
EuclideanDistance
0.518
0.7295
-40.83
FuzzyCMeans1920
19
EuclideanDistance
0.5064
0.7059
-39.4
FuzzyCMeans1820
18
EuclideanDistance
0.5126
0.7062
-37.77
FuzzyCMeans2020
20
EuclideanDistance
0.5063
0.6975
-37.76
FuzzyCMeans2120
21
EuclideanDistance
0.5051
0.6797
-34.57
FuzzyCMeans2220
22
EuclideanDistance
0.4965
0.6777
-36.5
FuzzyCMeans2320
23
EuclideanDistance
0.4981
0.6656
-33.63
FuzzyCMeans2420
24
EuclideanDistance
0.4977
0.6549
-31.59
FuzzyCMeans2520
25
EuclideanDistance
0.4951
0.6443
-30.14
FuzzyCMeans2820
28
EuclideanDistance
0.4834
0.6222
-28.71
FuzzyCMeans2920
29
EuclideanDistance
0.4814
0.6109
-26.9
FuzzyCMeans2620
26
EuclideanDistance
0.4974
0.6428
-29.23
FuzzyCMeans2720
27
EuclideanDistance
0.4921
0.6279
-27.6
FuzzyCMeans3020
30
EuclideanDistance
0.4772
0.5966
-25.02
beta
Cluster Algorithm
k
Distance Function
Silhouette with Word2VecAverage
Silhouette without Word2VecAverage
Difference
KMeans220
2
EuclideanDistance
0.5709
0.5534
3.07
KMeans3020
30
EuclideanDistance
0.503
0.5654
-12.41
KMeans2920
29
EuclideanDistance
0.5056
0.571
-12.94
KMeans2820
28
EuclideanDistance
0.5069
0.5785
-14.13
KMeans2720
27
EuclideanDistance
0.5084
0.5849
-15.05
KMeans2620
26
EuclideanDistance
0.5105
0.5908
-15.73
FuzzyCMeans220
2
EuclideanDistance
0.579
0.557
3.8
KMeans2420
24
EuclideanDistance
0.5164
0.6071
-17.56
KMeans2520
25
EuclideanDistance
0.5123
0.6009
-17.29
KMeans2320
23
EuclideanDistance
0.5183
0.6191
-19.45
KMeans2220
22
EuclideanDistance
0.5234
0.6278
-19.95
KMeans2120
21
EuclideanDistance
0.5243
0.6357
-21.25
FuzzyCMeans620
6
EuclideanDistance
0.596
0.6057
-1.63
KMeans2020
20
EuclideanDistance
0.5278
0.6458
-22.36
Neural Gas
2
EuclideanDistance
0.5588
0.5557
0.55
KMeans1920
19
EuclideanDistance
0.5308
0.652
-22.83
FuzzyCMeans720
7
EuclideanDistance
0.5371
0.6127
-14.08
KMeans1820
18
EuclideanDistance
0.5394
0.6598
-22.32
FuzzyCMeans520
5
EuclideanDistance
0.5323
0.5089
4.4
KMeans1720
17
EuclideanDistance
0.5458
0.6663
-22.08
KMeans1620
16
EuclideanDistance
0.5463
0.6716
-22.94
FuzzyCMeans820
8
EuclideanDistance
0.5598
0.6004
-7.25
KMeans1520
15
EuclideanDistance
0.5486
0.6781
-23.61
KMeans1420
14
EuclideanDistance
0.5506
0.6819
-23.85
KMeans1320
13
EuclideanDistance
0.5474
0.6794
-24.11
KMeans1220
12
EuclideanDistance
0.548
0.6761
-23.38
KMeans1120
11
EuclideanDistance
0.5492
0.6721
-22.38
KMeans1020
10
EuclideanDistance
0.5509
0.6662
-20.93
KMeans920
9
EuclideanDistance
0.5576
0.6509
-16.73
FuzzyCMeans920
9
EuclideanDistance
0.5729
0.6149
-7.33
FuzzyCMeans420
4
EuclideanDistance
0.5243
0.481
8.26
KMeans820
8
EuclideanDistance
0.5625
0.6311
-12.2
KMeans320
3
EuclideanDistance
0.5533
0.5525
0.14
KMeans720
7
EuclideanDistance
0.5772
0.6117
-5.98
KMeans620
6
EuclideanDistance
0.5848
0.5868
-0.34
FuzzyCMeans1020
10
EuclideanDistance
0.5596
0.6063
-8.35
KMeans520
5
EuclideanDistance
0.5702
0.5505
3.45
KMeans420
4
EuclideanDistance
0.5466
0.5477
-0.2
FuzzyCMeans1120
11
EuclideanDistance
0.5477
0.6057
-10.59
FuzzyCMeans320
3
EuclideanDistance
0.5346
0.4548
14.93
FuzzyCMeans1220
12
EuclideanDistance
0.5248
0.6362
-21.23
FuzzyCMeans1320
13
EuclideanDistance
0.5036
0.6435
-27.78
FuzzyCMeans1420
14
EuclideanDistance
0.4756
0.6509
-36.86
FuzzyCMeans1820
18
EuclideanDistance
0.4202
0.6297
-49.86
FuzzyCMeans2020
20
EuclideanDistance
0.397
0.6075
-53.02
FuzzyCMeans1720
17
EuclideanDistance
0.4315
0.6392
-48.13
FuzzyCMeans1920
19
EuclideanDistance
0.4036
0.615
-52.38
FuzzyCMeans1520
15
EuclideanDistance
0.4604
0.6559
-42.46
FuzzyCMeans2120
21
EuclideanDistance
0.3912
0.5949
-52.07
FuzzyCMeans2220
22
EuclideanDistance
0.3801
0.5811
-52.88
FuzzyCMeans1620
16
EuclideanDistance
0.4493
0.6482
-44.27
FuzzyCMeans2320
23
EuclideanDistance
0.3741
0.5763
-54.05
FuzzyCMeans2420
24
EuclideanDistance
0.3635
0.5599
-54.03
FuzzyCMeans2520
25
EuclideanDistance
0.3511
0.5537
-57.7
FuzzyCMeans2720
27
EuclideanDistance
0.33
0.5319
-61.18
FuzzyCMeans2620
26
EuclideanDistance
0.3487
0.5492
-57.5
FuzzyCMeans2820
28
EuclideanDistance
0.3264
0.5177
-58.61
FuzzyCMeans2920
29
EuclideanDistance
0.3256
0.5044
-54.91
FuzzyCMeans3020
30
EuclideanDistance
0.316
0.5016
-58.73
gamma
Cluster Algorithm
k
Distance Function
Silhouette with Word2VecAverage
Silhouette without Word2VecAverage
Difference
Neural Gas
2
EuclideanDistance
0.5372
0.5772
-7.45
KMeans3020
30
EuclideanDistance
0.5606
0.6189
-10.4
KMeans2820
28
EuclideanDistance
0.5645
0.6285
-11.34
KMeans2920
29
EuclideanDistance
0.5617
0.6246
-11.2
KMeans2720
27
EuclideanDistance
0.567
0.6338
-11.78
KMeans2620
26
EuclideanDistance
0.5701
0.6385
-12.0
KMeans2520
25
EuclideanDistance
0.5734
0.6411
-11.81
KMeans2420
24
EuclideanDistance
0.578
0.6496
-12.39
KMeans2320
23
EuclideanDistance
0.5795
0.6512
-12.37
KMeans2120
21
EuclideanDistance
0.5872
0.6597
-12.35
KMeans2220
22
EuclideanDistance
0.5837
0.6569
-12.54
KMeans2020
20
EuclideanDistance
0.591
0.6655
-12.61
KMeans1920
19
EuclideanDistance
0.5943
0.6755
-13.66
KMeans1820
18
EuclideanDistance
0.5989
0.6827
-13.99
KMeans1720
17
EuclideanDistance
0.6022
0.6843
-13.63
KMeans1620
16
EuclideanDistance
0.6056
0.6919
-14.25
KMeans1520
15
EuclideanDistance
0.6065
0.6983
-15.14
KMeans1420
14
EuclideanDistance
0.6103
0.7039
-15.34
KMeans1320
13
EuclideanDistance
0.6128
0.7073
-15.42
KMeans1220
12
EuclideanDistance
0.6133
0.7102
-15.8
KMeans1120
11
EuclideanDistance
0.6196
0.7053
-13.83
KMeans1020
10
EuclideanDistance
0.6221
0.7081
-13.82
KMeans220
2
EuclideanDistance
0.5666
0.5975
-5.45
KMeans920
9
EuclideanDistance
0.6237
0.7036
-12.81
KMeans820
8
EuclideanDistance
0.6196
0.6957
-12.28
KMeans720
7
EuclideanDistance
0.6159
0.6784
-10.15
KMeans620
6
EuclideanDistance
0.6113
0.6584
-7.7
KMeans520
5
EuclideanDistance
0.6182
0.6366
-2.98
KMeans420
4
EuclideanDistance
0.6004
0.5889
1.92
FuzzyCMeans220
2
EuclideanDistance
0.5598
0.5943
-6.16
KMeans320
3
EuclideanDistance
0.596
0.57
4.36
FuzzyCMeans720
7
EuclideanDistance
0.5812
0.6202
-6.71
FuzzyCMeans620
6
EuclideanDistance
0.6434
0.6714
-4.35
FuzzyCMeans520
5
EuclideanDistance
0.6258
0.6255
0.05
FuzzyCMeans820
8
EuclideanDistance
0.5536
0.6453
-16.56
FuzzyCMeans420
4
EuclideanDistance
0.5813
0.5701
1.93
FuzzyCMeans920
9
EuclideanDistance
0.5386
0.6243
-15.91
FuzzyCMeans320
3
EuclideanDistance
0.5535
0.5697
-2.93
FuzzyCMeans1020
10
EuclideanDistance
0.5278
0.6394
-21.14
FuzzyCMeans1120
11
EuclideanDistance
0.4999
0.6259
-25.21
FuzzyCMeans1220
12
EuclideanDistance
0.4837
0.6468
-33.72
FuzzyCMeans1320
13
EuclideanDistance
0.4713
0.66
-40.04
FuzzyCMeans1420
14
EuclideanDistance
0.4631
0.6593
-42.37
FuzzyCMeans1520
15
EuclideanDistance
0.4544
0.6707
-47.6
FuzzyCMeans1620
16
EuclideanDistance
0.4487
0.6795
-51.44
FuzzyCMeans1720
17
EuclideanDistance
0.4392
0.6799
-54.8
FuzzyCMeans1820
18
EuclideanDistance
0.4363
0.6639
-52.17
FuzzyCMeans2020
20
EuclideanDistance
0.427
0.6515
-52.58
FuzzyCMeans1920
19
EuclideanDistance
0.4351
0.667
-53.3
FuzzyCMeans2120
21
EuclideanDistance
0.4215
0.6392
-51.65
FuzzyCMeans2220
22
EuclideanDistance
0.4246
0.6312
-48.66
FuzzyCMeans2320
23
EuclideanDistance
0.414
0.6312
-52.46
FuzzyCMeans2420
24
EuclideanDistance
0.4017
0.6253
-55.66
FuzzyCMeans2520
25
EuclideanDistance
0.3977
0.6213
-56.22
FuzzyCMeans2620
26
EuclideanDistance
0.3872
0.6027
-55.66
FuzzyCMeans2720
27
EuclideanDistance
0.3844
0.594
-54.53
FuzzyCMeans2820
28
EuclideanDistance
0.3759
0.5865
-56.03
FuzzyCMeans2920
29
EuclideanDistance
0.3757
0.5711
-52.01
FuzzyCMeans3020
30
EuclideanDistance
0.3566
0.5594
-56.87
delta
Cluster Algorithm
k
Distance Function
Silhouette with Word2VecAverage
Silhouette without Word2VecAverage
Difference
Neural Gas
3
CosineDistance
0.5828
0.5038
13.56
KMeans3020
30
EuclideanDistance
0.5797
0.6494
-12.02
KMeans2920
29
EuclideanDistance
0.5836
0.6548
-12.2
KMeans2820
28
EuclideanDistance
0.5881
0.6586
-11.99
KMeans2720
27
EuclideanDistance
0.5903
0.6641
-12.5
KMeans2620
26
EuclideanDistance
0.5941
0.6657
-12.05
KMeans2520
25
EuclideanDistance
0.5997
0.6713
-11.94
KMeans2320
23
EuclideanDistance
0.6037
0.6789
-12.46
KMeans2420
24
EuclideanDistance
0.6009
0.6777
-12.78
KMeans2220
22
EuclideanDistance
0.6034
0.6851
-13.54
KMeans2120
21
EuclideanDistance
0.6094
0.6906
-13.32
KMeans2020
20
EuclideanDistance
0.6123
0.6964
-13.74
KMeans1920
19
EuclideanDistance
0.618
0.6988
-13.07
KMeans1820
18
EuclideanDistance
0.6218
0.7012
-12.77
KMeans1720
17
EuclideanDistance
0.6248
0.7041
-12.69
KMeans1620
16
EuclideanDistance
0.6298
0.7103
-12.78
KMeans1520
15
EuclideanDistance
0.6334
0.7094
-12.0
KMeans1420
14
EuclideanDistance
0.6287
0.714
-13.57
KMeans220
2
EuclideanDistance
0.5872
0.5973
-1.72
KMeans1320
13
EuclideanDistance
0.6301
0.7117
-12.95
KMeans1220
12
EuclideanDistance
0.6275
0.7104
-13.21
KMeans1120
11
EuclideanDistance
0.6267
0.7099
-13.28
KMeans1020
10
EuclideanDistance
0.6226
0.7031
-12.93
KMeans920
9
EuclideanDistance
0.6199
0.6913
-11.52
KMeans820
8
EuclideanDistance
0.6183
0.6786
-9.75
FuzzyCMeans220
2
EuclideanDistance
0.5849
0.5417
7.39
FuzzyCMeans420
4
EuclideanDistance
0.5503
0.4509
18.06
KMeans720
7
EuclideanDistance
0.6174
0.6571
-6.43
FuzzyCMeans520
5
EuclideanDistance
0.5213
0.5117
1.84
KMeans320
3
EuclideanDistance
0.5522
0.5514
0.14
KMeans620
6
EuclideanDistance
0.6194
0.6378
-2.97
KMeans520
5
EuclideanDistance
0.6056
0.5931
2.06
FuzzyCMeans620
6
EuclideanDistance
0.6518
0.6005
7.87
KMeans420
4
EuclideanDistance
0.5653
0.569
-0.65
FuzzyCMeans720
7
EuclideanDistance
0.6099
0.6395
-4.85
FuzzyCMeans820
8
EuclideanDistance
0.6093
0.6493
-6.56
FuzzyCMeans320
3
EuclideanDistance
0.5451
0.5086
6.7
FuzzyCMeans920
9
EuclideanDistance
0.5746
0.6577
-14.46
FuzzyCMeans1120
11
EuclideanDistance
0.5508
0.6782
-23.13
FuzzyCMeans1020
10
EuclideanDistance
0.5685
0.6744
-18.63
FuzzyCMeans1220
12
EuclideanDistance
0.5551
0.7137
-28.57
FuzzyCMeans1320
13
EuclideanDistance
0.5471
0.7169
-31.04
FuzzyCMeans1420
14
EuclideanDistance
0.5256
0.7142
-35.88
FuzzyCMeans1520
15
EuclideanDistance
0.5103
0.7181
-40.72
FuzzyCMeans1620
16
EuclideanDistance
0.5051
0.7195
-42.45
FuzzyCMeans1720
17
EuclideanDistance
0.5043
0.7149
-41.76
FuzzyCMeans1820
18
EuclideanDistance
0.4949
0.7093
-43.32
FuzzyCMeans1920
19
EuclideanDistance
0.4898
0.7067
-44.28
FuzzyCMeans2520
25
EuclideanDistance
0.4445
0.6477
-45.71
FuzzyCMeans2220
22
EuclideanDistance
0.4801
0.6748
-40.55
FuzzyCMeans2320
23
EuclideanDistance
0.4737
0.6652
-40.43
FuzzyCMeans2420
24
EuclideanDistance
0.4531
0.6507
-43.61
FuzzyCMeans2020
20
EuclideanDistance
0.49
0.6914
-41.1
FuzzyCMeans2620
26
EuclideanDistance
0.4364
0.6462
-48.08
FuzzyCMeans2120
21
EuclideanDistance
0.4818
0.6866
-42.51
FuzzyCMeans2720
27
EuclideanDistance
0.4279
0.6413
-49.87
FuzzyCMeans2920
29
EuclideanDistance
0.4115
0.6153
-49.53
FuzzyCMeans2820
28
EuclideanDistance
0.4162
0.6359
-52.79
FuzzyCMeans3020
30
EuclideanDistance
0.4035
0.6017
-49.12
Impact of WordEmbeddings and Ontologies external
select "Cluster Algorithm", "baseline F1", round(("ontologies F1"-"baseline F1")/"baseline F1"*100,2) || ' %' "ontologies F1 impact", round(("wordembeddings F1"-"baseline F1")/"baseline F1"*100,2) || ' %' "wordembeddings F1 impact", round(("both F1"-"baseline F1")/"baseline F1"*100,2) || ' %' "both F1 impact" from(
select baseline.ClusterAlgorithm as "Cluster Algorithm", max(baseline.F1WeightedAvg) "baseline F1", max(ontologies.F1WeightedAvg) "ontologies F1", max(wordembeddings.F1WeightedAvg) "wordembeddings F1", max(both.F1WeightedAvg) "both F1" from delta baseline
left outer join delta ontologies on (ontologies.ClusterAlgorithm = baseline.ClusterAlgorithm and baseline.DistanceFunction = ontologies.DistanceFunction and ((ontologies.synonyms = "true" or ontologies.germanetfunction = "true") and ontologies.Word2VecAdd = "false" and ontologies.Word2VecAverage = "false" and ontologies.distancefunction <> "WordEmbDistance"))
left outer join delta wordembeddings on (wordembeddings.ClusterAlgorithm = baseline.ClusterAlgorithm and baseline.DistanceFunction = wordembeddings.DistanceFunction and ((wordembeddings.Word2VecAdd = "true" or wordembeddings.Word2VecAverage = "true") and wordembeddings.distancefunction <> "WordEmbDistance" and wordembeddings.synonyms = "false" and wordembeddings.germanetfunction = "false"))
left outer join delta both on (both.ClusterAlgorithm = baseline.ClusterAlgorithm and baseline.DistanceFunction = both.DistanceFunction and ((both.Word2VecAdd = "true" or both.Word2VecAverage = "true") and both.distancefunction <> "WordEmbDistance" and (both.synonyms = "true" or both.germanetfunction = "true") ))
where baseline.Germanetfunction = "false" and baseline.Synonyms = "false" and baseline.Word2VecAdd = "false" and baseline.Word2VecAverage = "false" and baseline.distancefunction <> "WordEmbDistance"
group by baseline.ClusterAlgorithm
order by (both.F1WeightedAvg) desc
)
alpha
Cluster Algorithm
Baseline F1
ontologies F1 impact
wordembeddings F1 impact
both F1 impact
FuzzyCMeans2320
0.3443
-0.76 %
-6.91 %
-12.81 %
KMeans2320
0.2987
-0.74 %
7.43 %
0.1 %
Neural Gas
0.2053
10.28 %
-8.91 %
20.56 %
ClusterART
0.2383
-7.76 %
beta
Cluster Algorithm
Baseline F1
ontologies F1 impact
wordembeddings F1 impact
both F1 impact
Neural Gas
0.3921
34.79 %
16.93 %
35.09 %
FuzzyCMeans1520
0.4512
-7.14 %
2.35 %
-4.32 %
KMeans1520
0.428
0.05 %
-26.36 %
-24.02 %
ClusterART
0.4127
81.88 %
gamma
Cluster Algorithm
Baseline F1
ontologies F1 impact
wordembeddings F1 impact
both F1 impact
Neural Gas
0.3921
34.79 %
16.93 %
35.09 %
FuzzyCMeans1520
0.4512
-7.14 %
2.35 %
-4.32 %
KMeans1520
0.428
0.05 %
-26.36 %
-24.02 %
ClusterART
0.4127
81.88 %
delta
Cluster Algorithm
Baseline F1
ontologies F1 impact
wordembeddings F1 impact
both F1 impact
Neural Gas
0.5102
-0.18 %
-11.02 %
-10.78 %
FuzzyCMeans1620
0.4323
-10.55 %
1.64 %
-1.55 %
KMeans1620
0.4604
-2.26 %
-13.75 %
-14.29 %
ClusterART
0.5584
0.68 %
Impact of WordEmbeddings and Ontologies internal
select "Cluster Algorithm", "baseline SilhouetteAvg", round(("ontologies SilhouetteAvg"-"baseline SilhouetteAvg")/"baseline SilhouetteAvg"*100,2) || ' %' "ontologies SilhouetteAvg impact", round(("wordembeddings SilhouetteAvg"-"baseline SilhouetteAvg")/"baseline SilhouetteAvg"*100,2) || ' %' "wordembeddings SilhouetteAvg impact",
round(("both SilhouetteAvg"-"baseline SilhouetteAvg")/"baseline SilhouetteAvg"*100,2) || ' %' "both SilhouetteAvg impact" from(
select baseline.ClusterAlgorithm as "Cluster Algorithm", max(baseline.SilhouetteAvg) "baseline SilhouetteAvg", max(ontologies.SilhouetteAvg) "ontologies SilhouetteAvg", max(wordembeddings.SilhouetteAvg) "wordembeddings SilhouetteAvg", max(both.SilhouetteAvg) "both SilhouetteAvg" from delta baseline
left outer join delta ontologies on (ontologies.ClusterAlgorithm = baseline.ClusterAlgorithm and baseline.DistanceFunction = ontologies.DistanceFunction and ((ontologies.synonyms = "true" or ontologies.germanetfunction = "true") and ontologies.Word2VecAdd = "false" and ontologies.Word2VecAverage = "false" and ontologies.distancefunction <> "WordEmbDistance"))
left outer join delta wordembeddings on (wordembeddings.ClusterAlgorithm = baseline.ClusterAlgorithm and baseline.DistanceFunction = wordembeddings.DistanceFunction and ((wordembeddings.Word2VecAdd = "true" or wordembeddings.Word2VecAverage = "true") and wordembeddings.distancefunction <> "WordEmbDistance" and wordembeddings.synonyms = "false" and wordembeddings.germanetfunction = "false"))
left outer join delta both on (both.ClusterAlgorithm = baseline.ClusterAlgorithm and baseline.DistanceFunction = both.DistanceFunction and ((both.Word2VecAdd = "true" or both.Word2VecAverage = "true") and both.distancefunction <> "WordEmbDistance" and (both.synonyms = "true" or both.germanetfunction = "true") ))
where baseline.Germanetfunction = "false" and baseline.Synonyms = "false" and baseline.Word2VecAdd = "false" and baseline.Word2VecAverage = "false" and baseline.distancefunction <> "WordEmbDistance"
group by baseline.ClusterAlgorithm
order by (both.SilhouetteAvg) desc
)