From 6e7f2206197fe3e142d5c2edfc35cd4ffb8a50d0 Mon Sep 17 00:00:00 2001 From: Victor Zimmermann <zimmermann@cl.uni-heidelberg.de> Date: Tue, 13 Mar 2018 16:58:59 +0100 Subject: [PATCH] Newer results. Try5 on different dataset. --- results/out4.log | 1418 ++++++++++++++++++ results/try3.log | 278 ++++ results/try4.log | 3649 ++++++++++++++++++++++++++++++++++++++++++++++ results/try5.log | 3347 ++++++++++++++++++++++++++++++++++++++++++ 4 files changed, 8692 insertions(+) create mode 100644 results/out4.log create mode 100644 results/try3.log create mode 100644 results/try4.log create mode 100644 results/try5.log diff --git a/results/out4.log b/results/out4.log new file mode 100644 index 0000000..dc4cb40 --- /dev/null +++ b/results/out4.log @@ -0,0 +1,1418 @@ +[A] Loading absinth.py. + +[a] Counting nodes and edges. death_by_chocolate +[a] ~00% Nodes: 0 Edges: 0. death_by_chocolate +[a] ~09% Nodes: 15 Edges: 105. death_by_chocolate +[a] ~19% Nodes: 56 Edges: 661. death_by_chocolate +[a] ~29% Nodes: 226 Edges: 3566. death_by_chocolate +[a] ~39% Nodes: 226 Edges: 3566. death_by_chocolate +[a] ~49% Nodes: 243 Edges: 3719. death_by_chocolate +[a] ~59% Nodes: 444 Edges: 9158. death_by_chocolate +[a] ~69% Nodes: 444 Edges: 9158. death_by_chocolate +[a] ~79% Nodes: 456 Edges: 9302. death_by_chocolate +[a] ~89% Nodes: 482 Edges: 9836. death_by_chocolate +[a] ~99% Nodes: 506 Edges: 10214. death_by_chocolate +[a] 100% Nodes: 506 Edges: 10214. death_by_chocolate +[a] Building graph. death_by_chocolate +[a] Collecting root hubs. death_by_chocolate +[a] Building minimum spanning tree. death_by_chocolate +[a] Disambiguating results. death_by_chocolate +[a] Writing to file. death_by_chocolate + +[A] Word sense induction for 'death_by_chocolate': +[A] Nodes: 506 Edges: 10214 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. storm_in_a_teacup +[a] ~00% Nodes: 0 Edges: 0. storm_in_a_teacup +[a] ~09% Nodes: 285 Edges: 4630. storm_in_a_teacup +[a] ~19% Nodes: 459 Edges: 7666. storm_in_a_teacup +[a] ~29% Nodes: 691 Edges: 13078. storm_in_a_teacup +[a] ~39% Nodes: 792 Edges: 16080. storm_in_a_teacup +[a] ~49% Nodes: 931 Edges: 19147. storm_in_a_teacup +[a] ~59% Nodes: 1197 Edges: 27907. storm_in_a_teacup +[a] ~69% Nodes: 1384 Edges: 33634. storm_in_a_teacup +[a] ~79% Nodes: 1499 Edges: 37377. storm_in_a_teacup +[a] ~89% Nodes: 1583 Edges: 40413. storm_in_a_teacup +[a] ~99% Nodes: 1653 Edges: 43224. storm_in_a_teacup +[a] 100% Nodes: 1653 Edges: 43224. storm_in_a_teacup +[a] Building graph. storm_in_a_teacup +[a] Collecting root hubs. storm_in_a_teacup +[a] Building minimum spanning tree. storm_in_a_teacup +[a] Disambiguating results. storm_in_a_teacup +[a] Writing to file. storm_in_a_teacup + +[A] Word sense induction for 'storm_in_a_teacup': +[A] Nodes: 1653 Edges: 43224 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. gay_bar +[a] ~00% Nodes: 0 Edges: 0. gay_bar +[a] ~09% Nodes: 1365 Edges: 44297. gay_bar +[a] ~19% Nodes: 2178 Edges: 74867. gay_bar +[a] ~29% Nodes: 2947 Edges: 122014. gay_bar +[a] ~39% Nodes: 3628 Edges: 162509. gay_bar +[a] ~49% Nodes: 4143 Edges: 193169. gay_bar +[a] ~59% Nodes: 4694 Edges: 240290. gay_bar +[a] ~69% Nodes: 5118 Edges: 269316. gay_bar +[a] ~79% Nodes: 5615 Edges: 310902. gay_bar +[a] ~89% Nodes: 6059 Edges: 349160. gay_bar +[a] ~99% Nodes: 6735 Edges: 400442. gay_bar +[a] 100% Nodes: 6735 Edges: 400442. gay_bar +[a] Building graph. gay_bar +[a] Collecting root hubs. gay_bar +[a] Building minimum spanning tree. gay_bar +[a] Disambiguating results. gay_bar +[a] Writing to file. gay_bar + +[A] Word sense induction for 'gay_bar': +[A] Nodes: 6735 Edges: 400442 +[A] Root hubs: + 1. gay: ['bar', 'first', 'city', 'men', 'police', 'york'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 5), (1, 6), (1, 7), (1, 9), (1, 10), (1, 11), (1, 12), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (1, 27), (1, 28), (1, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 68), (1, 70), (1, 71), (1, 72), (1, 73), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. another_day_in_paradise +[a] ~00% Nodes: 0 Edges: 0. another_day_in_paradise +[a] ~09% Nodes: 104 Edges: 1462. another_day_in_paradise +[a] ~19% Nodes: 494 Edges: 14133. another_day_in_paradise +[a] ~29% Nodes: 593 Edges: 17701. another_day_in_paradise +[a] ~39% Nodes: 800 Edges: 24420. another_day_in_paradise +[a] ~49% Nodes: 1020 Edges: 35772. another_day_in_paradise +[a] ~59% Nodes: 1112 Edges: 38293. another_day_in_paradise +[a] ~69% Nodes: 1201 Edges: 41413. another_day_in_paradise +[a] ~79% Nodes: 1252 Edges: 43286. another_day_in_paradise +[a] ~89% Nodes: 1302 Edges: 44880. another_day_in_paradise +[a] ~99% Nodes: 1404 Edges: 50812. another_day_in_paradise +[a] 100% Nodes: 1404 Edges: 50812. another_day_in_paradise +[a] Building graph. another_day_in_paradise +[a] Collecting root hubs. another_day_in_paradise +[a] Building minimum spanning tree. another_day_in_paradise +[a] Disambiguating results. another_day_in_paradise +[a] Writing to file. another_day_in_paradise + +[A] Word sense induction for 'another_day_in_paradise': +[A] Nodes: 1404 Edges: 50812 +[A] Root hubs: + 1. phil: ['song', 'collins', 'music', 'number', 'first', 'album'] +[A] Mapping: [(1, 1), (1, 2), (1, 6), (1, 7), (1, 11), (1, 14), (1, 15), (1, 17), (1, 21), (1, 22), (1, 26), (1, 27), (1, 31), (1, 32), (1, 37), (1, 50), (1, 51), (1, 54), (1, 59), (1, 60), (1, 64), (1, 65), (1, 72), (1, 73), (1, 75), (1, 77), (1, 78), (1, 79), (1, 84), (1, 87), (1, 88), (1, 91), (1, 92), (1, 93), (1, 98)] + +[a] Counting nodes and edges. cassius_marcellus_clay +[a] ~00% Nodes: 0 Edges: 0. cassius_marcellus_clay +[a] Building graph. cassius_marcellus_clay +[a] Collecting root hubs. cassius_marcellus_clay +[a] Building minimum spanning tree. cassius_marcellus_clay +[a] Disambiguating results. cassius_marcellus_clay +[a] Writing to file. cassius_marcellus_clay + +[A] Word sense induction for 'cassius_marcellus_clay': +[A] Nodes: 2331 Edges: 2414350 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. civil_disobedience +[a] ~00% Nodes: 0 Edges: 0. civil_disobedience +[a] ~16% Nodes: 3274 Edges: 179060. civil_disobedience +[a] ~27% Nodes: 5535 Edges: 331904. civil_disobedience +[a] ~36% Nodes: 7275 Edges: 535170. civil_disobedience +[a] ~43% Nodes: 8630 Edges: 689194. civil_disobedience +[a] ~49% Nodes: 9459 Edges: 765874. civil_disobedience +[a] ~59% Nodes: 10531 Edges: 876161. civil_disobedience +[a] ~69% Nodes: 11538 Edges: 988374. civil_disobedience +[a] ~79% Nodes: 12622 Edges: 1144458. civil_disobedience +[a] ~89% Nodes: 13460 Edges: 1255767. civil_disobedience +[a] ~99% Nodes: 14462 Edges: 1385381. civil_disobedience +[a] 100% Nodes: 14467 Edges: 1385791. civil_disobedience +[a] Building graph. civil_disobedience +[a] Collecting root hubs. civil_disobedience +[a] Building minimum spanning tree. civil_disobedience +[a] Disambiguating results. civil_disobedience +[a] Writing to file. civil_disobedience + +[A] Word sense induction for 'civil_disobedience': +[A] Nodes: 14467 Edges: 1385791 +[A] Root hubs: + 1. movement: ['india', 'congress', 'government', 'indian', 'gandhi', 'british'] + 2. thoreau: ['henry', 'david', 'essay', 'civil', 'resistance', 'government'] + 3. electronic: ['media', 'disturbance', 'protest', 'action', 'group', 'art'] + 4. island: ['people', 'protests', 'navy', 'days', 'puerto', 'u.s'] +[A] Mapping: [(1, 1), (2, 2), (1, 3), (2, 4), (1, 5), (2, 6), (2, 7), (1, 8), (2, 9), (2, 10), (1, 11), (1, 12), (2, 13), (1, 14), (2, 15), (2, 16), (1, 17), (1, 18), (2, 19), (2, 20), (1, 21), (2, 22), (2, 23), (2, 24), (2, 25), (2, 26), (1, 27), (1, 28), (1, 29), (2, 30), (2, 31), (2, 32), (2, 33), (1, 34), (1, 35), (1, 36), (2, 37), (2, 38), (2, 39), (2, 40), (2, 41), (2, 42), (2, 43), (2, 44), (2, 45), (1, 46), (2, 47), (1, 48), (2, 49), (2, 50), (1, 51), (1, 52), (2, 53), (2, 54), (2, 55), (3, 56), (2, 57), (2, 58), (2, 59), (1, 60), (1, 61), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (2, 68), (2, 69), (2, 70), (1, 71), (3, 72), (1, 73), (1, 74), (2, 75), (2, 76), (1, 77), (2, 78), (1, 79), (1, 80), (2, 81), (2, 82), (1, 83), (2, 84), (1, 85), (1, 86), (2, 87), (1, 88), (2, 89), (1, 90), (1, 91), (2, 92), (2, 93), (3, 94), (1, 95), (2, 96), (1, 97), (2, 98), (1, 99), (2, 100)] + +[a] Counting nodes and edges. bullet_in_the_head +[a] ~00% Nodes: 0 Edges: 0. bullet_in_the_head +[a] ~09% Nodes: 154 Edges: 2374. bullet_in_the_head +[a] ~19% Nodes: 536 Edges: 13557. bullet_in_the_head +[a] ~29% Nodes: 683 Edges: 18794. bullet_in_the_head +[a] ~39% Nodes: 808 Edges: 23306. bullet_in_the_head +[a] ~49% Nodes: 834 Edges: 23869. bullet_in_the_head +[a] ~59% Nodes: 970 Edges: 28583. bullet_in_the_head +[a] ~69% Nodes: 980 Edges: 28661. bullet_in_the_head +[a] ~79% Nodes: 1197 Edges: 36868. bullet_in_the_head +[a] ~89% Nodes: 1253 Edges: 39144. bullet_in_the_head +[a] ~99% Nodes: 1335 Edges: 41147. bullet_in_the_head +[a] 100% Nodes: 1335 Edges: 41147. bullet_in_the_head +[a] Building graph. bullet_in_the_head +[a] Collecting root hubs. bullet_in_the_head +[a] Building minimum spanning tree. bullet_in_the_head +[a] Disambiguating results. bullet_in_the_head +[a] Writing to file. bullet_in_the_head + +[A] Word sense induction for 'bullet_in_the_head': +[A] Nodes: 1335 Edges: 41147 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. junk_mail +[a] ~00% Nodes: 0 Edges: 0. junk_mail +[a] ~09% Nodes: 349 Edges: 6049. junk_mail +[a] ~19% Nodes: 663 Edges: 16927. junk_mail +[a] ~29% Nodes: 973 Edges: 27156. junk_mail +[a] ~39% Nodes: 1116 Edges: 29543. junk_mail +[a] ~49% Nodes: 1593 Edges: 46369. junk_mail +[a] ~59% Nodes: 1813 Edges: 53711. junk_mail +[a] ~69% Nodes: 2037 Edges: 61749. junk_mail +[a] ~79% Nodes: 2280 Edges: 72187. junk_mail +[a] ~89% Nodes: 2369 Edges: 75549. junk_mail +[a] ~99% Nodes: 2650 Edges: 122830. junk_mail +[a] 100% Nodes: 2650 Edges: 122830. junk_mail +[a] Building graph. junk_mail +[a] Collecting root hubs. junk_mail +[a] Building minimum spanning tree. junk_mail +[a] Disambiguating results. junk_mail +[a] Writing to file. junk_mail + +[A] Word sense induction for 'junk_mail': +[A] Nodes: 2650 Edges: 122830 +[A] Root hubs: + 1. mail: ['service', 'bulk', 'spam', 'first', 'office', 'advertising'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 6), (1, 8), (1, 10), (1, 12), (1, 13), (1, 15), (1, 16), (1, 17), (1, 18), (1, 20), (1, 22), (1, 24), (1, 25), (1, 26), (1, 27), (1, 28), (1, 30), (1, 31), (1, 33), (1, 35), (1, 38), (1, 40), (1, 41), (1, 43), (1, 44), (1, 45), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 55), (1, 56), (1, 58), (1, 60), (1, 62), (1, 63), (1, 64), (1, 65), (1, 67), (1, 68), (1, 69), (1, 70), (1, 72), (1, 73), (1, 75), (1, 78), (1, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 84), (1, 86), (1, 87), (1, 89), (1, 90), (1, 94), (1, 95), (1, 96), (1, 97)] + +[a] Counting nodes and edges. gorky_park +[a] ~00% Nodes: 0 Edges: 0. gorky_park +[a] ~09% Nodes: 420 Edges: 10011. gorky_park +[a] ~19% Nodes: 693 Edges: 16411. gorky_park +[a] ~29% Nodes: 887 Edges: 22068. gorky_park +[a] ~39% Nodes: 1138 Edges: 32279. gorky_park +[a] ~49% Nodes: 1253 Edges: 36583. gorky_park +[a] ~59% Nodes: 1470 Edges: 45317. gorky_park +[a] ~69% Nodes: 1688 Edges: 50624. gorky_park +[a] ~79% Nodes: 1961 Edges: 60583. gorky_park +[a] ~89% Nodes: 2147 Edges: 67468. gorky_park +[a] ~99% Nodes: 2329 Edges: 75151. gorky_park +[a] 100% Nodes: 2329 Edges: 75151. gorky_park +[a] Building graph. gorky_park +[a] Collecting root hubs. gorky_park +[a] Building minimum spanning tree. gorky_park +[a] Disambiguating results. gorky_park +[a] Writing to file. gorky_park + +[A] Word sense induction for 'gorky_park': +[A] Nodes: 2329 Edges: 75151 +[A] Root hubs: + 1. moscow: ['first', 'soviet', 'russia', 'russian', 'park', 'august'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 5), (1, 6), (1, 7), (1, 8), (1, 10), (1, 11), (1, 12), (1, 14), (1, 16), (1, 25), (1, 29), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 40), (1, 42), (1, 43), (1, 44), (1, 46), (1, 47), (1, 49), (1, 50), (1, 52), (1, 55), (1, 56), (1, 60), (1, 61), (1, 64), (1, 70), (1, 71), (1, 74), (1, 78), (1, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 89), (1, 91), (1, 92), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. micro_chip +[a] ~00% Nodes: 0 Edges: 0. micro_chip +[a] ~09% Nodes: 23 Edges: 253. micro_chip +[a] ~19% Nodes: 64 Edges: 729. micro_chip +[a] ~29% Nodes: 91 Edges: 1080. micro_chip +[a] ~39% Nodes: 91 Edges: 1080. micro_chip +[a] ~49% Nodes: 91 Edges: 1080. micro_chip +[a] ~59% Nodes: 113 Edges: 1333. micro_chip +[a] ~69% Nodes: 177 Edges: 3543. micro_chip +[a] ~79% Nodes: 177 Edges: 3543. micro_chip +[a] ~89% Nodes: 177 Edges: 3543. micro_chip +[a] ~99% Nodes: 220 Edges: 4013. micro_chip +[a] 100% Nodes: 220 Edges: 4013. micro_chip +[a] Building graph. micro_chip +[a] Collecting root hubs. micro_chip +[a] Building minimum spanning tree. micro_chip +[a] Disambiguating results. micro_chip +[a] Writing to file. micro_chip + +[A] Word sense induction for 'micro_chip': +[A] Nodes: 220 Edges: 4013 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. the_glass_bead_game +[a] ~00% Nodes: 0 Edges: 0. glass_bead_game +[a] ~09% Nodes: 220 Edges: 3036. glass_bead_game +[a] ~19% Nodes: 394 Edges: 7278. glass_bead_game +[a] ~29% Nodes: 466 Edges: 9925. glass_bead_game +[a] ~39% Nodes: 666 Edges: 17432. glass_bead_game +[a] ~49% Nodes: 928 Edges: 26746. glass_bead_game +[a] ~59% Nodes: 953 Edges: 27412. glass_bead_game +[a] ~69% Nodes: 965 Edges: 27563. glass_bead_game +[a] ~79% Nodes: 974 Edges: 27608. glass_bead_game +[a] ~89% Nodes: 1078 Edges: 33760. glass_bead_game +[a] ~99% Nodes: 1134 Edges: 37244. glass_bead_game +[a] 100% Nodes: 1134 Edges: 37244. glass_bead_game +[a] Building graph. the_glass_bead_game +[a] Collecting root hubs. the_glass_bead_game +[a] Building minimum spanning tree. the_glass_bead_game +[a] Disambiguating results. the_glass_bead_game +[a] Writing to file. the_glass_bead_game + +[A] Word sense induction for 'the_glass_bead_game': +[A] Nodes: 1134 Edges: 37244 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. the_colour_of_magic +[a] ~00% Nodes: 0 Edges: 0. colour_of_magic +[a] ~09% Nodes: 435 Edges: 10038. colour_of_magic +[a] ~19% Nodes: 629 Edges: 14443. colour_of_magic +[a] ~29% Nodes: 818 Edges: 19662. colour_of_magic +[a] ~39% Nodes: 884 Edges: 21206. colour_of_magic +[a] ~49% Nodes: 1062 Edges: 26965. colour_of_magic +[a] ~59% Nodes: 1244 Edges: 34500. colour_of_magic +[a] ~69% Nodes: 1293 Edges: 35783. colour_of_magic +[a] ~79% Nodes: 1461 Edges: 42607. colour_of_magic +[a] ~89% Nodes: 1682 Edges: 51512. colour_of_magic +[a] ~99% Nodes: 1786 Edges: 56335. colour_of_magic +[a] 100% Nodes: 1786 Edges: 56335. colour_of_magic +[a] Building graph. the_colour_of_magic +[a] Collecting root hubs. the_colour_of_magic +[a] Building minimum spanning tree. the_colour_of_magic +[a] Disambiguating results. the_colour_of_magic +[a] Writing to file. the_colour_of_magic + +[A] Word sense induction for 'the_colour_of_magic': +[A] Nodes: 1786 Edges: 56335 +[A] Root hubs: + 1. pratchett: ['terry', 'discworld', 'series', 'first', 'adaptation', 'novel'] +[A] Mapping: [(1, 1), (1, 2), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 23), (1, 24), (1, 25), (1, 28), (1, 29), (1, 31), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 55), (1, 56), (1, 57), (1, 59), (1, 60), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 69), (1, 70), (1, 72), (1, 73), (1, 75), (1, 77), (1, 78), (1, 81), (1, 82), (1, 83), (1, 85), (1, 86), (1, 88), (1, 89), (1, 90), (1, 91), (1, 92), (1, 93), (1, 94), (1, 96), (1, 97), (1, 99), (1, 100)] + +[a] Counting nodes and edges. reign_of_terror +[a] ~00% Nodes: 0 Edges: 0. reign_of_terror +[a] ~14% Nodes: 2888 Edges: 127844. reign_of_terror +[a] ~25% Nodes: 5015 Edges: 251804. reign_of_terror +[a] ~33% Nodes: 6671 Edges: 386146. reign_of_terror +[a] ~40% Nodes: 8030 Edges: 488339. reign_of_terror +[a] ~49% Nodes: 9250 Edges: 579184. reign_of_terror +[a] ~59% Nodes: 10415 Edges: 676169. reign_of_terror +[a] ~69% Nodes: 11512 Edges: 785298. reign_of_terror +[a] ~79% Nodes: 12540 Edges: 908788. reign_of_terror +[a] ~89% Nodes: 13498 Edges: 1014353. reign_of_terror +[a] ~99% Nodes: 14226 Edges: 1090757. reign_of_terror +[a] 100% Nodes: 14234 Edges: 1091420. reign_of_terror +[a] Building graph. reign_of_terror +[a] Collecting root hubs. reign_of_terror +[a] Building minimum spanning tree. reign_of_terror +[a] Disambiguating results. reign_of_terror +[a] Writing to file. reign_of_terror + +[A] Word sense induction for 'reign_of_terror': +[A] Nodes: 14234 Edges: 1091420 +[A] Root hubs: + 1. french: ['revolution', 'france', 'paris', 'revolutionary', 'many', 'louis'] + 2. minister: ['prime', 'british', 'troops', 'enemy', 'winston', 'coast'] + 3. world: ['war', 'first', 'time', 'people', 'history', 'end'] + 4. album: ['band', 'song', 'sleigh', 'release', 'bells', 'single'] + 5. police: ['people', 'political', 'government', 'man', 'south', 'officers'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (4, 23), (1, 24), (1, 25), (1, 26), (1, 27), (1, 28), (1, 29), (1, 30), (1, 31), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 40), (1, 41), (1, 42), (2, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (4, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (1, 62), (4, 63), (2, 64), (4, 65), (4, 66), (4, 67), (4, 68), (1, 69), (1, 70), (1, 71), (1, 72), (1, 73), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 92), (1, 93), (1, 94), (1, 95), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. fight_night +[a] ~00% Nodes: 0 Edges: 0. fight_night +[a] ~09% Nodes: 1402 Edges: 56834. fight_night +[a] ~19% Nodes: 2211 Edges: 85968. fight_night +[a] ~29% Nodes: 2870 Edges: 117177. fight_night +[a] ~39% Nodes: 3533 Edges: 155328. fight_night +[a] ~49% Nodes: 3773 Edges: 167979. fight_night +[a] ~59% Nodes: 4249 Edges: 198860. fight_night +[a] ~69% Nodes: 4685 Edges: 224188. fight_night +[a] ~79% Nodes: 5178 Edges: 262312. fight_night +[a] ~89% Nodes: 5405 Edges: 277433. fight_night +[a] ~99% Nodes: 5831 Edges: 309397. fight_night +[a] 100% Nodes: 5831 Edges: 309401. fight_night +[a] Building graph. fight_night +[a] Collecting root hubs. fight_night +[a] Building minimum spanning tree. fight_night +[a] Disambiguating results. fight_night +[a] Writing to file. fight_night + +[A] Word sense induction for 'fight_night': +[A] Nodes: 5831 Edges: 309401 +[A] Root hubs: + 1. fight: ['ufc', 'round', 'decision', 'first', 'unanimous', 'bout'] + 2. ea: ['sports', 'game', 'video', 'round', 'boxing', 'series'] + 3. open: ['impact', 'tna', 'match', 'wrestling', 'episode', 'championship'] + 4. room: ['locker', 'traditional', 'sponsor', 'money', 'bonuses', 'payout'] + 5. casino: ['championship', 'event', 'mixed', 'arts', 'ultimate', 'martial'] +[A] Mapping: [(2, 1), (1, 2), (2, 3), (1, 4), (1, 5), (1, 6), (1, 7), (2, 8), (1, 9), (1, 10), (2, 11), (2, 13), (1, 14), (5, 15), (2, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (2, 27), (1, 28), (1, 29), (1, 30), (2, 31), (2, 32), (1, 33), (2, 34), (2, 35), (1, 36), (1, 37), (1, 38), (2, 39), (1, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (2, 48), (1, 49), (5, 50), (1, 51), (1, 52), (1, 53), (1, 54), (2, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (2, 61), (1, 62), (1, 63), (2, 64), (2, 65), (2, 66), (1, 67), (1, 68), (3, 69), (1, 70), (1, 71), (2, 72), (2, 73), (1, 74), (2, 75), (1, 76), (2, 77), (1, 78), (1, 79), (1, 80), (2, 81), (1, 82), (2, 83), (1, 84), (3, 85), (1, 86), (1, 87), (5, 88), (1, 89), (1, 90), (1, 91), (1, 93), (2, 94), (1, 95), (2, 96), (2, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. heavy_rotation +[a] ~00% Nodes: 0 Edges: 0. heavy_rotation +[a] ~09% Nodes: 1699 Edges: 71688. heavy_rotation +[a] ~19% Nodes: 2999 Edges: 142745. heavy_rotation +[a] ~29% Nodes: 3686 Edges: 183427. heavy_rotation +[a] ~39% Nodes: 4462 Edges: 228593. heavy_rotation +[a] ~49% Nodes: 5103 Edges: 274589. heavy_rotation +[a] ~59% Nodes: 5774 Edges: 320925. heavy_rotation +[a] ~69% Nodes: 6268 Edges: 356058. heavy_rotation +[a] ~79% Nodes: 6934 Edges: 407110. heavy_rotation +[a] ~89% Nodes: 7672 Edges: 484862. heavy_rotation +[a] ~99% Nodes: 8169 Edges: 534988. heavy_rotation +[a] 100% Nodes: 8176 Edges: 535721. heavy_rotation +[a] Building graph. heavy_rotation +[a] Collecting root hubs. heavy_rotation +[a] Building minimum spanning tree. heavy_rotation +[a] Disambiguating results. heavy_rotation +[a] Writing to file. heavy_rotation + +[A] Word sense induction for 'heavy_rotation': +[A] Nodes: 8176 Edges: 535721 +[A] Root hubs: + 1. music: ['video', 'mtv', 'album', 'single', 'song', 'first'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (1, 28), (1, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 68), (1, 69), (1, 70), (1, 71), (1, 72), (1, 73), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 87), (1, 88), (1, 90), (1, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. american_beauty +[a] ~00% Nodes: 0 Edges: 0. american_beauty +[a] ~09% Nodes: 1170 Edges: 41569. american_beauty +[a] ~19% Nodes: 2315 Edges: 84341. american_beauty +[a] ~29% Nodes: 2866 Edges: 107772. american_beauty +[a] ~39% Nodes: 3357 Edges: 135527. american_beauty +[a] ~49% Nodes: 3747 Edges: 154781. american_beauty +[a] ~59% Nodes: 4325 Edges: 185434. american_beauty +[a] ~69% Nodes: 4736 Edges: 212309. american_beauty +[a] ~79% Nodes: 5212 Edges: 242813. american_beauty +[a] ~89% Nodes: 5572 Edges: 266988. american_beauty +[a] ~99% Nodes: 6519 Edges: 357876. american_beauty +[a] 100% Nodes: 6519 Edges: 357876. american_beauty +[a] Building graph. american_beauty +[a] Collecting root hubs. american_beauty +[a] Building minimum spanning tree. american_beauty +[a] Disambiguating results. american_beauty +[a] Writing to file. american_beauty + +[A] Word sense induction for 'american_beauty': +[A] Nodes: 6519 Edges: 357876 +[A] Root hubs: + 1. film: ['films', 'american', 'best', 'mendes', 'award', 'director'] + 2. miss: ['pageant', 'titleholder', 'usa', 'queen', 'title', 'america'] + 3. grateful: ['dead', 'album', 'albums', 'band', 'workingman', 'song'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 8), (2, 10), (1, 11), (1, 13), (1, 14), (1, 16), (1, 17), (2, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 24), (1, 27), (1, 28), (2, 30), (1, 31), (1, 32), (1, 33), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 40), (1, 41), (1, 44), (1, 45), (3, 46), (1, 47), (1, 48), (1, 49), (1, 52), (1, 53), (1, 54), (1, 55), (3, 56), (1, 57), (1, 58), (2, 59), (1, 60), (1, 61), (1, 62), (1, 63), (1, 66), (1, 67), (1, 68), (1, 69), (1, 71), (2, 72), (1, 75), (1, 76), (2, 77), (2, 78), (1, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 91), (1, 93), (3, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. bat_boy +[a] ~00% Nodes: 0 Edges: 0. bat_boy +[a] ~09% Nodes: 355 Edges: 7570. bat_boy +[a] ~19% Nodes: 837 Edges: 25301. bat_boy +[a] ~29% Nodes: 916 Edges: 27899. bat_boy +[a] ~39% Nodes: 984 Edges: 29560. bat_boy +[a] ~49% Nodes: 1072 Edges: 33404. bat_boy +[a] ~59% Nodes: 1221 Edges: 38675. bat_boy +[a] ~69% Nodes: 1414 Edges: 47235. bat_boy +[a] ~79% Nodes: 1561 Edges: 52483. bat_boy +[a] ~89% Nodes: 1760 Edges: 60710. bat_boy +[a] ~99% Nodes: 1915 Edges: 67859. bat_boy +[a] 100% Nodes: 1915 Edges: 67859. bat_boy +[a] Building graph. bat_boy +[a] Collecting root hubs. bat_boy +[a] Building minimum spanning tree. bat_boy +[a] Disambiguating results. bat_boy +[a] Writing to file. bat_boy + +[A] Word sense induction for 'bat_boy': +[A] Nodes: 1915 Edges: 67859 +[A] Root hubs: + 1. musical: ['broadway', 'theatre', 'world', 'show', 'york', 'end'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 6), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (1, 19), (1, 20), (1, 23), (1, 24), (1, 25), (1, 27), (1, 28), (1, 29), (1, 30), (1, 31), (1, 33), (1, 34), (1, 36), (1, 37), (1, 39), (1, 40), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 58), (1, 59), (1, 61), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 68), (1, 70), (1, 71), (1, 72), (1, 73), (1, 76), (1, 77), (1, 78), (1, 79), (1, 81), (1, 82), (1, 83), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 93), (1, 97), (1, 100)] + +[a] Counting nodes and edges. tree_of_knowledge +[a] ~00% Nodes: 0 Edges: 0. tree_of_knowledge +[a] ~09% Nodes: 899 Edges: 30244. tree_of_knowledge +[a] ~19% Nodes: 1387 Edges: 43956. tree_of_knowledge +[a] ~29% Nodes: 1864 Edges: 79415. tree_of_knowledge +[a] ~39% Nodes: 2188 Edges: 92237. tree_of_knowledge +[a] ~49% Nodes: 2870 Edges: 129817. tree_of_knowledge +[a] ~59% Nodes: 3153 Edges: 144289. tree_of_knowledge +[a] ~69% Nodes: 3546 Edges: 172457. tree_of_knowledge +[a] ~79% Nodes: 3858 Edges: 198201. tree_of_knowledge +[a] ~89% Nodes: 4199 Edges: 216315. tree_of_knowledge +[a] ~99% Nodes: 4413 Edges: 229030. tree_of_knowledge +[a] 100% Nodes: 4415 Edges: 229091. tree_of_knowledge +[a] Building graph. tree_of_knowledge +[a] Collecting root hubs. tree_of_knowledge +[a] Building minimum spanning tree. tree_of_knowledge +[a] Disambiguating results. tree_of_knowledge +[a] Writing to file. tree_of_knowledge + +[A] Word sense induction for 'tree_of_knowledge': +[A] Nodes: 4415 Edges: 229091 +[A] Root hubs: + 1. good: ['evil', 'tree', 'adam', 'god', 'fruit', 'life'] + 2. system: ['psychology', 'henriques', 'unification', 'theoretical', 'review', 'general'] +[A] Mapping: [(1, 1), (1, 4), (1, 6), (1, 7), (1, 8), (1, 10), (2, 11), (1, 12), (1, 13), (1, 15), (2, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (1, 28), (1, 29), (1, 32), (1, 33), (1, 35), (1, 36), (1, 38), (1, 39), (1, 40), (2, 42), (1, 43), (2, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 50), (2, 51), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 60), (1, 61), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 69), (2, 70), (1, 72), (1, 74), (1, 76), (1, 77), (1, 78), (1, 79), (1, 80), (2, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (1, 93), (1, 94), (1, 95), (1, 97), (1, 98)] + +[a] Counting nodes and edges. in_the_name_of_love +[a] ~00% Nodes: 0 Edges: 0. in_the_name_of_love +[a] ~09% Nodes: 641 Edges: 20430. in_the_name_of_love +[a] ~19% Nodes: 1354 Edges: 46834. in_the_name_of_love +[a] ~29% Nodes: 1796 Edges: 67634. in_the_name_of_love +[a] ~39% Nodes: 2257 Edges: 86615. in_the_name_of_love +[a] ~49% Nodes: 2704 Edges: 109343. in_the_name_of_love +[a] ~59% Nodes: 2890 Edges: 117275. in_the_name_of_love +[a] ~69% Nodes: 3130 Edges: 131285. in_the_name_of_love +[a] ~79% Nodes: 3438 Edges: 150742. in_the_name_of_love +[a] ~89% Nodes: 3665 Edges: 165133. in_the_name_of_love +[a] ~99% Nodes: 3820 Edges: 175525. in_the_name_of_love +[a] 100% Nodes: 3820 Edges: 175525. in_the_name_of_love +[a] Building graph. in_the_name_of_love +[a] Collecting root hubs. in_the_name_of_love +[a] Building minimum spanning tree. in_the_name_of_love +[a] Disambiguating results. in_the_name_of_love +[a] Writing to file. in_the_name_of_love + +[A] Word sense induction for 'in_the_name_of_love': +[A] Nodes: 3820 Edges: 175525 +[A] Root hubs: + 1. album: ['single', 'song', 'songs', 'band', 'records', 'first'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 5), (1, 6), (1, 7), (1, 8), (1, 10), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (1, 28), (1, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 68), (1, 69), (1, 70), (1, 71), (1, 72), (1, 73), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 81), (1, 82), (1, 83), (1, 84), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. agent_blue +[a] ~00% Nodes: 0 Edges: 0. agent_blue +[a] ~09% Nodes: 37 Edges: 480. agent_blue +[a] ~19% Nodes: 115 Edges: 2167. agent_blue +[a] ~29% Nodes: 158 Edges: 2947. agent_blue +[a] ~39% Nodes: 158 Edges: 2947. agent_blue +[a] ~49% Nodes: 213 Edges: 3913. agent_blue +[a] ~59% Nodes: 346 Edges: 8941. agent_blue +[a] ~69% Nodes: 397 Edges: 10641. agent_blue +[a] ~79% Nodes: 419 Edges: 11359. agent_blue +[a] ~89% Nodes: 526 Edges: 19196. agent_blue +[a] ~99% Nodes: 533 Edges: 19217. agent_blue +[a] 100% Nodes: 533 Edges: 19217. agent_blue +[a] Building graph. agent_blue +[a] Collecting root hubs. agent_blue +[a] Building minimum spanning tree. agent_blue +[a] Disambiguating results. agent_blue +[a] Writing to file. agent_blue + +[A] Word sense induction for 'agent_blue': +[A] Nodes: 533 Edges: 19217 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. lake_of_the_woods +[a] ~00% Nodes: 0 Edges: 0. lake_of_the_woods +[a] ~09% Nodes: 1102 Edges: 37111. lake_of_the_woods +[a] ~19% Nodes: 1381 Edges: 47580. lake_of_the_woods +[a] ~29% Nodes: 2059 Edges: 80159. lake_of_the_woods +[a] ~39% Nodes: 2349 Edges: 95851. lake_of_the_woods +[a] ~49% Nodes: 2519 Edges: 103257. lake_of_the_woods +[a] ~59% Nodes: 2759 Edges: 113490. lake_of_the_woods +[a] ~69% Nodes: 3071 Edges: 134004. lake_of_the_woods +[a] ~79% Nodes: 3279 Edges: 145871. lake_of_the_woods +[a] ~89% Nodes: 3549 Edges: 165861. lake_of_the_woods +[a] ~99% Nodes: 3636 Edges: 172741. lake_of_the_woods +[a] 100% Nodes: 3636 Edges: 172741. lake_of_the_woods +[a] Building graph. lake_of_the_woods +[a] Collecting root hubs. lake_of_the_woods +[a] Building minimum spanning tree. lake_of_the_woods +[a] Disambiguating results. lake_of_the_woods +[a] Writing to file. lake_of_the_woods + +[A] Word sense induction for 'lake_of_the_woods': +[A] Nodes: 3636 Edges: 172741 +[A] Root hubs: + 1. lake: ['river', 'minnesota', 'north', 'west', 'superior', 'bay'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (1, 27), (1, 28), (1, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 41), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 61), (1, 62), (1, 64), (1, 65), (1, 67), (1, 68), (1, 69), (1, 70), (1, 71), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 84), (1, 86), (1, 87), (1, 88), (1, 90), (1, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 99), (1, 100)] + +[a] Counting nodes and edges. james_bond +[a] ~00% Nodes: 0 Edges: 0. james_bond +[a] ~32% Nodes: 6439 Edges: 329248. james_bond +[a] ~52% Nodes: 10454 Edges: 656516. james_bond +[a] ~66% Nodes: 13245 Edges: 941687. james_bond +[a] ~77% Nodes: 15419 Edges: 1158026. james_bond +[a] ~88% Nodes: 17652 Edges: 1446682. james_bond +[a] ~97% Nodes: 19522 Edges: 1706896. james_bond +[a] Building graph. james_bond +[a] Collecting root hubs. james_bond +[a] Building minimum spanning tree. james_bond +[a] Disambiguating results. james_bond +[a] Writing to file. james_bond + +[A] Word sense induction for 'james_bond': +[A] Nodes: 20008 Edges: 1780638 +[A] Root hubs: + 1. film: ['bond', 'films', 'series', 'first', 'role', 'character'] + 2. naval: ['intelligence', 'ian', 'war', 'novels', 'world', 'bond'] + 3. ornithologist: ['name', 'bond', 'american', 'birds', 'author', 'west'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (1, 27), (1, 28), (3, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (3, 37), (1, 38), (1, 39), (1, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (2, 61), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 68), (1, 69), (1, 70), (1, 71), (1, 72), (1, 73), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 87), (3, 88), (1, 89), (1, 90), (1, 91), (1, 92), (1, 93), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. space_raiders +[a] ~00% Nodes: 0 Edges: 0. space_raiders +[a] ~09% Nodes: 8 Edges: 28. space_raiders +[a] ~19% Nodes: 109 Edges: 2578. space_raiders +[a] ~29% Nodes: 229 Edges: 6099. space_raiders +[a] ~39% Nodes: 282 Edges: 6656. space_raiders +[a] ~49% Nodes: 385 Edges: 10404. space_raiders +[a] ~59% Nodes: 516 Edges: 12986. space_raiders +[a] ~69% Nodes: 564 Edges: 14038. space_raiders +[a] ~79% Nodes: 603 Edges: 14503. space_raiders +[a] ~89% Nodes: 665 Edges: 15733. space_raiders +[a] ~99% Nodes: 665 Edges: 15733. space_raiders +[a] 100% Nodes: 665 Edges: 15733. space_raiders +[a] Building graph. space_raiders +[a] Collecting root hubs. space_raiders +[a] Building minimum spanning tree. space_raiders +[a] Disambiguating results. space_raiders +[a] Writing to file. space_raiders + +[A] Word sense induction for 'space_raiders': +[A] Nodes: 665 Edges: 15733 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. mark_forster +[a] ~00% Nodes: 0 Edges: 0. mark_forster +[a] ~09% Nodes: 0 Edges: 0. mark_forster +[a] ~19% Nodes: 79 Edges: 2320. mark_forster +[a] ~29% Nodes: 79 Edges: 2320. mark_forster +[a] ~39% Nodes: 79 Edges: 2320. mark_forster +[a] ~49% Nodes: 79 Edges: 2320. mark_forster +[a] ~59% Nodes: 241 Edges: 9477. mark_forster +[a] ~69% Nodes: 241 Edges: 9477. mark_forster +[a] ~79% Nodes: 252 Edges: 9543. mark_forster +[a] ~89% Nodes: 252 Edges: 9543. mark_forster +[a] ~99% Nodes: 270 Edges: 9714. mark_forster +[a] 100% Nodes: 270 Edges: 9714. mark_forster +[a] Building graph. mark_forster +[a] Collecting root hubs. mark_forster +[a] Building minimum spanning tree. mark_forster +[a] Disambiguating results. mark_forster +[a] Writing to file. mark_forster + +[A] Word sense induction for 'mark_forster': +[A] Nodes: 270 Edges: 9714 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. queen_of_the_night +[a] ~00% Nodes: 0 Edges: 0. queen_of_the_night +[a] ~09% Nodes: 747 Edges: 22341. queen_of_the_night +[a] ~19% Nodes: 1185 Edges: 39716. queen_of_the_night +[a] ~29% Nodes: 1879 Edges: 68816. queen_of_the_night +[a] ~39% Nodes: 2123 Edges: 77752. queen_of_the_night +[a] ~49% Nodes: 2474 Edges: 93871. queen_of_the_night +[a] ~59% Nodes: 2789 Edges: 108536. queen_of_the_night +[a] ~69% Nodes: 3134 Edges: 128052. queen_of_the_night +[a] ~79% Nodes: 3479 Edges: 148557. queen_of_the_night +[a] ~89% Nodes: 3864 Edges: 170553. queen_of_the_night +[a] ~99% Nodes: 4176 Edges: 189253. queen_of_the_night +[a] 100% Nodes: 4176 Edges: 189253. queen_of_the_night +[a] Building graph. queen_of_the_night +[a] Collecting root hubs. queen_of_the_night +[a] Building minimum spanning tree. queen_of_the_night +[a] Disambiguating results. queen_of_the_night +[a] Writing to file. queen_of_the_night + +[A] Word sense induction for 'queen_of_the_night': +[A] Nodes: 4176 Edges: 189253 +[A] Root hubs: + 1. opera: ['magic', 'flute', 'mozart', 'role', 'roles', 'debut'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 10), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 25), (1, 26), (1, 30), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 40), (1, 42), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 68), (1, 69), (1, 70), (1, 71), (1, 73), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 81), (1, 82), (1, 83), (1, 84), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 92), (1, 95), (1, 96), (1, 97), (1, 99), (1, 100)] + +[a] Counting nodes and edges. the_marquise_of_o +[a] ~00% Nodes: 0 Edges: 0. marquise_of_o +[a] ~09% Nodes: 34 Edges: 309. marquise_of_o +[a] ~19% Nodes: 34 Edges: 309. marquise_of_o +[a] ~29% Nodes: 35 Edges: 312. marquise_of_o +[a] ~39% Nodes: 78 Edges: 1387. marquise_of_o +[a] ~49% Nodes: 78 Edges: 1387. marquise_of_o +[a] ~59% Nodes: 79 Edges: 1392. marquise_of_o +[a] ~69% Nodes: 79 Edges: 1392. marquise_of_o +[a] ~79% Nodes: 103 Edges: 1668. marquise_of_o +[a] ~89% Nodes: 103 Edges: 1668. marquise_of_o +[a] ~99% Nodes: 103 Edges: 1668. marquise_of_o +[a] 100% Nodes: 103 Edges: 1668. marquise_of_o +[a] Building graph. the_marquise_of_o +[a] Collecting root hubs. the_marquise_of_o +[a] Building minimum spanning tree. the_marquise_of_o +[a] Disambiguating results. the_marquise_of_o +[a] Writing to file. the_marquise_of_o + +[A] Word sense induction for 'the_marquise_of_o': +[A] Nodes: 103 Edges: 1668 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. mount_huxley +[a] ~00% Nodes: 0 Edges: 0. mount_huxley +[a] ~09% Nodes: 20 Edges: 190. mount_huxley +[a] ~19% Nodes: 83 Edges: 1169. mount_huxley +[a] ~29% Nodes: 83 Edges: 1169. mount_huxley +[a] ~39% Nodes: 119 Edges: 1907. mount_huxley +[a] ~49% Nodes: 127 Edges: 2355. mount_huxley +[a] ~59% Nodes: 207 Edges: 5267. mount_huxley +[a] ~69% Nodes: 208 Edges: 5303. mount_huxley +[a] ~79% Nodes: 221 Edges: 5464. mount_huxley +[a] ~89% Nodes: 221 Edges: 5464. mount_huxley +[a] ~99% Nodes: 221 Edges: 5464. mount_huxley +[a] 100% Nodes: 221 Edges: 5464. mount_huxley +[a] Building graph. mount_huxley +[a] Collecting root hubs. mount_huxley +[a] Building minimum spanning tree. mount_huxley +[a] Disambiguating results. mount_huxley +[a] Writing to file. mount_huxley + +[A] Word sense induction for 'mount_huxley': +[A] Nodes: 221 Edges: 5464 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. ace_of_spades +[a] ~00% Nodes: 0 Edges: 0. ace_of_spades +[a] ~09% Nodes: 754 Edges: 18932. ace_of_spades +[a] ~19% Nodes: 1299 Edges: 36175. ace_of_spades +[a] ~29% Nodes: 1671 Edges: 46132. ace_of_spades +[a] ~39% Nodes: 2014 Edges: 62139. ace_of_spades +[a] ~49% Nodes: 2532 Edges: 79600. ace_of_spades +[a] ~59% Nodes: 2801 Edges: 87945. ace_of_spades +[a] Building graph. ace_of_spades +[a] Collecting root hubs. ace_of_spades +[a] Building minimum spanning tree. ace_of_spades +[a] Disambiguating results. ace_of_spades +[a] Writing to file. ace_of_spades + +[A] Word sense induction for 'ace_of_spades': +[A] Nodes: 5211 Edges: 3024883 +[A] Root hubs: + 1. band: ['motörhead', 'album', 'uk', 'cover', 'metal', 'single'] + 2. card: ['cards', 'deck', 'ace', 'playing', 'clubs', 'red'] +[A] Mapping: [(1, 1), (2, 2), (1, 3), (1, 5), (2, 7), (1, 8), (1, 13), (1, 14), (1, 16), (1, 18), (2, 19), (1, 20), (2, 21), (1, 25), (1, 26), (2, 33), (2, 34), (1, 35), (1, 36), (2, 38), (2, 39), (2, 44), (2, 45), (2, 47), (1, 48), (2, 49), (2, 50), (1, 51), (2, 54), (1, 55), (1, 56), (2, 57), (1, 58), (2, 59), (1, 62), (1, 64), (1, 66), (1, 67), (1, 68), (1, 69), (2, 70), (2, 71), (2, 74), (2, 75), (2, 76), (2, 78), (2, 79), (1, 80), (2, 81), (2, 85), (1, 87), (1, 88), (1, 90), (1, 92), (1, 94), (2, 96), (1, 97), (2, 98)] + +[a] Counting nodes and edges. the_blue_bird +[a] ~00% Nodes: 0 Edges: 0. blue_bird +[a] ~09% Nodes: 871 Edges: 18132. blue_bird +[a] ~19% Nodes: 1843 Edges: 52530. blue_bird +[a] ~29% Nodes: 2451 Edges: 77899. blue_bird +[a] ~39% Nodes: 2903 Edges: 93971. blue_bird +[a] ~49% Nodes: 3525 Edges: 122059. blue_bird +[a] ~59% Nodes: 4001 Edges: 142802. blue_bird +[a] ~69% Nodes: 4389 Edges: 160772. blue_bird +[a] ~79% Nodes: 5097 Edges: 206060. blue_bird +[a] ~89% Nodes: 5729 Edges: 252402. blue_bird +[a] ~99% Nodes: 6135 Edges: 278405. blue_bird +[a] 100% Nodes: 6135 Edges: 278405. blue_bird +[a] Building graph. the_blue_bird +[a] Collecting root hubs. the_blue_bird +[a] Building minimum spanning tree. the_blue_bird +[a] Disambiguating results. the_blue_bird +[a] Writing to file. the_blue_bird + +[A] Word sense induction for 'the_blue_bird': +[A] Nodes: 6135 Edges: 278405 +[A] Root hubs: + 1. school: ['bus', 'buses', 'american', 'chassis', 'company', 'body'] + 2. campbell: ['record', 'malcolm', 'speed', 'land', 'car', 'world'] + 3. maeterlinck: ['maurice', 'theatre', 'play', 'art', 'film', 'production'] + 4. detroit: ['jazz', 'band', 'july', 'house', 'press', 'club'] +[A] Mapping: [(1, 1), (3, 2), (3, 4), (1, 5), (1, 6), (4, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (3, 17), (4, 18), (1, 20), (1, 21), (1, 22), (1, 23), (3, 25), (1, 26), (1, 27), (1, 28), (1, 29), (1, 31), (1, 32), (1, 36), (1, 38), (1, 39), (3, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (3, 50), (1, 51), (1, 52), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (3, 68), (1, 69), (1, 70), (1, 71), (1, 72), (1, 73), (1, 74), (1, 75), (1, 76), (4, 77), (1, 78), (2, 79), (1, 80), (1, 82), (3, 83), (3, 84), (1, 85), (1, 86), (1, 87), (3, 89), (1, 90), (3, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. freedom_of_the_press +[a] ~00% Nodes: 0 Edges: 0. freedom_of_the_press +[a] ~14% Nodes: 2805 Edges: 122234. freedom_of_the_press +[a] ~22% Nodes: 4458 Edges: 226304. freedom_of_the_press +[a] ~29% Nodes: 5562 Edges: 323944. freedom_of_the_press +[a] ~39% Nodes: 6580 Edges: 418865. freedom_of_the_press +[a] ~49% Nodes: 7651 Edges: 510121. freedom_of_the_press +[a] ~59% Nodes: 8590 Edges: 601423. freedom_of_the_press +[a] ~69% Nodes: 9537 Edges: 694006. freedom_of_the_press +[a] ~79% Nodes: 10273 Edges: 766147. freedom_of_the_press +[a] ~89% Nodes: 11176 Edges: 867276. freedom_of_the_press +[a] ~99% Nodes: 11755 Edges: 926476. freedom_of_the_press +[a] 100% Nodes: 11763 Edges: 927068. freedom_of_the_press +[a] Building graph. freedom_of_the_press +[a] Collecting root hubs. freedom_of_the_press +[a] Building minimum spanning tree. freedom_of_the_press +[a] Disambiguating results. freedom_of_the_press +[a] Writing to file. freedom_of_the_press + +[A] Word sense induction for 'freedom_of_the_press': +[A] Nodes: 11763 Edges: 927068 +[A] Root hubs: + 1. freedom: ['press', 'speech', 'government', 'rights', 'media', 'law'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (1, 27), (1, 28), (1, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 68), (1, 69), (1, 70), (1, 71), (1, 72), (1, 73), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. double_negative +[a] ~00% Nodes: 0 Edges: 0. double_negative +[a] ~09% Nodes: 631 Edges: 16097. double_negative +[a] ~19% Nodes: 1069 Edges: 47530. double_negative +[a] ~29% Nodes: 1480 Edges: 58949. double_negative +[a] ~39% Nodes: 1714 Edges: 65101. double_negative +[a] ~49% Nodes: 1962 Edges: 73573. double_negative +[a] ~59% Nodes: 2577 Edges: 134499. double_negative +[a] ~69% Nodes: 2695 Edges: 138150. double_negative +[a] ~79% Nodes: 2835 Edges: 145000. double_negative +[a] ~89% Nodes: 3032 Edges: 152883. double_negative +[a] ~99% Nodes: 3225 Edges: 160403. double_negative +[a] 100% Nodes: 3225 Edges: 160403. double_negative +[a] Building graph. double_negative +[a] Collecting root hubs. double_negative +[a] Building minimum spanning tree. double_negative +[a] Disambiguating results. double_negative +[a] Writing to file. double_negative + +[A] Word sense induction for 'double_negative': +[A] Nodes: 3225 Edges: 160403 +[A] Root hubs: + 1. negative: ['english', 'double', 'material', 'positive', 'example', 'cell'] + 2. effects: ['visual', 'film', 'supervisor', 'digital', 'work', 'team'] +[A] Mapping: [(1, 1), (2, 2), (1, 3), (1, 4), (2, 14), (1, 15), (1, 25), (1, 29), (1, 31), (1, 34), (1, 35), (2, 39), (1, 41), (2, 43), (1, 45), (1, 46), (1, 47), (1, 48), (1, 50), (1, 51), (2, 54), (1, 55), (1, 57), (1, 58), (2, 60), (1, 62), (2, 66), (1, 67), (2, 68), (1, 69), (2, 70), (1, 72), (1, 74), (1, 78), (1, 81), (2, 83), (2, 84), (1, 85), (1, 88), (1, 89), (1, 95), (1, 96), (1, 97), (1, 99), (1, 100)] + +[a] Counting nodes and edges. hall_of_justice +[a] ~00% Nodes: 0 Edges: 0. hall_of_justice +[a] ~09% Nodes: 937 Edges: 28532. hall_of_justice +[a] ~19% Nodes: 1374 Edges: 47023. hall_of_justice +[a] ~29% Nodes: 1803 Edges: 63983. hall_of_justice +[a] ~39% Nodes: 2216 Edges: 80307. hall_of_justice +[a] ~49% Nodes: 2563 Edges: 100603. hall_of_justice +[a] ~59% Nodes: 2771 Edges: 111711. hall_of_justice +[a] ~69% Nodes: 3284 Edges: 146719. hall_of_justice +[a] ~79% Nodes: 3514 Edges: 158725. hall_of_justice +[a] ~89% Nodes: 3871 Edges: 178694. hall_of_justice +[a] ~99% Nodes: 4217 Edges: 198220. hall_of_justice +[a] 100% Nodes: 4217 Edges: 198220. hall_of_justice +[a] Building graph. hall_of_justice +[a] Collecting root hubs. hall_of_justice +[a] Building minimum spanning tree. hall_of_justice +[a] Disambiguating results. hall_of_justice +[a] Writing to file. hall_of_justice + +[A] Word sense induction for 'hall_of_justice': +[A] Nodes: 4217 Edges: 198220 +[A] Root hubs: + 1. city: ['grand', 'dredd', 'judge', 'hall', 'building', 'mega'] + 2. league: ['justice', 'america', 'vol', 'lantern', 'members', 'black'] +[A] Mapping: [(1, 1), (1, 2), (2, 3), (2, 5), (1, 6), (1, 7), (1, 8), (2, 10), (2, 12), (2, 13), (2, 15), (1, 16), (2, 17), (2, 18), (2, 20), (2, 22), (2, 23), (1, 24), (2, 25), (2, 26), (2, 27), (2, 28), (1, 29), (1, 30), (2, 31), (2, 32), (2, 33), (1, 34), (1, 35), (2, 36), (2, 38), (1, 39), (1, 40), (1, 42), (1, 43), (1, 44), (2, 45), (2, 46), (1, 47), (1, 48), (1, 49), (2, 50), (2, 51), (1, 52), (1, 53), (2, 54), (1, 55), (1, 56), (1, 57), (1, 58), (2, 59), (2, 60), (1, 61), (1, 62), (2, 63), (1, 64), (2, 66), (1, 67), (2, 68), (1, 69), (1, 70), (1, 71), (2, 72), (2, 73), (2, 74), (1, 75), (1, 76), (2, 77), (2, 78), (1, 79), (1, 80), (1, 81), (2, 82), (2, 84), (2, 85), (1, 86), (1, 87), (2, 88), (1, 89), (2, 90), (2, 91), (1, 92), (1, 93), (2, 94), (1, 95), (2, 96), (1, 97), (2, 98), (1, 99), (2, 100)] + +[a] Counting nodes and edges. charles_de_gaulle +[a] ~00% Nodes: 0 Edges: 0. charles_de_gaulle +[a] ~18% Nodes: 3679 Edges: 141799. charles_de_gaulle +[a] ~27% Nodes: 5516 Edges: 257853. charles_de_gaulle +[a] ~37% Nodes: 7409 Edges: 389611. charles_de_gaulle +[a] ~45% Nodes: 9044 Edges: 557545. charles_de_gaulle +[a] ~51% Nodes: 10286 Edges: 674718. charles_de_gaulle +[a] ~59% Nodes: 11692 Edges: 840134. charles_de_gaulle +[a] ~69% Nodes: 12729 Edges: 956236. charles_de_gaulle +[a] Building graph. charles_de_gaulle +[a] Collecting root hubs. charles_de_gaulle +[a] Building minimum spanning tree. charles_de_gaulle +[a] Disambiguating results. charles_de_gaulle +[a] Writing to file. charles_de_gaulle + +[A] Word sense induction for 'charles_de_gaulle': +[A] Nodes: 28573 Edges: 149698459 +[A] Root hubs: + 1. french: ['france', 'president', 'general', 'war', 'government', 'world'] + 2. frankfurt: ['paris', 'airport', 'london', 'heathrow', 'international', 'traffic'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (1, 27), (1, 28), (1, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 68), (1, 69), (1, 70), (1, 71), (1, 72), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (2, 100)] + +[a] Counting nodes and edges. special_edition +[a] ~00% Nodes: 0 Edges: 0. special_edition +[a] ~38% Nodes: 7704 Edges: 437422. special_edition +[a] ~57% Nodes: 11566 Edges: 731673. special_edition +[a] ~74% Nodes: 14944 Edges: 1029135. special_edition +[a] ~88% Nodes: 17630 Edges: 1308660. special_edition +[a] ~99% Nodes: 19999 Edges: 1531801. special_edition +[a] Building graph. special_edition +[a] Collecting root hubs. special_edition +[a] Building minimum spanning tree. special_edition +[a] Disambiguating results. special_edition +[a] Writing to file. special_edition + +[A] Word sense induction for 'special_edition': +[A] Nodes: 20002 Edges: 1531963 +[A] Root hubs: + 1. first: ['album', 'release', 'dvd', 'time', 'version', 'second'] + 2. leather: ['interior', 'model', 'seats', 'black', 'wheels', 'front'] + 3. scene: ['dvd', 'film', 'release', 'original', 'scenes', 'version'] +[A] Mapping: [(3, 1), (3, 2), (3, 3), (3, 4), (1, 5), (1, 6), (3, 7), (1, 8), (3, 9), (3, 10), (1, 11), (1, 12), (1, 13), (3, 14), (1, 15), (1, 16), (1, 17), (1, 18), (3, 19), (1, 20), (1, 21), (1, 22), (3, 23), (1, 24), (3, 25), (3, 26), (3, 27), (1, 28), (1, 29), (3, 30), (1, 31), (3, 32), (1, 33), (1, 34), (3, 35), (3, 36), (3, 37), (1, 38), (1, 39), (3, 40), (3, 41), (3, 42), (1, 43), (1, 44), (1, 45), (3, 46), (3, 47), (3, 48), (3, 49), (3, 50), (3, 51), (3, 52), (1, 53), (3, 54), (1, 55), (1, 56), (3, 57), (1, 58), (1, 59), (1, 60), (3, 61), (1, 62), (1, 63), (3, 64), (1, 65), (1, 66), (3, 67), (3, 68), (1, 69), (3, 70), (3, 71), (3, 72), (3, 73), (1, 74), (3, 75), (3, 76), (1, 77), (3, 78), (1, 79), (3, 80), (3, 81), (3, 82), (3, 83), (3, 84), (3, 85), (3, 86), (3, 87), (3, 88), (1, 89), (1, 90), (3, 91), (3, 92), (3, 93), (1, 94), (3, 95), (3, 96), (3, 97), (3, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. beer_for_my_horses +[a] ~00% Nodes: 0 Edges: 0. beer_for_my_horses +[a] ~09% Nodes: 152 Edges: 2974. beer_for_my_horses +[a] ~19% Nodes: 204 Edges: 4035. beer_for_my_horses +[a] ~29% Nodes: 222 Edges: 4443. beer_for_my_horses +[a] ~39% Nodes: 247 Edges: 5025. beer_for_my_horses +[a] ~49% Nodes: 303 Edges: 6900. beer_for_my_horses +[a] ~59% Nodes: 303 Edges: 6900. beer_for_my_horses +[a] ~69% Nodes: 430 Edges: 13477. beer_for_my_horses +[a] ~79% Nodes: 468 Edges: 14651. beer_for_my_horses +[a] ~89% Nodes: 501 Edges: 15816. beer_for_my_horses +[a] ~99% Nodes: 554 Edges: 17386. beer_for_my_horses +[a] 100% Nodes: 554 Edges: 17386. beer_for_my_horses +[a] Building graph. beer_for_my_horses +[a] Collecting root hubs. beer_for_my_horses +[a] Building minimum spanning tree. beer_for_my_horses +[a] Disambiguating results. beer_for_my_horses +[a] Writing to file. beer_for_my_horses + +[A] Word sense induction for 'beer_for_my_horses': +[A] Nodes: 554 Edges: 17386 +[A] Root hubs: + 1. song: ['keith', 'country', 'nelson', 'single', 'album', 'number'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 10), (1, 11), (1, 12), (1, 16), (1, 19), (1, 23), (1, 24), (1, 25), (1, 26), (1, 29), (1, 30), (1, 32), (1, 33), (1, 35), (1, 36), (1, 39), (1, 40), (1, 42), (1, 43), (1, 47), (1, 48), (1, 49), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 58), (1, 60), (1, 61), (1, 62), (1, 64), (1, 65), (1, 70), (1, 71), (1, 72), (1, 74), (1, 48), (1, 82), (1, 84), (1, 85), (1, 86), (1, 88), (1, 89), (1, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. heart_attack +[a] ~00% Nodes: 0 Edges: 0. heart_attack +[a] ~69% Nodes: 13913 Edges: 809222. heart_attack +[a] Building graph. heart_attack +[a] Collecting root hubs. heart_attack +[a] Building minimum spanning tree. heart_attack +[a] Disambiguating results. heart_attack +[a] Writing to file. heart_attack + +[A] Word sense induction for 'heart_attack': +[A] Nodes: 20029 Edges: 1381367 +[A] Root hubs: + 1. death: ['time', 'age', 'years', 'first', 'home', 'son'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (1, 27), (1, 28), (1, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 68), (1, 69), (1, 70), (1, 71), (1, 72), (1, 73), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. tai_chi +[a] ~00% Nodes: 0 Edges: 0. tai_chi +[a] ~09% Nodes: 1103 Edges: 36872. tai_chi +[a] ~19% Nodes: 1876 Edges: 66688. tai_chi +[a] ~29% Nodes: 2576 Edges: 110848. tai_chi +[a] ~39% Nodes: 3287 Edges: 152278. tai_chi +[a] ~49% Nodes: 3730 Edges: 195359. tai_chi +[a] ~59% Nodes: 4301 Edges: 233857. tai_chi +[a] ~69% Nodes: 4925 Edges: 266998. tai_chi +[a] ~79% Nodes: 5311 Edges: 293963. tai_chi +[a] ~89% Nodes: 5743 Edges: 331540. tai_chi +[a] ~99% Nodes: 6225 Edges: 370194. tai_chi +[a] 100% Nodes: 6227 Edges: 370226. tai_chi +[a] Building graph. tai_chi +[a] Collecting root hubs. tai_chi +[a] Building minimum spanning tree. tai_chi +[a] Disambiguating results. tai_chi +[a] Writing to file. tai_chi + +[A] Word sense induction for 'tai_chi': +[A] Nodes: 6227 Edges: 370226 +[A] Root hubs: + 1. martial: ['arts', 'chinese', 'style', 'kung', 'fu', 'chuan'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (1, 27), (1, 28), (1, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 46), (1, 47), (1, 48), (1, 49), (1, 51), (1, 52), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 68), (1, 69), (1, 70), (1, 71), (1, 72), (1, 73), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. rain_or_shine +[a] ~00% Nodes: 0 Edges: 0. rain_or_shine +[a] ~09% Nodes: 537 Edges: 15568. rain_or_shine +[a] ~19% Nodes: 1044 Edges: 31203. rain_or_shine +[a] ~29% Nodes: 1420 Edges: 48631. rain_or_shine +[a] ~39% Nodes: 1859 Edges: 72274. rain_or_shine +[a] ~49% Nodes: 2183 Edges: 88844. rain_or_shine +[a] ~59% Nodes: 2510 Edges: 105074. rain_or_shine +[a] ~69% Nodes: 2769 Edges: 120046. rain_or_shine +[a] ~79% Nodes: 3101 Edges: 137135. rain_or_shine +[a] ~89% Nodes: 3380 Edges: 150740. rain_or_shine +[a] ~99% Nodes: 3594 Edges: 163411. rain_or_shine +[a] 100% Nodes: 3594 Edges: 163411. rain_or_shine +[a] Building graph. rain_or_shine +[a] Collecting root hubs. rain_or_shine +[a] Building minimum spanning tree. rain_or_shine +[a] Disambiguating results. rain_or_shine +[a] Writing to file. rain_or_shine + +[A] Word sense induction for 'rain_or_shine': +[A] Nodes: 3594 Edges: 163411 +[A] Root hubs: + 1. team: ['elasto', 'painters', 'game', 'cup', 'philippine', 'first'] +[A] Mapping: [(1, 2), (1, 3), (1, 6), (1, 7), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 18), (1, 19), (1, 23), (1, 25), (1, 26), (1, 34), (1, 37), (1, 43), (1, 45), (1, 47), (1, 48), (1, 49), (1, 53), (1, 54), (1, 56), (1, 58), (1, 59), (1, 60), (1, 62), (1, 64), (1, 67), (1, 68), (1, 70), (1, 72), (1, 73), (1, 74), (1, 75), (1, 76), (1, 78), (1, 79), (1, 80), (1, 81), (1, 84), (1, 85), (1, 86), (1, 89), (1, 90), (1, 92), (1, 94), (1, 96), (1, 100)] + +[a] Counting nodes and edges. attack_of_the_mutant +[a] ~00% Nodes: 0 Edges: 0. attack_of_the_mutant +[a] ~09% Nodes: 44 Edges: 631. attack_of_the_mutant +[a] ~19% Nodes: 54 Edges: 706. attack_of_the_mutant +[a] ~29% Nodes: 148 Edges: 1698. attack_of_the_mutant +[a] ~39% Nodes: 333 Edges: 5831. attack_of_the_mutant +[a] ~49% Nodes: 367 Edges: 6262. attack_of_the_mutant +[a] ~59% Nodes: 385 Edges: 6544. attack_of_the_mutant +[a] ~69% Nodes: 385 Edges: 6544. attack_of_the_mutant +[a] ~79% Nodes: 562 Edges: 12603. attack_of_the_mutant +[a] ~89% Nodes: 584 Edges: 13337. attack_of_the_mutant +[a] ~99% Nodes: 592 Edges: 13392. attack_of_the_mutant +[a] 100% Nodes: 592 Edges: 13392. attack_of_the_mutant +[a] Building graph. attack_of_the_mutant +[a] Collecting root hubs. attack_of_the_mutant +[a] Building minimum spanning tree. attack_of_the_mutant +[a] Disambiguating results. attack_of_the_mutant +[a] Writing to file. attack_of_the_mutant + +[A] Word sense induction for 'attack_of_the_mutant': +[A] Nodes: 592 Edges: 13392 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. magic_lantern +[a] ~00% Nodes: 0 Edges: 0. magic_lantern +[a] ~09% Nodes: 1219 Edges: 35207. magic_lantern +[a] ~19% Nodes: 1627 Edges: 51517. magic_lantern +[a] ~29% Nodes: 2201 Edges: 77255. magic_lantern +[a] ~39% Nodes: 2620 Edges: 93227. magic_lantern +[a] ~49% Nodes: 3030 Edges: 117822. magic_lantern +[a] ~59% Nodes: 3355 Edges: 133291. magic_lantern +[a] ~69% Nodes: 3837 Edges: 157277. magic_lantern +[a] ~79% Nodes: 4299 Edges: 179256. magic_lantern +[a] ~89% Nodes: 4687 Edges: 214792. magic_lantern +[a] ~99% Nodes: 4850 Edges: 222537. magic_lantern +[a] 100% Nodes: 4855 Edges: 222688. magic_lantern +[a] Building graph. magic_lantern +[a] Collecting root hubs. magic_lantern +[a] Building minimum spanning tree. magic_lantern +[a] Disambiguating results. magic_lantern +[a] Writing to file. magic_lantern + +[A] Word sense induction for 'magic_lantern': +[A] Nodes: 4855 Edges: 222688 +[A] Root hubs: + 1. first: ['film', 'time', 'shows', 'camera', 'images', 'history'] + 2. fbi: ['computer', 'tools', 'order', 'messages', 'law', 'november'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 5), (1, 6), (1, 7), (2, 8), (1, 11), (1, 12), (1, 13), (1, 15), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 23), (1, 24), (1, 25), (1, 26), (2, 27), (1, 28), (1, 29), (2, 30), (1, 31), (1, 33), (1, 35), (2, 36), (1, 37), (2, 38), (1, 39), (1, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (2, 46), (1, 47), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 54), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (2, 62), (1, 63), (2, 64), (1, 65), (1, 66), (1, 67), (1, 68), (2, 69), (1, 70), (1, 71), (1, 72), (2, 73), (1, 75), (2, 77), (1, 78), (1, 79), (1, 81), (1, 84), (1, 85), (1, 86), (2, 87), (1, 88), (2, 89), (1, 90), (1, 92), (1, 93), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. civil_war +[a] ~00% Nodes: 0 Edges: 0. civil_war +[a] Building graph. civil_war +[a] Collecting root hubs. civil_war +[a] Building minimum spanning tree. civil_war +[a] Disambiguating results. civil_war +[a] Writing to file. civil_war + +[A] Word sense induction for 'civil_war': +[A] Nodes: 20035 Edges: 1727057 +[A] Root hubs: + 1. war: ['american', 'army', 'states', 'union', 'united', 'world'] + 2. beavers: ['oregon', 'state', 'ducks', 'first', 'game', 'win'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (2, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (1, 27), (1, 28), (1, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 68), (1, 69), (1, 70), (1, 71), (1, 72), (1, 73), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. before_the_storm +[a] ~00% Nodes: 0 Edges: 0. before_the_storm +[a] ~09% Nodes: 1396 Edges: 50198. before_the_storm +[a] ~19% Nodes: 2098 Edges: 78702. before_the_storm +[a] ~29% Nodes: 2757 Edges: 114419. before_the_storm +[a] ~39% Nodes: 3252 Edges: 140487. before_the_storm +[a] ~49% Nodes: 3782 Edges: 176072. before_the_storm +[a] ~59% Nodes: 4548 Edges: 227495. before_the_storm +[a] ~69% Nodes: 4906 Edges: 256358. before_the_storm +[a] ~79% Nodes: 5436 Edges: 298427. before_the_storm +[a] ~89% Nodes: 5787 Edges: 326798. before_the_storm +[a] ~99% Nodes: 6211 Edges: 366227. before_the_storm +[a] 100% Nodes: 6211 Edges: 366227. before_the_storm +[a] Building graph. before_the_storm +[a] Collecting root hubs. before_the_storm +[a] Building minimum spanning tree. before_the_storm +[a] Disambiguating results. before_the_storm +[a] Writing to file. before_the_storm + +[A] Word sense induction for 'before_the_storm': +[A] Nodes: 6211 Edges: 366227 +[A] Root hubs: + 1. storm: ['hurricane', 'tropical', 'people', 'damage', 'landfall', 'residents'] + 2. album: ['calm', 'first', 'single', 'band', 'songs', 'debut'] + 3. university: ['press', 'california', 'calm', 'history', 'tibet', 'goldstein'] +[A] Mapping: [(2, 1), (1, 2), (1, 3), (2, 4), (1, 5), (2, 6), (2, 7), (2, 8), (2, 10), (1, 12), (2, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 19), (1, 21), (1, 22), (2, 23), (2, 24), (1, 25), (2, 26), (2, 27), (1, 28), (1, 29), (1, 30), (1, 31), (1, 32), (1, 34), (2, 36), (1, 37), (1, 38), (1, 39), (1, 40), (2, 41), (1, 42), (2, 43), (2, 44), (2, 45), (1, 46), (1, 47), (2, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 54), (2, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (2, 62), (1, 63), (1, 64), (1, 65), (2, 66), (1, 67), (1, 68), (2, 69), (1, 70), (1, 72), (1, 73), (1, 74), (2, 75), (1, 76), (2, 77), (1, 80), (1, 81), (1, 82), (2, 83), (1, 84), (1, 85), (2, 86), (1, 87), (1, 88), (1, 89), (1, 90), (2, 91), (1, 92), (1, 93), (1, 94), (2, 95), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. sign_of_the_cross +[a] ~00% Nodes: 0 Edges: 0. sign_of_the_cross +[a] ~09% Nodes: 1444 Edges: 54611. sign_of_the_cross +[a] ~19% Nodes: 2831 Edges: 157872. sign_of_the_cross +[a] ~29% Nodes: 4080 Edges: 246160. sign_of_the_cross +[a] ~39% Nodes: 4568 Edges: 273558. sign_of_the_cross +[a] ~49% Nodes: 5245 Edges: 315291. sign_of_the_cross +[a] ~59% Nodes: 5844 Edges: 360243. sign_of_the_cross +[a] ~69% Nodes: 6494 Edges: 411930. sign_of_the_cross +[a] ~79% Nodes: 6922 Edges: 445719. sign_of_the_cross +[a] ~89% Nodes: 7265 Edges: 474604. sign_of_the_cross +[a] ~99% Nodes: 7712 Edges: 503048. sign_of_the_cross +[a] 100% Nodes: 7712 Edges: 503048. sign_of_the_cross +[a] Building graph. sign_of_the_cross +[a] Collecting root hubs. sign_of_the_cross +[a] Building minimum spanning tree. sign_of_the_cross +[a] Disambiguating results. sign_of_the_cross +[a] Writing to file. sign_of_the_cross + +[A] Word sense induction for 'sign_of_the_cross': +[A] Nodes: 7712 Edges: 503048 +[A] Root hubs: + 1. church: ['holy', 'use', 'catholic', 'cross', 'priest', 'many'] + 2. london: ['part', 'english', 'p.', 'wilson', 'england', 'time'] + 3. b.: ['cecil', 'demille', 'film', 'films', 'first', 'stage'] + 4. house: ['head', 'family', 'christmas', 'household', 'home', 'morning'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (1, 10), (1, 11), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (4, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (1, 27), (1, 28), (1, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 36), (1, 38), (1, 40), (2, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (4, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (1, 62), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 68), (4, 69), (2, 70), (2, 71), (1, 72), (1, 73), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 80), (3, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (2, 90), (1, 91), (4, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 100)] + +[a] Counting nodes and edges. volcanic_rock +[a] ~00% Nodes: 0 Edges: 0. volcanic_rock +[a] ~09% Nodes: 1563 Edges: 47768. volcanic_rock +[a] ~19% Nodes: 2647 Edges: 96079. volcanic_rock +[a] ~29% Nodes: 3627 Edges: 145401. volcanic_rock +[a] ~39% Nodes: 4405 Edges: 198722. volcanic_rock +[a] ~49% Nodes: 5067 Edges: 251755. volcanic_rock +[a] ~59% Nodes: 5575 Edges: 293582. volcanic_rock +[a] ~69% Nodes: 6066 Edges: 341442. volcanic_rock +[a] ~79% Nodes: 6715 Edges: 394680. volcanic_rock +[a] ~89% Nodes: 7248 Edges: 443816. volcanic_rock +[a] ~99% Nodes: 7654 Edges: 477312. volcanic_rock +[a] 100% Nodes: 7654 Edges: 477312. volcanic_rock +[a] Building graph. volcanic_rock +[a] Collecting root hubs. volcanic_rock +[a] Building minimum spanning tree. volcanic_rock +[a] Disambiguating results. volcanic_rock +[a] Writing to file. volcanic_rock + +[A] Word sense induction for 'volcanic_rock': +[A] Nodes: 7654 Edges: 477312 +[A] Root hubs: + 1. rock: ['volcanic', 'years', 'sedimentary', 'basalt', 'rocks', 'lava'] + 2. moist: ['dry', 'lava', 'eurasia', 'combination', 'slopes', 'hot'] + 3. clay: ['water', 'large', 'rocks', 'several', 'different', 'many'] +[A] Mapping: [(2, 1), (2, 2), (1, 3), (2, 4), (2, 5), (2, 6), (1, 7), (2, 8), (1, 9), (2, 10), (1, 11), (1, 12), (2, 13), (1, 14), (2, 15), (2, 16), (2, 17), (2, 18), (2, 19), (1, 20), (1, 21), (2, 22), (2, 23), (2, 24), (1, 25), (1, 26), (1, 27), (1, 28), (1, 29), (1, 30), (2, 31), (2, 32), (2, 33), (1, 34), (1, 35), (2, 36), (2, 37), (2, 38), (2, 39), (1, 40), (2, 41), (1, 42), (2, 43), (2, 44), (2, 45), (1, 46), (2, 47), (2, 48), (2, 49), (1, 50), (1, 51), (1, 53), (2, 54), (2, 55), (2, 56), (2, 57), (2, 58), (2, 59), (2, 60), (2, 61), (1, 62), (1, 63), (1, 64), (2, 65), (2, 66), (2, 67), (1, 68), (1, 69), (1, 70), (2, 71), (2, 72), (2, 73), (1, 74), (2, 75), (1, 76), (1, 77), (2, 79), (2, 80), (2, 81), (2, 82), (2, 83), (2, 84), (1, 85), (1, 86), (1, 87), (1, 88), (2, 89), (2, 90), (2, 91), (2, 92), (2, 93), (2, 94), (2, 95), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. sean_fallon +[a] ~00% Nodes: 0 Edges: 0. sean_fallon +[a] ~09% Nodes: 0 Edges: 0. sean_fallon +[a] ~19% Nodes: 89 Edges: 1205. sean_fallon +[a] ~29% Nodes: 127 Edges: 1797. sean_fallon +[a] ~39% Nodes: 155 Edges: 2175. sean_fallon +[a] ~49% Nodes: 155 Edges: 2175. sean_fallon +[a] ~59% Nodes: 216 Edges: 4140. sean_fallon +[a] ~69% Nodes: 307 Edges: 7208. sean_fallon +[a] ~79% Nodes: 337 Edges: 7643. sean_fallon +[a] ~89% Nodes: 395 Edges: 8999. sean_fallon +[a] ~99% Nodes: 395 Edges: 8999. sean_fallon +[a] 100% Nodes: 395 Edges: 8999. sean_fallon +[a] Building graph. sean_fallon +[a] Collecting root hubs. sean_fallon +[a] Building minimum spanning tree. sean_fallon +[a] Disambiguating results. sean_fallon +[a] Writing to file. sean_fallon + +[A] Word sense induction for 'sean_fallon': +[A] Nodes: 395 Edges: 8999 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. space_opera +[a] ~00% Nodes: 0 Edges: 0. space_opera +[a] ~09% Nodes: 1472 Edges: 56649. space_opera +[a] ~19% Nodes: 2950 Edges: 135920. space_opera +[a] ~29% Nodes: 3545 Edges: 165947. space_opera +[a] ~39% Nodes: 4354 Edges: 218882. space_opera +[a] ~49% Nodes: 5035 Edges: 267839. space_opera +[a] ~59% Nodes: 5751 Edges: 332678. space_opera +[a] ~69% Nodes: 6238 Edges: 375769. space_opera +[a] ~79% Nodes: 6784 Edges: 424377. space_opera +[a] ~89% Nodes: 7151 Edges: 454146. space_opera +[a] ~99% Nodes: 7581 Edges: 486984. space_opera +[a] 100% Nodes: 7606 Edges: 489859. space_opera +[a] Building graph. space_opera +[a] Collecting root hubs. space_opera +[a] Building minimum spanning tree. space_opera +[a] Disambiguating results. space_opera +[a] Writing to file. space_opera + +[A] Word sense induction for 'space_opera': +[A] Nodes: 7606 Edges: 489859 +[A] Root hubs: + 1. fiction: ['science', 'space', 'series', 'stories', 'novel', 'story'] + 2. george: ['star', 'film', 'lucas', 'wars', 'american', 'epic'] + 3. teachings: ['scientology', 'hubbard', 'church', 'xenu', 'many', 'group'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 6), (1, 7), (1, 8), (1, 9), (1, 11), (1, 12), (1, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 26), (1, 27), (1, 28), (1, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (1, 62), (1, 63), (1, 64), (1, 66), (1, 67), (1, 68), (1, 69), (1, 70), (1, 71), (1, 72), (1, 73), (1, 74), (1, 75), (1, 76), (1, 77), (1, 78), (1, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. dive_bomber +[a] ~00% Nodes: 0 Edges: 0. dive_bomber +[a] ~09% Nodes: 1552 Edges: 62429. dive_bomber +[a] ~19% Nodes: 2400 Edges: 107288. dive_bomber +[a] ~29% Nodes: 3012 Edges: 146129. dive_bomber +[a] ~39% Nodes: 3622 Edges: 189805. dive_bomber +[a] ~49% Nodes: 3967 Edges: 215794. dive_bomber +[a] ~59% Nodes: 4286 Edges: 234305. dive_bomber +[a] ~69% Nodes: 4650 Edges: 267247. dive_bomber +[a] ~79% Nodes: 5017 Edges: 301087. dive_bomber +[a] ~89% Nodes: 5352 Edges: 336496. dive_bomber +[a] ~99% Nodes: 5620 Edges: 357799. dive_bomber +[a] 100% Nodes: 5620 Edges: 357799. dive_bomber +[a] Building graph. dive_bomber +[a] Collecting root hubs. dive_bomber +[a] Building minimum spanning tree. dive_bomber +[a] Disambiguating results. dive_bomber +[a] Writing to file. dive_bomber + +[A] Word sense induction for 'dive_bomber': +[A] Nodes: 5620 Edges: 357799 +[A] Root hubs: + 1. aircraft: ['air', 'war', 'carrier', 'fighter', 'attack', 'japanese'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 5), (1, 6), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 12), (1, 15), (1, 16), (1, 17), (1, 18), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 25), (1, 26), (1, 27), (1, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 54), (1, 55), (1, 57), (1, 59), (1, 60), (1, 61), (1, 62), (1, 64), (1, 65), (1, 67), (1, 68), (1, 70), (1, 71), (1, 72), (1, 73), (1, 74), (1, 76), (1, 77), (1, 78), (1, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. stranger_in_town +[a] ~00% Nodes: 0 Edges: 0. stranger_in_town +[a] ~09% Nodes: 165 Edges: 3113. stranger_in_town +[a] ~19% Nodes: 454 Edges: 12714. stranger_in_town +[a] ~29% Nodes: 518 Edges: 13710. stranger_in_town +[a] ~39% Nodes: 605 Edges: 16439. stranger_in_town +[a] ~49% Nodes: 625 Edges: 16840. stranger_in_town +[a] ~59% Nodes: 752 Edges: 24719. stranger_in_town +[a] ~69% Nodes: 865 Edges: 28156. stranger_in_town +[a] ~79% Nodes: 961 Edges: 31122. stranger_in_town +[a] ~89% Nodes: 1114 Edges: 36420. stranger_in_town +[a] ~99% Nodes: 1191 Edges: 38531. stranger_in_town +[a] 100% Nodes: 1191 Edges: 38531. stranger_in_town +[a] Building graph. stranger_in_town +[a] Collecting root hubs. stranger_in_town +[a] Building minimum spanning tree. stranger_in_town +[a] Disambiguating results. stranger_in_town +[a] Writing to file. stranger_in_town + +[A] Word sense induction for 'stranger_in_town': +[A] Nodes: 1191 Edges: 38531 +[A] Root hubs: + 1. single: ['album', 'rock', 'song', 'band', 'music', 'david'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 6), (1, 9), (1, 10), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 38), (1, 41), (1, 42), (1, 44), (1, 47), (1, 50), (1, 51), (1, 52), (1, 56), (1, 57), (1, 58), (1, 61), (1, 67), (1, 71), (1, 72), (1, 73), (1, 84), (1, 88), (1, 89), (1, 94), (1, 100)] + +[a] Counting nodes and edges. lost_in_space +[a] ~00% Nodes: 0 Edges: 0. lost_in_space +[a] ~09% Nodes: 1571 Edges: 51725. lost_in_space +[a] ~19% Nodes: 2288 Edges: 84857. lost_in_space +[a] ~29% Nodes: 2764 Edges: 102484. lost_in_space +[a] ~39% Nodes: 3414 Edges: 142313. lost_in_space +[a] ~49% Nodes: 4036 Edges: 184725. lost_in_space +[a] ~59% Nodes: 4798 Edges: 234956. lost_in_space +[a] ~69% Nodes: 5163 Edges: 255521. lost_in_space +[a] ~79% Nodes: 5790 Edges: 299646. lost_in_space +[a] ~89% Nodes: 6164 Edges: 330254. lost_in_space +[a] ~99% Nodes: 6827 Edges: 384996. lost_in_space +[a] 100% Nodes: 6827 Edges: 384996. lost_in_space +[a] Building graph. lost_in_space +[a] Collecting root hubs. lost_in_space +[a] Building minimum spanning tree. lost_in_space +[a] Disambiguating results. lost_in_space +[a] Writing to file. lost_in_space + +[A] Word sense induction for 'lost_in_space': +[A] Nodes: 6827 Edges: 384996 +[A] Root hubs: + 1. series: ['television', 'tv', 'episode', 'show', 'film', 'cbs'] + 2. album: ['songs', 'track', 'first', 'second', 'version', 'tracks'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 14), (2, 15), (1, 16), (1, 17), (1, 18), (2, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 25), (1, 26), (1, 27), (1, 28), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 40), (1, 41), (1, 42), (1, 43), (1, 44), (1, 45), (2, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 59), (1, 60), (1, 62), (1, 63), (1, 65), (1, 66), (1, 67), (1, 68), (1, 69), (1, 70), (1, 71), (1, 72), (1, 73), (1, 75), (1, 76), (1, 77), (1, 78), (2, 79), (1, 80), (1, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 87), (1, 88), (1, 89), (1, 90), (1, 91), (2, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99)] + +[a] Counting nodes and edges. black_hole +[a] ~00% Nodes: 0 Edges: 0. black_hole +[a] Building graph. black_hole +[a] Collecting root hubs. black_hole +[a] Building minimum spanning tree. black_hole +[a] Disambiguating results. black_hole +[a] Writing to file. black_hole + +[A] Word sense induction for 'black_hole': +[A] Nodes: 13341 Edges: 43500540 +[A] Root hubs: + 1. time: ['space', 'years', 'horizon', 'event', 'black_holes', 'star'] + 2. stars: ['mass', 'star', 'galaxy', 'massive', 'years', 'supermassive'] +[A] Mapping: [(2, 1), (2, 2), (1, 3), (1, 4), (2, 5), (2, 6), (1, 7), (2, 8), (2, 9), (2, 10), (1, 11), (1, 12), (2, 13), (1, 14), (1, 15), (2, 16), (2, 17), (1, 18), (2, 19), (2, 20), (1, 21), (1, 22), (2, 23), (1, 24), (1, 25), (1, 27), (2, 29), (2, 30), (2, 31), (2, 32), (1, 33), (2, 34), (1, 35), (2, 36), (2, 37), (2, 38), (2, 39), (2, 40), (1, 41), (2, 42), (2, 43), (2, 44), (2, 45), (1, 46), (2, 47), (2, 48), (2, 49), (2, 50), (2, 51), (1, 52), (2, 53), (1, 54), (2, 55), (1, 56), (2, 57), (2, 58), (2, 59), (1, 60), (2, 61), (1, 62), (2, 63), (2, 64), (1, 65), (1, 66), (2, 67), (2, 68), (2, 69), (1, 70), (1, 71), (2, 72), (2, 74), (1, 75), (1, 76), (2, 77), (2, 78), (1, 79), (2, 80), (2, 81), (2, 83), (1, 85), (1, 86), (2, 87), (1, 88), (1, 89), (2, 90), (1, 91), (1, 93), (1, 94), (2, 96), (2, 97), (1, 98), (2, 99), (2, 100)] + +[a] Counting nodes and edges. freedom_of_the_seas +[a] ~00% Nodes: 0 Edges: 0. freedom_of_the_seas +[a] ~09% Nodes: 146 Edges: 2937. freedom_of_the_seas +[a] ~19% Nodes: 417 Edges: 9436. freedom_of_the_seas +[a] ~29% Nodes: 825 Edges: 26353. freedom_of_the_seas +[a] ~39% Nodes: 1105 Edges: 38647. freedom_of_the_seas +[a] ~49% Nodes: 1228 Edges: 44743. freedom_of_the_seas +[a] ~59% Nodes: 1361 Edges: 49719. freedom_of_the_seas +[a] ~69% Nodes: 1586 Edges: 58015. freedom_of_the_seas +[a] ~79% Nodes: 1719 Edges: 63399. freedom_of_the_seas +[a] ~89% Nodes: 1830 Edges: 68010. freedom_of_the_seas +[a] ~99% Nodes: 1931 Edges: 73822. freedom_of_the_seas +[a] 100% Nodes: 1931 Edges: 73822. freedom_of_the_seas +[a] Building graph. freedom_of_the_seas +[a] Collecting root hubs. freedom_of_the_seas +[a] Building minimum spanning tree. freedom_of_the_seas +[a] Disambiguating results. freedom_of_the_seas +[a] Writing to file. freedom_of_the_seas + +[A] Word sense induction for 'freedom_of_the_seas': +[A] Nodes: 1931 Edges: 73822 +[A] Root hubs: + 1. seas: ['ships', 'high', 'sea', 'law', 'international', 'ship'] + 2. war: ['international', 'law', 'nations', 'united', 'first', 'states'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 13), (1, 14), (1, 15), (1, 16), (1, 17), (1, 18), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 26), (1, 27), (1, 28), (1, 29), (1, 30), (1, 31), (1, 32), (1, 33), (1, 34), (1, 35), (1, 36), (1, 37), (1, 38), (1, 39), (1, 41), (1, 43), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (1, 51), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 59), (1, 60), (1, 61), (1, 62), (1, 63), (1, 64), (1, 65), (1, 67), (1, 68), (1, 69), (1, 70), (1, 71), (1, 72), (1, 73), (1, 74), (1, 76), (1, 78), (1, 80), (1, 81), (1, 82), (1, 83), (1, 84), (1, 85), (1, 86), (1, 88), (1, 89), (1, 90), (1, 91), (1, 92), (1, 93), (1, 95), (1, 96), (1, 97), (1, 98), (1, 100)] + +[a] Counting nodes and edges. stephen_king +[a] ~00% Nodes: 0 Edges: 0. stephen_king +[a] ~17% Nodes: 3483 Edges: 135291. stephen_king +[a] ~31% Nodes: 6306 Edges: 321195. stephen_king +[a] ~38% Nodes: 7789 Edges: 438823. stephen_king +[a] ~46% Nodes: 9306 Edges: 586309. stephen_king +[a] ~52% Nodes: 10403 Edges: 685526. stephen_king +[a] ~59% Nodes: 11567 Edges: 811041. stephen_king +[a] ~69% Nodes: 12481 Edges: 916378. stephen_king +[a] ~79% Nodes: 13380 Edges: 1012530. stephen_king +[a] ~89% Nodes: 14422 Edges: 1141814. stephen_king +[a] ~99% Nodes: 15307 Edges: 1260821. stephen_king +[a] 100% Nodes: 15307 Edges: 1260821. stephen_king +[a] Building graph. stephen_king +[a] Collecting root hubs. stephen_king +[a] Building minimum spanning tree. stephen_king +[a] Disambiguating results. stephen_king +[a] Writing to file. stephen_king + +[A] Word sense induction for 'stephen_king': +[A] Nodes: 15307 Edges: 1260821 +[A] Root hubs: + 1. film: ['horror', 'novel', 'story', 'movie', 'adaptation', 'king'] + 2. books: ['book', 'king', 'series', 'story', 'novel', 'author'] + 3. tan: ['rock', 'barry', 'groening', 'dave', 'matt', 'bottom'] +[A] Mapping: [(1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (2, 7), (1, 8), (1, 9), (1, 10), (2, 11), (1, 12), (1, 13), (1, 14), (2, 15), (1, 16), (2, 17), (1, 18), (1, 19), (2, 20), (1, 21), (2, 22), (1, 23), (1, 24), (1, 25), (2, 26), (1, 27), (1, 28), (2, 29), (2, 30), (1, 31), (2, 32), (1, 33), (2, 34), (1, 35), (2, 36), (1, 37), (1, 38), (1, 39), (1, 40), (2, 41), (1, 42), (1, 43), (1, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (2, 50), (1, 51), (2, 52), (1, 53), (2, 54), (1, 55), (2, 56), (1, 57), (1, 58), (1, 59), (2, 60), (1, 61), (2, 62), (2, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 68), (1, 69), (1, 70), (2, 71), (1, 72), (1, 73), (1, 74), (1, 75), (2, 76), (1, 77), (1, 78), (2, 79), (1, 80), (1, 81), (1, 82), (2, 83), (1, 84), (2, 85), (2, 86), (2, 87), (1, 88), (2, 89), (1, 90), (2, 91), (1, 92), (1, 93), (1, 94), (2, 95), (2, 96), (2, 97), (1, 98), (2, 99), (1, 100)] + +[a] Counting nodes and edges. hair_of_the_dog +[a] ~00% Nodes: 0 Edges: 0. hair_of_the_dog +[a] ~09% Nodes: 126 Edges: 2417. hair_of_the_dog +[a] ~19% Nodes: 248 Edges: 5733. hair_of_the_dog +[a] ~29% Nodes: 559 Edges: 12129. hair_of_the_dog +[a] ~39% Nodes: 683 Edges: 14853. hair_of_the_dog +[a] ~49% Nodes: 916 Edges: 24821. hair_of_the_dog +[a] ~59% Nodes: 1150 Edges: 34925. hair_of_the_dog +[a] ~69% Nodes: 1272 Edges: 38552. hair_of_the_dog +[a] ~79% Nodes: 1373 Edges: 41436. hair_of_the_dog +[a] ~89% Nodes: 1547 Edges: 46024. hair_of_the_dog +[a] ~99% Nodes: 1650 Edges: 50362. hair_of_the_dog +[a] 100% Nodes: 1650 Edges: 50362. hair_of_the_dog +[a] Building graph. hair_of_the_dog +[a] Collecting root hubs. hair_of_the_dog +[a] Building minimum spanning tree. hair_of_the_dog +[a] Disambiguating results. hair_of_the_dog +[a] Writing to file. hair_of_the_dog + +[A] Word sense induction for 'hair_of_the_dog': +[A] Nodes: 1650 Edges: 50362 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. soul_food +[a] ~00% Nodes: 0 Edges: 0. soul_food +[a] ~09% Nodes: 998 Edges: 30478. soul_food +[a] ~19% Nodes: 1603 Edges: 51582. soul_food +[a] ~29% Nodes: 2503 Edges: 98707. soul_food +[a] ~39% Nodes: 2901 Edges: 118578. soul_food +[a] ~49% Nodes: 3353 Edges: 145157. soul_food +[a] ~59% Nodes: 3714 Edges: 163200. soul_food +[a] ~69% Nodes: 4007 Edges: 179520. soul_food +[a] ~79% Nodes: 4601 Edges: 233645. soul_food +[a] ~89% Nodes: 4993 Edges: 266589. soul_food +[a] ~99% Nodes: 5173 Edges: 280474. soul_food +[a] 100% Nodes: 5173 Edges: 280474. soul_food +[a] Building graph. soul_food +[a] Collecting root hubs. soul_food +[a] Building minimum spanning tree. soul_food +[a] Disambiguating results. soul_food +[a] Writing to file. soul_food + +[A] Word sense induction for 'soul_food': +[A] Nodes: 5173 Edges: 280474 +[A] Root hubs: + 1. american: ['african', 'television', 'series', 'film', 'black', 'first'] + 2. album: ['music', 'song', 'taqueria', 'guerrero', 'single', 'records'] + 3. restaurant: ['food', 'street', 'chicken', 'first', 'soul', 'group'] +[A] Mapping: [(1, 1), (1, 2), (2, 3), (1, 4), (1, 5), (2, 6), (1, 7), (1, 8), (1, 9), (1, 10), (1, 11), (1, 12), (1, 13), (1, 14), (3, 15), (1, 17), (2, 18), (2, 19), (1, 20), (2, 21), (2, 22), (2, 23), (1, 24), (1, 25), (1, 26), (1, 27), (2, 28), (1, 30), (3, 31), (3, 32), (1, 33), (2, 34), (1, 35), (2, 36), (1, 37), (1, 38), (1, 39), (2, 40), (1, 41), (1, 42), (1, 43), (2, 44), (1, 45), (1, 46), (1, 47), (1, 48), (1, 49), (1, 50), (2, 51), (1, 52), (1, 53), (3, 54), (2, 55), (2, 56), (1, 58), (1, 60), (1, 61), (3, 62), (2, 63), (1, 64), (1, 65), (3, 66), (1, 67), (2, 68), (1, 69), (1, 70), (1, 71), (1, 72), (2, 73), (1, 74), (2, 75), (1, 76), (2, 77), (1, 78), (2, 79), (1, 80), (2, 81), (1, 82), (2, 83), (2, 84), (1, 85), (2, 86), (2, 87), (1, 88), (2, 90), (1, 91), (2, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (3, 99), (2, 100)] + +[a] Counting nodes and edges. the_art_of_seduction +[a] ~00% Nodes: 0 Edges: 0. art_of_seduction +[a] ~09% Nodes: 84 Edges: 1022. art_of_seduction +[a] ~19% Nodes: 229 Edges: 3544. art_of_seduction +[a] ~29% Nodes: 423 Edges: 8031. art_of_seduction +[a] ~39% Nodes: 500 Edges: 9578. art_of_seduction +[a] ~49% Nodes: 662 Edges: 17621. art_of_seduction +[a] ~59% Nodes: 844 Edges: 21487. art_of_seduction +[a] ~69% Nodes: 1008 Edges: 27037. art_of_seduction +[a] ~79% Nodes: 1210 Edges: 36058. art_of_seduction +[a] ~89% Nodes: 1271 Edges: 37614. art_of_seduction +[a] ~99% Nodes: 1314 Edges: 38827. art_of_seduction +[a] 100% Nodes: 1314 Edges: 38827. art_of_seduction +[a] Building graph. the_art_of_seduction +[a] Collecting root hubs. the_art_of_seduction +[a] Building minimum spanning tree. the_art_of_seduction +[a] Disambiguating results. the_art_of_seduction +[a] Writing to file. the_art_of_seduction + +[A] Word sense induction for 'the_art_of_seduction': +[A] Nodes: 1314 Edges: 38827 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + +[a] Counting nodes and edges. division_by_zero +[a] ~00% Nodes: 0 Edges: 0. division_by_zero +[a] ~09% Nodes: 249 Edges: 3393. division_by_zero +[a] ~19% Nodes: 388 Edges: 6110. division_by_zero +[a] ~29% Nodes: 523 Edges: 9449. division_by_zero +[a] ~39% Nodes: 558 Edges: 10012. division_by_zero +[a] ~49% Nodes: 669 Edges: 12460. division_by_zero +[a] ~59% Nodes: 906 Edges: 21912. division_by_zero +[a] ~69% Nodes: 1039 Edges: 25187. division_by_zero +[a] ~79% Nodes: 1089 Edges: 26389. division_by_zero +[a] ~89% Nodes: 1128 Edges: 26900. division_by_zero +[a] ~99% Nodes: 1249 Edges: 30875. division_by_zero +[a] 100% Nodes: 1249 Edges: 30875. division_by_zero +[a] Building graph. division_by_zero +[a] Collecting root hubs. division_by_zero +[a] Building minimum spanning tree. division_by_zero +[a] Disambiguating results. division_by_zero +[a] Writing to file. division_by_zero + +[A] Word sense induction for 'division_by_zero': +[A] Nodes: 1249 Edges: 30875 +[A] Root hubs: + 1. numbers: ['real', 'function', 'example', 'negative', 'division', 'undefined'] +[A] Mapping: [(1, 1), (1, 2), (1, 4), (1, 5), (1, 7), (1, 11), (1, 12), (1, 14), (1, 15), (1, 17), (1, 19), (1, 20), (1, 21), (1, 22), (1, 23), (1, 24), (1, 26), (1, 27), (1, 28), (1, 29), (1, 31), (1, 32), (1, 35), (1, 37), (1, 40), (1, 42), (1, 46), (1, 47), (1, 48), (1, 50), (1, 51), (1, 52), (1, 53), (1, 54), (1, 55), (1, 56), (1, 57), (1, 58), (1, 63), (1, 64), (1, 65), (1, 66), (1, 67), (1, 68), (1, 70), (1, 71), (1, 73), (1, 74), (1, 75), (1, 79), (1, 81), (1, 85), (1, 86), (1, 87), (1, 88), (1, 90), (1, 91), (1, 92), (1, 93), (1, 94), (1, 95), (1, 96), (1, 97), (1, 98), (1, 99), (1, 100)] + +[a] Counting nodes and edges. la_mancha +[a] ~00% Nodes: 0 Edges: 0. la_mancha +[a] ~13% Nodes: 2600 Edges: 86545. la_mancha +[a] ~20% Nodes: 4086 Edges: 151156. la_mancha +[a] ~29% Nodes: 5596 Edges: 239993. la_mancha +[a] ~39% Nodes: 6693 Edges: 323357. la_mancha +[a] ~49% Nodes: 7592 Edges: 382078. la_mancha +[a] ~59% Nodes: 8597 Edges: 464256. la_mancha +[a] ~69% Nodes: 9295 Edges: 514235. la_mancha +[a] ~79% Nodes: 10230 Edges: 580461. la_mancha +[a] ~89% Nodes: 11064 Edges: 647111. la_mancha +[a] ~99% Nodes: 12394 Edges: 806066. la_mancha +[a] 100% Nodes: 12400 Edges: 806294. la_mancha +[a] Building graph. la_mancha +[a] Collecting root hubs. la_mancha +[a] Building minimum spanning tree. la_mancha +[a] Disambiguating results. la_mancha +[a] Writing to file. la_mancha + +[A] Word sense induction for 'la_mancha': +[A] Nodes: 12400 Edges: 806294 +[A] Root hubs: + 1. castile: ['spain', 'municipality', 'population', 'province', 'inhabitants', 'ine'] + 2. man: ['musical', 'broadway', 'theatre', 'production', 'stage', 'quixote'] + 3. castilla: ['spain', 'spanish', 'toledo', 'region', 'autonomous', 'province'] +[A] Mapping: [(1, 1), (1, 2), (2, 3), (1, 4), (2, 6), (2, 7), (1, 8), (2, 9), (2, 10), (1, 11), (2, 12), (2, 13), (1, 14), (1, 15), (2, 16), (2, 17), (2, 20), (1, 21), (2, 22), (3, 23), (1, 24), (2, 26), (2, 27), (2, 28), (1, 29), (2, 30), (2, 31), (2, 32), (2, 33), (2, 34), (1, 35), (2, 36), (2, 37), (2, 38), (2, 39), (1, 40), (1, 41), (2, 42), (1, 43), (1, 44), (2, 45), (2, 46), (2, 47), (1, 48), (2, 49), (1, 50), (1, 51), (2, 52), (1, 53), (2, 54), (3, 55), (2, 56), (2, 57), (2, 58), (1, 59), (1, 60), (1, 61), (1, 62), (1, 63), (2, 64), (2, 65), (1, 66), (2, 67), (2, 68), (2, 69), (2, 70), (2, 71), (1, 72), (3, 73), (2, 74), (1, 75), (2, 76), (2, 77), (2, 78), (1, 79), (1, 80), (2, 81), (2, 82), (2, 83), (1, 84), (1, 85), (1, 87), (1, 88), (1, 89), (1, 90), (1, 91), (2, 92), (2, 93), (2, 94), (2, 95), (2, 96), (1, 97), (2, 98), (2, 99), (2, 100)] + +[a] Counting nodes and edges. down_in_the_valley +[a] ~00% Nodes: 0 Edges: 0. down_in_the_valley +[a] ~09% Nodes: 367 Edges: 11689. down_in_the_valley +[a] ~19% Nodes: 838 Edges: 21975. down_in_the_valley +[a] ~29% Nodes: 991 Edges: 26440. down_in_the_valley +[a] ~39% Nodes: 1238 Edges: 34743. down_in_the_valley +[a] ~49% Nodes: 1503 Edges: 42737. down_in_the_valley +[a] ~59% Nodes: 1699 Edges: 50024. down_in_the_valley +[a] ~69% Nodes: 1866 Edges: 59981. down_in_the_valley +[a] ~79% Nodes: 2056 Edges: 67606. down_in_the_valley +[a] ~89% Nodes: 2249 Edges: 73754. down_in_the_valley +[a] ~99% Nodes: 2480 Edges: 83689. down_in_the_valley +[a] 100% Nodes: 2480 Edges: 83689. down_in_the_valley +[a] Building graph. down_in_the_valley +[a] Collecting root hubs. down_in_the_valley +[a] Building minimum spanning tree. down_in_the_valley +[a] Disambiguating results. down_in_the_valley +[a] Writing to file. down_in_the_valley + +[A] Word sense induction for 'down_in_the_valley': +[A] Nodes: 2480 Edges: 83689 +[A] Root hubs: +[A] Mapping: [(1, 1, 0), (1, 2, 0), (1, 3, 0), (1, 4, 0), (1, 5, 0), (1, 6, 0), (1, 7, 0), (1, 8, 0), (1, 9, 0), (1, 10, 0), (1, 11, 0), (1, 12, 0), (1, 13, 0), (1, 14, 0), (1, 15, 0), (1, 16, 0), (1, 17, 0), (1, 18, 0), (1, 19, 0), (1, 20, 0), (1, 21, 0), (1, 22, 0), (1, 23, 0), (1, 24, 0), (1, 25, 0), (1, 26, 0), (1, 27, 0), (1, 28, 0), (1, 29, 0), (1, 30, 0), (1, 31, 0), (1, 32, 0), (1, 33, 0), (1, 34, 0), (1, 35, 0), (1, 36, 0), (1, 37, 0), (1, 38, 0), (1, 39, 0), (1, 40, 0), (1, 41, 0), (1, 42, 0), (1, 43, 0), (1, 44, 0), (1, 45, 0), (1, 46, 0), (1, 47, 0), (1, 48, 0), (1, 49, 0), (1, 50, 0), (1, 51, 0), (1, 52, 0), (1, 53, 0), (1, 54, 0), (1, 55, 0), (1, 56, 0), (1, 57, 0), (1, 58, 0), (1, 59, 0), (1, 60, 0), (1, 61, 0), (1, 62, 0), (1, 63, 0), (1, 64, 0), (1, 65, 0), (1, 66, 0), (1, 67, 0), (1, 68, 0), (1, 69, 0), (1, 70, 0), (1, 71, 0), (1, 72, 0), (1, 73, 0), (1, 74, 0), (1, 75, 0), (1, 76, 0), (1, 77, 0), (1, 78, 0), (1, 79, 0), (1, 80, 0), (1, 81, 0), (1, 82, 0), (1, 83, 0), (1, 84, 0), (1, 85, 0), (1, 86, 0), (1, 87, 0), (1, 88, 0), (1, 89, 0), (1, 90, 0), (1, 91, 0), (1, 92, 0), (1, 93, 0), (1, 94, 0), (1, 95, 0), (1, 96, 0), (1, 97, 0), (1, 98, 0), (1, 99, 0), (1, 100, 0)] + diff --git a/results/try3.log b/results/try3.log new file mode 100644 index 0000000..16e74ba --- /dev/null +++ b/results/try3.log @@ -0,0 +1,278 @@ +[ INFO ] Configuration - Loading /eval.properties FROM /home/students/zimmermann/Courses/ws17/fsem/absinth/WSI-Evaluator/config/eval.properties +[ INFO ] WSIEvaluator - Run started at 17:13 +[ INFO ] Dataset - Loading the datasets/trial +[ INFO ] Dataset - Loading the topics data datasets/trial +[ INFO ] Dataset - Loading the subtopics data +[ INFO ] Dataset - Loading the snippets data +[ INFO ] Dataset - Loading the relations data +[ INFO ] Dataset - Loading the relations data +[ INFO ] WSIEvaluator - +=================================================== +Starting the evaluation +=================================================== +[ INFO ] WSIEvaluator - +=================================================== +subtopic-recall@K default: 100 +=================================================== +[ WARN ] WSIEvaluator - +============= Query 1 : "soul food" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 5, 7, 9, 10, 11, 12, 13, 14, 17, 20, 24, 25, 26, 27, 30, 33, 35, 37, 38, 39, 41, 42, 43, 45, 46, 47, 48, 49, 50, 52, 53, 56, 58, 60, 61, 63, 64, 65, 67, 69, 70, 71, 72, 74, 75, 76, 78, 80, 82, 83, 85, 88, 90, 91, 93, 94, 95, 96, 97, 98] +The cluster 2 contains the snippets: [3, 6, 8, 18, 19, 21, 22, 23, 28, 34, 36, 40, 44, 51, 55, 68, 73, 77, 79, 81, 84, 86, 87, 92, 100] +The cluster 3 contains the snippets: [15, 31, 32, 54, 62, 66, 99] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 3, 15, 2, 6, 31, 4, 8, 32, 5, 18, 54, 7, 19, 62, 9, 21, 66, 10, 22, 99, 11, 23, 12, 28, 13, 34, 14, 36, 17, 40, 20, 44, 24, 51, 25, 55, 26, 68, 27, 73, 30, 77, 33, 79, 35, 81, 37, 84, 38, 86, 39, 87, 41, 92, 42, 100, 43, 45, 46, 47, 48, 49, 50, 52, 53, 56, 58, 60, 61, 63, 64, 65, 67, 69, 70, 71, 72, 74, 75, 76, 78, 80, 82, 83, 85, 88, 90, 91, 93, 94, 95, 96, 97, 98, 16, 29, 57, 59, 89] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "soul food" =============== +============ Value of Rand Index = 0.5935353535353536 ================================= +============ Partial average Rand Index = 0.5935353535353536 ====== +============ Value of Adjusted Rand Index = 0.2078401481738628 ================================= +============ Partial average of Adjusted Rand Index = 0.2078401481738628 ================================= +============ Value of Jaccard Index = 0.45355784899511137 ================================= +============ Partial average of Jaccard Index = 0.45355784899511137 ====== +============ Precision = 0.8, Recall = 0.8172043010752689, F1 = 0.8085106382978724 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 31.666666666666668 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 2 : "the block" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 4, 5, 6, 8, 9, 11, 13, 14, 15, 16, 19, 20, 22, 23, 24, 25, 26, 27, 28, 30, 31, 34, 35, 37, 38, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 58, 59, 60, 61, 63, 64, 65, 67, 68, 69, 70, 73, 74, 77, 80, 81, 84, 85, 86, 89, 90, 92, 94, 95, 96, 99] +The cluster 3 contains the snippets: [12, 21, 29, 32, 36, 43, 53, 55, 57, 62, 66, 72, 75, 76, 78, 79, 82, 83, 91, 93, 97, 100] +The cluster 2 contains the snippets: [7, 33, 39, 56, 71, 87, 88, 98] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 7, 12, 3, 33, 21, 4, 39, 29, 5, 56, 32, 6, 71, 36, 8, 87, 43, 9, 88, 53, 11, 98, 55, 13, 57, 14, 62, 15, 66, 16, 72, 19, 75, 20, 76, 22, 78, 23, 79, 24, 82, 25, 83, 26, 91, 27, 93, 28, 97, 30, 100, 31, 34, 35, 37, 38, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 58, 59, 60, 61, 63, 64, 65, 67, 68, 69, 70, 73, 74, 77, 80, 81, 84, 85, 86, 89, 90, 92, 94, 95, 96, 99, 1, 10, 17, 18] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the block" =============== +============ Value of Rand Index = 0.6096969696969697 ================================= +============ Partial average Rand Index = 0.6016161616161617 ====== +============ Value of Adjusted Rand Index = 0.22217541028673304 ================================= +============ Partial average of Adjusted Rand Index = 0.2150077792302979 ================================= +============ Value of Jaccard Index = 0.4598825831702544 ================================= +============ Partial average of Jaccard Index = 0.4567202160826829 ====== +============ Precision = 0.20833333333333334, Recall = 0.7407407407407407, F1 = 0.3252032520325203 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 32.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 3 : "stephen king" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 2 contains the snippets: [3, 4, 6, 7, 11, 12, 15, 16, 17, 20, 22, 24, 25, 26, 27, 29, 30, 32, 33, 34, 35, 36, 37, 38, 40, 41, 44, 46, 47, 48, 49, 50, 51, 54, 55, 56, 59, 60, 61, 62, 63, 64, 66, 68, 69, 70, 71, 72, 74, 76, 77, 79, 82, 83, 85, 86, 87, 89, 91, 93, 94, 95, 96, 97, 99] +The cluster 1 contains the snippets: [1, 2, 5, 8, 9, 10, 13, 14, 18, 19, 21, 23, 28, 31, 39, 42, 43, 45, 53, 57, 58, 65, 67, 73, 75, 78, 80, 81, 84, 88, 90, 92, 98, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 3, 2, 4, 5, 6, 8, 7, 9, 11, 10, 12, 13, 15, 14, 16, 18, 17, 19, 20, 21, 22, 23, 24, 28, 25, 31, 26, 39, 27, 42, 29, 43, 30, 45, 32, 53, 33, 57, 34, 58, 35, 65, 36, 67, 37, 73, 38, 75, 40, 78, 41, 80, 44, 81, 46, 84, 47, 88, 48, 90, 49, 92, 50, 98, 51, 100, 54, 55, 56, 59, 60, 61, 62, 63, 64, 66, 68, 69, 70, 71, 72, 74, 76, 77, 79, 82, 83, 85, 86, 87, 89, 91, 93, 94, 95, 96, 97, 99, 52] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "stephen king" =============== +============ Value of Rand Index = 0.5276767676767676 ================================= +============ Partial average Rand Index = 0.576969696969697 ====== +============ Value of Adjusted Rand Index = -0.00965607780138522 ================================= +============ Partial average of Adjusted Rand Index = 0.14011982688640354 ================================= +============ Value of Jaccard Index = 0.5243133265513733 ================================= +============ Partial average of Jaccard Index = 0.4792512529055797 ====== +============ Precision = 0.98989898989899, Recall = 0.98989898989899, F1 = 0.98989898989899 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 49.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 4 : "cool water" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 6, 7, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 28, 29, 30, 32, 33, 34, 36, 37, 38, 39, 41, 42, 43, 44, 45, 47, 48, 49, 52, 53, 54, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 70, 71, 72, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 86, 88, 90, 91, 92, 93, 94, 95, 96, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 4, 6, 7, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 28, 29, 30, 32, 33, 34, 36, 37, 38, 39, 41, 42, 43, 44, 45, 47, 48, 49, 52, 53, 54, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 70, 71, 72, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 86, 88, 90, 91, 92, 93, 94, 95, 96, 98, 99, 100, 3, 5, 8, 9, 10, 12, 25, 26, 27, 31, 35, 40, 46, 50, 51, 55, 56, 69, 73, 82, 87, 89, 97] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "cool water" =============== +============ Value of Rand Index = 0.6121212121212121 ================================= +============ Partial average Rand Index = 0.5857575757575757 ====== +============ Value of Adjusted Rand Index = 0.17574083154775647 ================================= +============ Partial average of Adjusted Rand Index = 0.14902507805174176 ================================= +============ Value of Jaccard Index = 0.5251051199604254 ================================= +============ Partial average of Jaccard Index = 0.49071471966929114 ====== +============ Precision = 0.15584415584415584, Recall = 0.48, F1 = 0.23529411764705882 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 77.0 ============ +=========================================================================== + +[ INFO ] WSIEvaluator - + +=========== Final average value of S-recall@K: ============= +1 0.3958 +2 0.5417 +3 0.6250 +4 0.6250 +5 0.6250 +6 0.6250 +7 0.6250 +8 0.6250 +9 0.6250 +10 0.7083 +11 0.8542 +12 0.8542 +13 0.8542 +14 0.8542 +15 0.8542 +16 0.9167 +17 0.9167 +18 0.9167 +19 0.9167 +20 0.9167 +21 0.9167 +22 0.9167 +23 0.9167 +24 0.9167 +25 0.9167 +26 0.9167 +27 0.9167 +28 0.9167 +29 0.9167 +30 0.9167 +31 0.9167 +32 0.9167 +33 0.9167 +34 0.9167 +35 0.9167 +36 0.9167 +37 0.9167 +38 0.9167 +39 0.9167 +40 0.9167 +41 0.9167 +42 0.9167 +43 0.9167 +44 0.9167 +45 0.9167 +46 0.9167 +47 0.9167 +48 0.9167 +49 0.9167 +50 0.9167 +51 0.9167 +52 0.9167 +53 0.9167 +54 0.9167 +55 0.9167 +56 0.9167 +57 0.9167 +58 0.9167 +59 0.9167 +60 0.9167 +61 0.9167 +62 0.9167 +63 0.9167 +64 0.9167 +65 0.9167 +66 0.9167 +67 0.9167 +68 0.9167 +69 0.9167 +70 0.9167 +71 0.9167 +72 0.9167 +73 0.9167 +74 0.9167 +75 0.9167 +76 0.9167 +77 0.9167 +78 0.9167 +79 0.9167 +80 1.0000 +81 1.0000 +82 1.0000 +83 1.0000 +84 1.0000 +85 1.0000 +86 1.0000 +87 1.0000 +88 1.0000 +89 1.0000 +90 1.0000 +91 1.0000 +92 1.0000 +93 1.0000 +94 1.0000 +95 1.0000 +96 1.0000 +97 1.0000 +98 1.0000 +99 1.0000 +100 1.0000 + +=========== Final average value of S-precision@r: ============= +0.4000 0.6222 +0.4500 0.4798 +0.5000 0.3708 +0.5500 0.2717 +0.6000 0.2375 +0.6500 0.2119 +0.7000 0.1455 +0.7500 0.1471 +0.8000 0.1374 +0.8500 0.1291 +0.9000 0.1218 +0.9500 0.1154 +1.0000 0.0267 + +=========== Final average value of F1: ===================== +average F1 = 0.6293233944294127 + +=========== Final average value of Rand Index: ============= +average Rand Index = 0.5857575757575757 + +=========== Final average value of Adjusted Rand Index: ==== +average Adj Rand Index = 0.14902507805174176 + +=========== Final average value of Jaccard Index: ========== +average Jaccard Index = 0.49071471966929114 + +================ Statistics: ==================================== +============ average number of created clusters: 2.25 +============ average cluster size: 47.54166666666667 + +[ WARN ] WSIEvaluator - Simulation started at: 17:13 and completed at 17:13 +Execution time: 1.773 sec diff --git a/results/try4.log b/results/try4.log new file mode 100644 index 0000000..fa5ef08 --- /dev/null +++ b/results/try4.log @@ -0,0 +1,3649 @@ +[ INFO ] Configuration - Loading /eval.properties FROM /home/students/zimmermann/Courses/ws17/fsem/absinth/WSI-Evaluator/config/eval.properties +[ INFO ] WSIEvaluator - Run started at 03:01 +[ INFO ] Dataset - Loading the datasets/MORESQUE/ +[ INFO ] Dataset - Loading the topics data datasets/MORESQUE/ +[ INFO ] Dataset - Loading the subtopics data +[ INFO ] Dataset - Loading the snippets data +[ INFO ] Dataset - Loading the relations data +[ INFO ] Dataset - Loading the relations data +[ INFO ] WSIEvaluator - +=================================================== +Starting the evaluation +=================================================== +[ INFO ] WSIEvaluator - +=================================================== +subtopic-recall@K default: 100 +=================================================== +[ WARN ] WSIEvaluator - +============= Query 1 : "the blue bird" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 5, 6, 10, 11, 12, 13, 14, 15, 16, 20, 21, 22, 23, 26, 27, 28, 29, 31, 32, 36, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 52, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 74, 75, 76, 78, 80, 82, 85, 86, 87, 90, 92, 93, 94, 95, 97, 98, 99, 100] +The cluster 3 contains the snippets: [2, 4, 17, 25, 40, 50, 68, 83, 84, 89, 91] +The cluster 4 contains the snippets: [9, 18, 77] +The cluster 2 contains the snippets: [79] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 79, 2, 9, 5, 4, 18, 6, 17, 77, 10, 25, 11, 40, 12, 50, 13, 68, 14, 83, 15, 84, 16, 89, 20, 91, 21, 22, 23, 26, 27, 28, 29, 31, 32, 36, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 52, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 74, 75, 76, 78, 80, 82, 85, 86, 87, 90, 92, 93, 94, 95, 97, 98, 99, 100, 3, 7, 8, 19, 24, 30, 33, 34, 35, 37, 53, 61, 81, 88, 96] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the blue bird" =============== +============ Value of Rand Index = 0.5834343434343434 ================================= +============ Partial average Rand Index = 0.5834343434343434 ====== +============ Value of Adjusted Rand Index = 0.17610698044642664 ================================= +============ Partial average of Adjusted Rand Index = 0.17610698044642664 ================================= +============ Value of Jaccard Index = 0.45130388504523683 ================================= +============ Partial average of Jaccard Index = 0.45130388504523683 ====== +============ Precision = 0.2235294117647059, Recall = 0.7037037037037037, F1 = 0.3392857142857143 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 21.25 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 2 : "crown of thorns" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 9, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 51, 52, 56, 57, 59, 61, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 77, 81, 82, 83, 84, 85, 86, 87, 89, 90, 92, 93, 94, 95, 96, 97, 99, 100] +The cluster 3 contains the snippets: [10, 24, 37, 49, 50, 54, 76, 78, 91, 98] +The cluster 2 contains the snippets: [88] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 88, 10, 2, 24, 3, 37, 4, 49, 5, 50, 6, 54, 9, 76, 11, 78, 12, 91, 13, 98, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 51, 52, 56, 57, 59, 61, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 77, 81, 82, 83, 84, 85, 86, 87, 89, 90, 92, 93, 94, 95, 96, 97, 99, 100, 7, 8, 15, 29, 48, 53, 55, 58, 60, 62, 75, 79, 80] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "crown of thorns" =============== +============ Value of Rand Index = 0.46 ================================= +============ Partial average Rand Index = 0.5217171717171717 ====== +============ Value of Adjusted Rand Index = 0.029582182042369273 ================================= +============ Partial average of Adjusted Rand Index = 0.10284458124439796 ================================= +============ Value of Jaccard Index = 0.20588235294117646 ================================= +============ Partial average of Jaccard Index = 0.32859311899320665 ====== +============ Precision = 0.20689655172413793, Recall = 0.3050847457627119, F1 = 0.2465753424657534 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 29.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 3 : "hall of justice" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 6, 7, 8, 16, 24, 29, 30, 34, 35, 39, 40, 42, 43, 44, 47, 48, 49, 52, 53, 55, 56, 57, 58, 61, 62, 64, 67, 69, 70, 71, 75, 76, 79, 80, 81, 86, 87, 89, 92, 93, 95, 97, 99] +The cluster 2 contains the snippets: [3, 5, 10, 12, 13, 15, 17, 18, 20, 22, 23, 25, 26, 27, 28, 31, 32, 33, 36, 38, 45, 46, 50, 51, 54, 59, 60, 63, 66, 68, 72, 73, 74, 77, 78, 82, 84, 85, 88, 90, 91, 94, 96, 98, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 3, 2, 5, 6, 10, 7, 12, 8, 13, 16, 15, 24, 17, 29, 18, 30, 20, 34, 22, 35, 23, 39, 25, 40, 26, 42, 27, 43, 28, 44, 31, 47, 32, 48, 33, 49, 36, 52, 38, 53, 45, 55, 46, 56, 50, 57, 51, 58, 54, 61, 59, 62, 60, 64, 63, 67, 66, 69, 68, 70, 72, 71, 73, 75, 74, 76, 77, 79, 78, 80, 82, 81, 84, 86, 85, 87, 88, 89, 90, 92, 91, 93, 94, 95, 96, 97, 98, 99, 100, 4, 9, 11, 14, 19, 21, 37, 41, 65, 83] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "hall of justice" =============== +============ Value of Rand Index = 0.5454545454545454 ================================= +============ Partial average Rand Index = 0.5296296296296296 ====== +============ Value of Adjusted Rand Index = 0.03794832035766849 ================================= +============ Partial average of Adjusted Rand Index = 0.08121249428215481 ================================= +============ Value of Jaccard Index = 0.25323597743113174 ================================= +============ Partial average of Jaccard Index = 0.30347407180584834 ====== +============ Precision = 0.4666666666666667, Recall = 0.6666666666666666, F1 = 0.5490196078431373 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 45.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 4 : "cool water" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 6, 7, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 28, 29, 30, 32, 33, 34, 36, 37, 38, 39, 41, 42, 43, 44, 45, 47, 48, 49, 52, 53, 54, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 70, 71, 72, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 86, 88, 90, 91, 92, 93, 94, 95, 96, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 4, 6, 7, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 28, 29, 30, 32, 33, 34, 36, 37, 38, 39, 41, 42, 43, 44, 45, 47, 48, 49, 52, 53, 54, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 70, 71, 72, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 86, 88, 90, 91, 92, 93, 94, 95, 96, 98, 99, 100, 3, 5, 8, 9, 10, 12, 25, 26, 27, 31, 35, 40, 46, 50, 51, 55, 56, 69, 73, 82, 87, 89, 97] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "cool water" =============== +============ Value of Rand Index = 0.6026262626262626 ================================= +============ Partial average Rand Index = 0.5478787878787879 ====== +============ Value of Adjusted Rand Index = 0.14985391490759462 ================================= +============ Partial average of Adjusted Rand Index = 0.09837284943851476 ================================= +============ Value of Jaccard Index = 0.5195407914020518 ================================= +============ Partial average of Jaccard Index = 0.3574907517048992 ====== +============ Precision = 0.15584415584415584, Recall = 0.5, F1 = 0.2376237623762376 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 77.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 5 : "the art of seduction" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the art of seduction" =============== +============ Value of Rand Index = 0.5254545454545455 ================================= +============ Partial average Rand Index = 0.5433939393939393 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.07869827955081181 ================================= +============ Value of Jaccard Index = 0.5254545454545455 ================================= +============ Partial average of Jaccard Index = 0.3910835104548284 ====== +============ Precision = 0.21, Recall = 0.6774193548387096, F1 = 0.32061068702290074 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 6 : "radioactive man" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 8, 9, 10, 14, 15, 18, 20, 22, 23, 27, 37, 40, 41, 42, 43, 44, 45, 47, 48, 55, 56, 57, 60, 61, 62, 65, 66, 68, 69, 70, 71, 74, 78, 79, 83, 84, 87, 91, 92, 93, 96, 98] +The cluster 2 contains the snippets: [5, 7, 24, 29, 31, 35, 50, 53, 63, 64, 73, 75, 76, 82, 90] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 5, 2, 7, 8, 24, 9, 29, 10, 31, 14, 35, 15, 50, 18, 53, 20, 63, 22, 64, 23, 73, 27, 75, 37, 76, 40, 82, 41, 90, 42, 43, 44, 45, 47, 48, 55, 56, 57, 60, 61, 62, 65, 66, 68, 69, 70, 71, 74, 78, 79, 83, 84, 87, 91, 92, 93, 96, 98, 3, 4, 6, 11, 12, 13, 16, 17, 19, 21, 25, 26, 28, 30, 32, 33, 34, 36, 38, 39, 46, 49, 51, 52, 54, 58, 59, 67, 72, 77, 80, 81, 85, 86, 88, 89, 94, 95, 97, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "radioactive man" =============== +============ Value of Rand Index = 0.6791919191919192 ================================= +============ Partial average Rand Index = 0.566026936026936 ====== +============ Value of Adjusted Rand Index = 0.21390386084051713 ================================= +============ Partial average of Adjusted Rand Index = 0.10123254309909602 ================================= +============ Value of Jaccard Index = 0.33639782699540327 ================================= +============ Partial average of Jaccard Index = 0.3819692298782576 ====== +============ Precision = 0.576271186440678, Recall = 0.3469387755102041, F1 = 0.43312101910828027 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 29.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 7 : "radius of curvature" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 1, 38, 76, 87] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "radius of curvature" =============== +============ Value of Rand Index = 0.2816161616161616 ================================= +============ Partial average Rand Index = 0.5253968253968254 ====== +============ Value of Adjusted Rand Index = 5.307390085871351E-4 ================================= +============ Partial average of Adjusted Rand Index = 0.08684657108616618 ================================= +============ Value of Jaccard Index = 0.23493975903614459 ================================= +============ Partial average of Jaccard Index = 0.36096501975795575 ====== +============ Precision = 0.375, Recall = 0.35294117647058826, F1 = 0.3636363636363636 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 96.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 8 : "twilight of the gods" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "twilight of the gods" =============== +============ Value of Rand Index = 0.24343434343434345 ================================= +============ Partial average Rand Index = 0.4901515151515151 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.0759907497003954 ================================= +============ Value of Jaccard Index = 0.24343434343434345 ================================= +============ Partial average of Jaccard Index = 0.3462736852175042 ====== +============ Precision = 0.18, Recall = 0.32142857142857145, F1 = 0.23076923076923075 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 9 : "sign of the cross" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 38, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 83, 84, 85, 86, 87, 88, 89, 91, 93, 94, 95, 96, 97, 100] +The cluster 2 contains the snippets: [41, 70, 71, 90] +The cluster 4 contains the snippets: [19, 53, 69, 92] +The cluster 3 contains the snippets: [81] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 41, 81, 19, 2, 70, 53, 3, 71, 69, 4, 90, 92, 5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 38, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 83, 84, 85, 86, 87, 88, 89, 91, 93, 94, 95, 96, 97, 100, 9, 35, 37, 39, 98, 99] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "sign of the cross" =============== +============ Value of Rand Index = 0.4953535353535354 ================================= +============ Partial average Rand Index = 0.49072951739618403 ====== +============ Value of Adjusted Rand Index = 0.04658327119336076 ================================= +============ Partial average of Adjusted Rand Index = 0.07272325208850267 ================================= +============ Value of Jaccard Index = 0.39206619615478217 ================================= +============ Partial average of Jaccard Index = 0.3513617419883129 ====== +============ Precision = 0.4787234042553192, Recall = 0.8333333333333334, F1 = 0.6081081081081082 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 23.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 10 : "in the name of love" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 5, 6, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 81, 82, 83, 84, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 5, 6, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 81, 82, 83, 84, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 4, 9, 11, 27, 39, 52, 80, 85] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "in the name of love" =============== +============ Value of Rand Index = 0.5468686868686868 ================================= +============ Partial average Rand Index = 0.49634343434343436 ====== +============ Value of Adjusted Rand Index = -0.09833489665738805 ================================= +============ Partial average of Adjusted Rand Index = 0.0556174372139136 ================================= +============ Value of Jaccard Index = 0.5301633850020947 ================================= +============ Partial average of Jaccard Index = 0.369241906289691 ====== +============ Precision = 0.14130434782608695, Recall = 0.5909090909090909, F1 = 0.2280701754385965 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 92.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 11 : "stephen king" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 8, 9, 10, 12, 13, 14, 16, 18, 19, 21, 23, 24, 25, 27, 28, 31, 33, 35, 37, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 51, 53, 55, 57, 58, 59, 61, 64, 65, 66, 67, 68, 69, 70, 72, 73, 74, 75, 77, 78, 80, 81, 82, 84, 88, 90, 92, 93, 94, 98, 100] +The cluster 2 contains the snippets: [7, 11, 15, 17, 20, 22, 26, 29, 30, 32, 34, 36, 41, 50, 52, 54, 56, 60, 62, 63, 71, 76, 79, 83, 85, 86, 87, 89, 91, 95, 96, 97, 99] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 7, 2, 11, 3, 15, 4, 17, 5, 20, 6, 22, 8, 26, 9, 29, 10, 30, 12, 32, 13, 34, 14, 36, 16, 41, 18, 50, 19, 52, 21, 54, 23, 56, 24, 60, 25, 62, 27, 63, 28, 71, 31, 76, 33, 79, 35, 83, 37, 85, 38, 86, 39, 87, 40, 89, 42, 91, 43, 95, 44, 96, 45, 97, 46, 99, 47, 48, 49, 51, 53, 55, 57, 58, 59, 61, 64, 65, 66, 67, 68, 69, 70, 72, 73, 74, 75, 77, 78, 80, 81, 82, 84, 88, 90, 92, 93, 94, 98, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "stephen king" =============== +============ Value of Rand Index = 0.5404040404040404 ================================= +============ Partial average Rand Index = 0.5003489439853076 ====== +============ Value of Adjusted Rand Index = -0.010231087585925133 ================================= +============ Partial average of Adjusted Rand Index = 0.04963120768665554 ================================= +============ Value of Jaccard Index = 0.5250521920668059 ================================= +============ Partial average of Jaccard Index = 0.3834064777239741 ====== +============ Precision = 0.96, Recall = 1.0, F1 = 0.9795918367346939 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 50.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 12 : "private practice" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 5, 6, 8, 10, 13, 16, 17, 19, 21, 22, 24, 25, 27, 28, 29, 30, 31, 39, 41, 46, 48, 50, 51, 53, 54, 55, 56, 57, 58, 60, 61, 65, 66, 68, 69, 70, 71, 72, 75, 76, 78, 80, 81, 82, 83, 86, 87, 88, 89, 91, 93, 94, 95, 97, 99, 100] +The cluster 3 contains the snippets: [4, 7, 9, 12, 14, 18, 20, 23, 26, 33, 34, 35, 36, 38, 40, 42, 43, 44, 45, 47, 49, 52, 62, 63, 64, 67, 73, 74, 77, 79, 84, 85, 90, 92, 96, 98] +The cluster 4 contains the snippets: [11, 32, 37] +The cluster 2 contains the snippets: [59] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 59, 4, 11, 2, 7, 32, 3, 9, 37, 5, 12, 6, 14, 8, 18, 10, 20, 13, 23, 16, 26, 17, 33, 19, 34, 21, 35, 22, 36, 24, 38, 25, 40, 27, 42, 28, 43, 29, 44, 30, 45, 31, 47, 39, 49, 41, 52, 46, 62, 48, 63, 50, 64, 51, 67, 53, 73, 54, 74, 55, 77, 56, 79, 57, 84, 58, 85, 60, 90, 61, 92, 65, 96, 66, 98, 68, 69, 70, 71, 72, 75, 76, 78, 80, 81, 82, 83, 86, 87, 88, 89, 91, 93, 94, 95, 97, 99, 100, 15] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "private practice" =============== +============ Value of Rand Index = 0.5282828282828282 ================================= +============ Partial average Rand Index = 0.5026767676767677 ====== +============ Value of Adjusted Rand Index = 0.05226888873838056 ================================= +============ Partial average of Adjusted Rand Index = 0.04985101444096596 ================================= +============ Value of Jaccard Index = 0.3272832036876981 ================================= +============ Partial average of Jaccard Index = 0.3787295382209512 ====== +============ Precision = 0.47474747474747475, Recall = 0.94, F1 = 0.6308724832214765 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 24.75 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 13 : "micro chip" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "micro chip" =============== +============ Value of Rand Index = 0.3202020202020202 ================================= +============ Partial average Rand Index = 0.4886402486402487 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.04601632102243011 ================================= +============ Value of Jaccard Index = 0.3202020202020202 ================================= +============ Partial average of Jaccard Index = 0.3742274214502641 ====== +============ Precision = 0.44, Recall = 0.4536082474226804, F1 = 0.4467005076142132 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 14 : "the glass bead game" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the glass bead game" =============== +============ Value of Rand Index = 0.44303030303030305 ================================= +============ Partial average Rand Index = 0.4853823953823954 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.04272944094939939 ================================= +============ Value of Jaccard Index = 0.44303030303030305 ================================= +============ Partial average of Jaccard Index = 0.3791419129916955 ====== +============ Precision = 0.43, Recall = 0.8775510204081632, F1 = 0.5771812080536912 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 15 : "la mancha" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 2 contains the snippets: [3, 6, 7, 9, 10, 12, 13, 16, 17, 20, 22, 26, 27, 28, 30, 31, 32, 33, 34, 36, 37, 38, 39, 42, 45, 46, 47, 49, 52, 54, 56, 57, 58, 64, 65, 67, 68, 69, 70, 71, 74, 76, 77, 78, 81, 82, 83, 92, 93, 94, 95, 96, 98, 99, 100] +The cluster 1 contains the snippets: [1, 2, 4, 8, 11, 14, 15, 21, 24, 29, 35, 40, 41, 43, 44, 48, 50, 51, 53, 59, 60, 61, 62, 63, 66, 72, 75, 79, 80, 84, 85, 87, 88, 89, 90, 91, 97] +The cluster 3 contains the snippets: [23, 55, 73] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 3, 23, 2, 6, 55, 4, 7, 73, 8, 9, 11, 10, 14, 12, 15, 13, 21, 16, 24, 17, 29, 20, 35, 22, 40, 26, 41, 27, 43, 28, 44, 30, 48, 31, 50, 32, 51, 33, 53, 34, 59, 36, 60, 37, 61, 38, 62, 39, 63, 42, 66, 45, 72, 46, 75, 47, 79, 49, 80, 52, 84, 54, 85, 56, 87, 57, 88, 58, 89, 64, 90, 65, 91, 67, 97, 68, 69, 70, 71, 74, 76, 77, 78, 81, 82, 83, 92, 93, 94, 95, 96, 98, 99, 100, 5, 18, 19, 25, 86] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "la mancha" =============== +============ Value of Rand Index = 0.6963636363636364 ================================= +============ Partial average Rand Index = 0.4994478114478115 ====== +============ Value of Adjusted Rand Index = 0.3769685884496757 ================================= +============ Partial average of Adjusted Rand Index = 0.06501205078275114 ================================= +============ Value of Jaccard Index = 0.525418377012946 ================================= +============ Partial average of Jaccard Index = 0.3888936772597789 ====== +============ Precision = 0.3157894736842105, Recall = 0.7692307692307693, F1 = 0.4477611940298507 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 31.666666666666668 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 16 : "richard tracey" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "richard tracey" =============== +============ Value of Rand Index = 0.5561616161616162 ================================= +============ Partial average Rand Index = 0.5029924242424243 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.060948797608829194 ================================= +============ Value of Jaccard Index = 0.5561616161616162 ================================= +============ Partial average of Jaccard Index = 0.3993479234411438 ====== +============ Precision = 0.23, Recall = 0.7931034482758621, F1 = 0.35658914728682173 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 17 : "heart attack" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "heart attack" =============== +============ Value of Rand Index = 0.9604040404040404 ================================= +============ Partial average Rand Index = 0.5298989898989899 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.057363574220074535 ================================= +============ Value of Jaccard Index = 0.9604040404040404 ================================= +============ Partial average of Jaccard Index = 0.43235122443896123 ====== +============ Precision = 0.98, Recall = 0.9245283018867925, F1 = 0.9514563106796116 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 18 : "new england" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 7 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 3, 6, 7, 9, 10, 11, 12, 14, 15, 17, 18, 20, 21, 22, 24, 25, 26, 28, 29, 32, 34, 35, 36, 37, 38, 41, 42, 43, 44, 45, 47, 49, 52, 54, 55, 56, 57, 59, 61, 63, 64, 65, 67, 68, 69, 70, 74, 75, 77, 81, 83, 85, 86, 88, 90, 91, 92, 94, 95, 97, 99] +The cluster 6 contains the snippets: [4, 13, 19, 27, 30, 31, 39, 40, 48, 50, 51, 58, 60, 66, 71, 72, 73, 76, 82, 87, 93, 96] +The cluster 2 contains the snippets: [2, 5, 8, 33, 46, 62, 84, 100] +The cluster 4 contains the snippets: [53, 78] +The cluster 5 contains the snippets: [80, 89] +The cluster 3 contains the snippets: [23, 98] +The cluster 7 contains the snippets: [16] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 23, 53, 80, 4, 16, 3, 5, 98, 78, 89, 13, 6, 8, 19, 7, 33, 27, 9, 46, 30, 10, 62, 31, 11, 84, 39, 12, 100, 40, 14, 48, 15, 50, 17, 51, 18, 58, 20, 60, 21, 66, 22, 71, 24, 72, 25, 73, 26, 76, 28, 82, 29, 87, 32, 93, 34, 96, 35, 36, 37, 38, 41, 42, 43, 44, 45, 47, 49, 52, 54, 55, 56, 57, 59, 61, 63, 64, 65, 67, 68, 69, 70, 74, 75, 77, 81, 83, 85, 86, 88, 90, 91, 92, 94, 95, 97, 99, 79] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "new england" =============== +============ Value of Rand Index = 0.5761616161616162 ================================= +============ Partial average Rand Index = 0.5324691358024691 ====== +============ Value of Adjusted Rand Index = 0.1339427281121651 ================================= +============ Partial average of Adjusted Rand Index = 0.06161797165852402 ================================= +============ Value of Jaccard Index = 0.35683629675045986 ================================= +============ Partial average of Jaccard Index = 0.42815595067848894 ====== +============ Precision = 0.2222222222222222, Recall = 0.5945945945945946, F1 = 0.32352941176470584 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 7 ============ +============ average size of the created clusters: 14.142857142857142 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 19 : "fly with me" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 6, 7, 8, 10, 13, 17, 22, 23, 26, 27, 28, 30, 35, 37, 38, 42, 44, 45, 51, 52, 55, 57, 58, 60, 63, 67, 69, 74, 75, 80, 81, 84, 85, 87, 88, 90, 92, 98, 99, 100] +The cluster 2 contains the snippets: [4, 24, 25, 66, 68] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 4, 3, 24, 6, 25, 7, 66, 8, 68, 10, 13, 17, 22, 23, 26, 27, 28, 30, 35, 37, 38, 42, 44, 45, 51, 52, 55, 57, 58, 60, 63, 67, 69, 74, 75, 80, 81, 84, 85, 87, 88, 90, 92, 98, 99, 100, 1, 5, 9, 11, 12, 14, 15, 16, 18, 19, 20, 21, 29, 31, 32, 33, 34, 36, 39, 40, 41, 43, 46, 47, 48, 49, 50, 53, 54, 56, 59, 61, 62, 64, 65, 70, 71, 72, 73, 76, 77, 78, 79, 82, 83, 86, 89, 91, 93, 94, 95, 96, 97] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "fly with me" =============== +============ Value of Rand Index = 0.5408080808080808 ================================= +============ Partial average Rand Index = 0.5329080276448697 ====== +============ Value of Adjusted Rand Index = 0.12632412017418 ================================= +============ Partial average of Adjusted Rand Index = 0.0650235584225059 ================================= +============ Value of Jaccard Index = 0.4577767175572519 ================================= +============ Partial average of Jaccard Index = 0.4297149384089501 ====== +============ Precision = 0.1702127659574468, Recall = 0.6666666666666666, F1 = 0.2711864406779661 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 23.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 20 : "agent blue" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "agent blue" =============== +============ Value of Rand Index = 0.5046464646464647 ================================= +============ Partial average Rand Index = 0.5314949494949494 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.061772380501380605 ================================= +============ Value of Jaccard Index = 0.5046464646464647 ================================= +============ Partial average of Jaccard Index = 0.43346151472082584 ====== +============ Precision = 0.26, Recall = 0.7647058823529411, F1 = 0.3880597014925373 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 21 : "across the universe" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 7, 8, 9, 10, 13, 14, 16, 17, 19, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 39, 44, 49, 51, 53, 58, 60, 65, 66, 70, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 88, 91, 92, 93, 95, 96, 97, 98, 99, 100] +The cluster 4 contains the snippets: [3, 4, 6, 11, 15, 18, 20, 40, 41, 42, 43, 47, 48, 50, 54, 57, 59, 61, 62, 63, 68, 69, 72, 84, 85, 86, 87, 90, 94] +The cluster 2 contains the snippets: [21, 22, 64, 67] +The cluster 3 contains the snippets: [33, 89] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 21, 33, 3, 2, 22, 89, 4, 7, 64, 6, 8, 67, 11, 9, 15, 10, 18, 13, 20, 14, 40, 16, 41, 17, 42, 19, 43, 23, 47, 24, 48, 25, 50, 26, 54, 27, 57, 28, 59, 29, 61, 30, 62, 31, 63, 32, 68, 34, 69, 35, 72, 36, 84, 37, 85, 39, 86, 44, 87, 49, 90, 51, 94, 53, 58, 60, 65, 66, 70, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 88, 91, 92, 93, 95, 96, 97, 98, 99, 100, 5, 12, 38, 45, 46, 52, 55, 56, 71] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "across the universe" =============== +============ Value of Rand Index = 0.6084848484848485 ================================= +============ Partial average Rand Index = 0.5351611351611351 ====== +============ Value of Adjusted Rand Index = 0.17154165094934704 ================================= +============ Partial average of Adjusted Rand Index = 0.06699948861795044 ================================= +============ Value of Jaccard Index = 0.3487903225806452 ================================= +============ Partial average of Jaccard Index = 0.429429553190341 ====== +============ Precision = 0.6373626373626373, Recall = 0.7435897435897436, F1 = 0.6863905325443787 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 22.75 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 22 : "attack of the mutant" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "attack of the mutant" =============== +============ Value of Rand Index = 0.48505050505050507 ================================= +============ Partial average Rand Index = 0.5328833792470156 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.06395405731713451 ================================= +============ Value of Jaccard Index = 0.48505050505050507 ================================= +============ Partial average of Jaccard Index = 0.43195777827489396 ====== +============ Precision = 0.16, Recall = 0.48484848484848486, F1 = 0.24060150375939848 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 23 : "the block" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [3, 4, 5, 6, 8, 9, 11, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 31, 32, 33, 34, 35, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 57, 58, 60, 61, 62, 63, 65, 67, 68, 69, 70, 72, 73, 74, 77, 78, 80, 81, 83, 84, 85, 86, 89, 90, 92, 93, 96, 97, 99] +The cluster 3 contains the snippets: [2, 12, 21, 29, 36, 53, 66, 75, 76, 79, 82, 87, 91, 100] +The cluster 2 contains the snippets: [7, 28, 30, 39, 56, 59, 64, 71, 88, 94, 95, 98] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 7, 2, 4, 28, 12, 5, 30, 21, 6, 39, 29, 8, 56, 36, 9, 59, 53, 11, 64, 66, 13, 71, 75, 14, 88, 76, 15, 94, 79, 16, 95, 82, 17, 98, 87, 18, 91, 19, 100, 20, 22, 23, 24, 25, 26, 27, 31, 32, 33, 34, 35, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 57, 58, 60, 61, 62, 63, 65, 67, 68, 69, 70, 72, 73, 74, 77, 78, 80, 81, 83, 84, 85, 86, 89, 90, 92, 93, 96, 97, 99, 1, 10] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the block" =============== +============ Value of Rand Index = 0.6933333333333334 ================================= +============ Partial average Rand Index = 0.5398594642072903 ====== +============ Value of Adjusted Rand Index = 0.37849478303189277 ================================= +============ Partial average of Adjusted Rand Index = 0.07762974104386312 ================================= +============ Value of Jaccard Index = 0.5689948892674617 ================================= +============ Partial average of Jaccard Index = 0.43791591353544035 ====== +============ Precision = 0.19387755102040816, Recall = 0.7037037037037037, F1 = 0.304 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 32.666666666666664 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 24 : "lake of the woods" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 43, 44, 45, 46, 47, 48, 49, 50, 53, 54, 55, 56, 57, 58, 59, 61, 62, 64, 65, 67, 68, 69, 70, 71, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 86, 87, 88, 90, 91, 92, 93, 94, 95, 96, 97, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 43, 44, 45, 46, 47, 48, 49, 50, 53, 54, 55, 56, 57, 58, 59, 61, 62, 64, 65, 67, 68, 69, 70, 71, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 86, 87, 88, 90, 91, 92, 93, 94, 95, 96, 97, 99, 100, 6, 14, 40, 42, 51, 52, 60, 63, 66, 72, 73, 85, 89, 98] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "lake of the woods" =============== +============ Value of Rand Index = 0.4351515151515152 ================================= +============ Partial average Rand Index = 0.535496632996633 ====== +============ Value of Adjusted Rand Index = -0.06047044899770698 ================================= +============ Partial average of Adjusted Rand Index = 0.07187556645879771 ================================= +============ Value of Jaccard Index = 0.3626624116708457 ================================= +============ Partial average of Jaccard Index = 0.43478035095774886 ====== +============ Precision = 0.16279069767441862, Recall = 0.34146341463414637, F1 = 0.22047244094488191 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 86.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 25 : "freedom of the seas" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 43, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 67, 68, 69, 70, 71, 72, 73, 74, 76, 78, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 91, 92, 93, 95, 96, 97, 98, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 43, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 67, 68, 69, 70, 71, 72, 73, 74, 76, 78, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 91, 92, 93, 95, 96, 97, 98, 100, 12, 25, 40, 42, 44, 66, 75, 77, 79, 87, 94, 99] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "freedom of the seas" =============== +============ Value of Rand Index = 0.6274747474747475 ================================= +============ Partial average Rand Index = 0.5391757575757576 ====== +============ Value of Adjusted Rand Index = 0.1773928766862555 ================================= +============ Partial average of Adjusted Rand Index = 0.07609625886789602 ================================= +============ Value of Jaccard Index = 0.5721577726218098 ================================= +============ Partial average of Jaccard Index = 0.44027544782431144 ====== +============ Precision = 0.7727272727272727, Recall = 0.918918918918919, F1 = 0.8395061728395061 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 88.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 26 : "robert watts" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 4, 5, 6, 8, 9, 10, 14, 15, 17, 19, 20, 21, 27, 28, 30, 31, 34, 36, 37, 38, 39, 41, 42, 44, 45, 48, 50, 51, 52, 54, 55, 56, 57, 62, 65, 66, 67, 68, 69, 70, 71, 72, 74, 76, 77, 78, 80, 81, 83, 85, 90, 92, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 4, 5, 6, 8, 9, 10, 14, 15, 17, 19, 20, 21, 27, 28, 30, 31, 34, 36, 37, 38, 39, 41, 42, 44, 45, 48, 50, 51, 52, 54, 55, 56, 57, 62, 65, 66, 67, 68, 69, 70, 71, 72, 74, 76, 77, 78, 80, 81, 83, 85, 90, 92, 96, 97, 98, 99, 100, 1, 3, 7, 11, 12, 13, 16, 18, 22, 23, 24, 25, 26, 29, 32, 33, 35, 40, 43, 46, 47, 49, 53, 58, 59, 60, 61, 63, 64, 73, 75, 79, 82, 84, 86, 87, 88, 89, 91, 93, 94, 95] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "robert watts" =============== +============ Value of Rand Index = 0.5561616161616162 ================================= +============ Partial average Rand Index = 0.5398290598290599 ====== +============ Value of Adjusted Rand Index = 0.11552175688870954 ================================= +============ Partial average of Adjusted Rand Index = 0.07761262417638884 ================================= +============ Value of Jaccard Index = 0.33605318827440317 ================================= +============ Partial average of Jaccard Index = 0.4362668993800842 ====== +============ Precision = 0.5, Recall = 0.5918367346938775, F1 = 0.5420560747663551 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 58.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 27 : "look back in anger" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 5, 8, 10, 11, 12, 14, 15, 17, 18, 20, 31, 32, 34, 36, 42, 43, 44, 46, 48, 49, 50, 51, 52, 53, 54, 59, 66, 68, 72, 73, 74, 76, 77, 80, 82, 83, 85, 86, 88, 90, 91, 93, 95, 99, 100] +The cluster 2 contains the snippets: [7, 9, 13, 21, 23, 24, 25, 26, 27, 28, 30, 35, 37, 39, 40, 45, 47, 55, 56, 57, 58, 61, 62, 63, 64, 65, 67, 69, 71, 75, 78, 81, 84, 87, 89, 92, 96, 97, 98] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 7, 2, 9, 3, 13, 5, 21, 8, 23, 10, 24, 11, 25, 12, 26, 14, 27, 15, 28, 17, 30, 18, 35, 20, 37, 31, 39, 32, 40, 34, 45, 36, 47, 42, 55, 43, 56, 44, 57, 46, 58, 48, 61, 49, 62, 50, 63, 51, 64, 52, 65, 53, 67, 54, 69, 59, 71, 66, 75, 68, 78, 72, 81, 73, 84, 74, 87, 76, 89, 77, 92, 80, 96, 82, 97, 83, 98, 85, 86, 88, 90, 91, 93, 95, 99, 100, 4, 6, 16, 19, 22, 29, 33, 38, 41, 60, 70, 79, 94] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "look back in anger" =============== +============ Value of Rand Index = 0.5511111111111111 ================================= +============ Partial average Rand Index = 0.540246913580247 ====== +============ Value of Adjusted Rand Index = 0.051707949947933596 ================================= +============ Partial average of Adjusted Rand Index = 0.07665319179755717 ================================= +============ Value of Jaccard Index = 0.2625290408230999 ================================= +============ Partial average of Jaccard Index = 0.4298321638779736 ====== +============ Precision = 0.3448275862068966, Recall = 0.6818181818181818, F1 = 0.4580152671755725 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 43.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 28 : "liquid air" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 26, 27, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 52, 53, 54, 55, 56, 57, 59, 60, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 91, 92, 93, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 26, 27, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 52, 53, 54, 55, 56, 57, 59, 60, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 91, 92, 93, 95, 96, 97, 98, 99, 100, 4, 5, 8, 11, 22, 23, 24, 25, 28, 32, 51, 58, 61, 77, 89, 90, 94] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "liquid air" =============== +============ Value of Rand Index = 0.5434343434343434 ================================= +============ Partial average Rand Index = 0.5403607503607505 ====== +============ Value of Adjusted Rand Index = -0.12029497697232204 ================================= +============ Partial average of Adjusted Rand Index = 0.06961932862720435 ================================= +============ Value of Jaccard Index = 0.5151255095473074 ================================= +============ Partial average of Jaccard Index = 0.4328783547947355 ====== +============ Precision = 0.1927710843373494, Recall = 0.8888888888888888, F1 = 0.31683168316831684 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 83.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 29 : "civil disobedience" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 2 contains the snippets: [2, 4, 6, 7, 9, 10, 13, 15, 16, 19, 20, 22, 23, 24, 25, 26, 30, 31, 32, 33, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 49, 50, 53, 54, 55, 57, 58, 59, 68, 69, 70, 75, 76, 78, 81, 82, 84, 87, 89, 92, 93, 96, 98, 100] +The cluster 1 contains the snippets: [1, 3, 5, 8, 11, 12, 14, 17, 18, 21, 27, 28, 29, 34, 35, 36, 46, 48, 51, 52, 60, 61, 62, 63, 64, 65, 66, 67, 71, 73, 74, 77, 79, 80, 83, 85, 86, 88, 90, 91, 95, 97, 99] +The cluster 3 contains the snippets: [56, 72, 94] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 56, 3, 4, 72, 5, 6, 94, 8, 7, 11, 9, 12, 10, 14, 13, 17, 15, 18, 16, 21, 19, 27, 20, 28, 22, 29, 23, 34, 24, 35, 25, 36, 26, 46, 30, 48, 31, 51, 32, 52, 33, 60, 37, 61, 38, 62, 39, 63, 40, 64, 41, 65, 42, 66, 43, 67, 44, 71, 45, 73, 47, 74, 49, 77, 50, 79, 53, 80, 54, 83, 55, 85, 57, 86, 58, 88, 59, 90, 68, 91, 69, 95, 70, 97, 75, 99, 76, 78, 81, 82, 84, 87, 89, 92, 93, 96, 98, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "civil disobedience" =============== +============ Value of Rand Index = 0.5244444444444445 ================================= +============ Partial average Rand Index = 0.5398119122257053 ====== +============ Value of Adjusted Rand Index = 0.03702698983078354 ================================= +============ Partial average of Adjusted Rand Index = 0.06849545487560363 ================================= +============ Value of Jaccard Index = 0.2858009708737864 ================================= +============ Partial average of Jaccard Index = 0.42780672086642696 ====== +============ Precision = 0.55, Recall = 0.6626506024096386, F1 = 0.6010928961748634 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 33.333333333333336 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 30 : "mount huxley" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "mount huxley" =============== +============ Value of Rand Index = 0.7670707070707071 ================================= +============ Partial average Rand Index = 0.5473872053872054 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.06621227304641683 ================================= +============ Value of Jaccard Index = 0.7670707070707071 ================================= +============ Partial average of Jaccard Index = 0.43911552040656965 ====== +============ Precision = 0.11, Recall = 0.8461538461538461, F1 = 0.19469026548672566 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 31 : "seduced and abandoned" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "seduced and abandoned" =============== +============ Value of Rand Index = 0.4109090909090909 ================================= +============ Partial average Rand Index = 0.5429846855653307 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.06407639327072596 ================================= +============ Value of Jaccard Index = 0.4109090909090909 ================================= +============ Partial average of Jaccard Index = 0.43820563558407033 ====== +============ Precision = 0.48, Recall = 0.8275862068965517, F1 = 0.6075949367088608 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 32 : "tai chi" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 46, 47, 48, 49, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 46, 47, 48, 49, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 45, 50, 53, 80] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "tai chi" =============== +============ Value of Rand Index = 0.6888888888888889 ================================= +============ Partial average Rand Index = 0.5475441919191919 ====== +============ Value of Adjusted Rand Index = 0.03061145021076101 ================================= +============ Partial average of Adjusted Rand Index = 0.06303061380010207 ================================= +============ Value of Jaccard Index = 0.67206132879046 ================================= +============ Partial average of Jaccard Index = 0.44551362599676997 ====== +============ Precision = 0.78125, Recall = 0.5319148936170213, F1 = 0.6329113924050632 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 96.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 33 : "a bell for adano" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "a bell for adano" =============== +============ Value of Rand Index = 0.3751515151515151 ================================= +============ Partial average Rand Index = 0.5423201714110805 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.06112059520009897 ================================= +============ Value of Jaccard Index = 0.3751515151515151 ================================= +============ Partial average of Jaccard Index = 0.44338144081964104 ====== +============ Precision = 0.51, Recall = 0.6986301369863014, F1 = 0.5895953757225434 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 34 : "gay bar" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 5, 6, 7, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 5, 6, 7, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 4, 8, 13, 51, 69, 80] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "gay bar" =============== +============ Value of Rand Index = 0.8341414141414142 ================================= +============ Partial average Rand Index = 0.5509031491384432 ====== +============ Value of Adjusted Rand Index = 0.38659821356606644 ================================= +============ Partial average of Adjusted Rand Index = 0.07069346632850979 ================================= +============ Value of Jaccard Index = 0.8206248634476732 ================================= +============ Partial average of Jaccard Index = 0.4544768356028184 ====== +============ Precision = 0.925531914893617, Recall = 0.8969072164948454, F1 = 0.9109947643979057 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 94.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 35 : "down in the valley" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "down in the valley" =============== +============ Value of Rand Index = 0.48323232323232324 ================================= +============ Partial average Rand Index = 0.5489696969696969 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.06867365300483808 ================================= +============ Value of Jaccard Index = 0.48323232323232324 ================================= +============ Partial average of Jaccard Index = 0.4552984209636614 ====== +============ Precision = 0.21, Recall = 0.6176470588235294, F1 = 0.31343283582089554 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 36 : "space raiders" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "space raiders" =============== +============ Value of Rand Index = 0.35777777777777775 ================================= +============ Partial average Rand Index = 0.5436588103254769 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.06676605153248145 ================================= +============ Value of Jaccard Index = 0.35777777777777775 ================================= +============ Partial average of Jaccard Index = 0.4525895142084979 ====== +============ Precision = 0.54, Recall = 0.5806451612903226, F1 = 0.5595854922279794 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 37 : "black hole" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 2 contains the snippets: [1, 2, 5, 6, 8, 9, 10, 13, 16, 17, 19, 20, 23, 29, 30, 31, 32, 34, 36, 37, 38, 39, 40, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 57, 58, 59, 61, 63, 64, 67, 68, 69, 72, 74, 77, 78, 80, 81, 83, 87, 90, 96, 97, 99, 100] +The cluster 1 contains the snippets: [3, 4, 7, 11, 12, 14, 15, 18, 21, 22, 24, 25, 27, 33, 35, 41, 46, 52, 54, 56, 60, 62, 65, 66, 70, 71, 75, 76, 79, 85, 86, 88, 89, 91, 93, 94, 98] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 1, 4, 2, 7, 5, 11, 6, 12, 8, 14, 9, 15, 10, 18, 13, 21, 16, 22, 17, 24, 19, 25, 20, 27, 23, 33, 29, 35, 30, 41, 31, 46, 32, 52, 34, 54, 36, 56, 37, 60, 38, 62, 39, 65, 40, 66, 42, 70, 43, 71, 44, 75, 45, 76, 47, 79, 48, 85, 49, 86, 50, 88, 51, 89, 53, 91, 55, 93, 57, 94, 58, 98, 59, 61, 63, 64, 67, 68, 69, 72, 74, 77, 78, 80, 81, 83, 87, 90, 96, 97, 99, 100, 26, 28, 73, 82, 84, 92, 95] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "black hole" =============== +============ Value of Rand Index = 0.46484848484848484 ================================= +============ Partial average Rand Index = 0.5415288015288016 ====== +============ Value of Adjusted Rand Index = 0.02010845611231045 ================================= +============ Partial average of Adjusted Rand Index = 0.0655050354400444 ================================= +============ Value of Jaccard Index = 0.44984423676012464 ================================= +============ Partial average of Jaccard Index = 0.452515317520704 ====== +============ Precision = 0.989247311827957, Recall = 0.9387755102040817, F1 = 0.9633507853403142 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 46.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 38 : "fata morgana" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [3, 5, 9, 16, 17, 19, 23, 24, 27, 30, 34, 45, 57, 59, 65, 68, 72, 75, 78, 87, 90, 93, 94, 97, 98] +The cluster 2 contains the snippets: [2, 4, 21, 33, 36, 39, 40, 48, 49, 51, 58, 77, 81, 83, 86, 92] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 2, 5, 4, 9, 21, 16, 33, 17, 36, 19, 39, 23, 40, 24, 48, 27, 49, 30, 51, 34, 58, 45, 77, 57, 81, 59, 83, 65, 86, 68, 92, 72, 75, 78, 87, 90, 93, 94, 97, 98, 1, 6, 7, 8, 10, 11, 12, 13, 14, 15, 18, 20, 22, 25, 26, 28, 29, 31, 32, 35, 37, 38, 41, 42, 43, 44, 46, 47, 50, 52, 53, 54, 55, 56, 60, 61, 62, 63, 64, 66, 67, 69, 70, 71, 73, 74, 76, 79, 80, 82, 84, 85, 88, 89, 91, 95, 96, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "fata morgana" =============== +============ Value of Rand Index = 0.6149494949494949 ================================= +============ Partial average Rand Index = 0.5434609250398723 ====== +============ Value of Adjusted Rand Index = 0.24055649323494657 ================================= +============ Partial average of Adjusted Rand Index = 0.07011165275043657 ================================= +============ Value of Jaccard Index = 0.3991172761664565 ================================= +============ Partial average of Jaccard Index = 0.45111010590611866 ====== +============ Precision = 0.3902439024390244, Recall = 0.4444444444444444, F1 = 0.4155844155844156 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 20.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 39 : "all that jazz" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 2 contains the snippets: [5, 8, 11, 13, 17, 18, 19, 20, 21, 22, 23, 24, 25, 33, 34, 35, 36, 37, 38, 40, 41, 43, 44, 49, 54, 56, 58, 60, 61, 62, 63, 66, 70, 72, 73, 75, 76, 79, 80, 81, 83, 84, 85, 86, 88, 89, 90, 91, 92, 93, 96] +The cluster 1 contains the snippets: [1, 2, 3, 4, 6, 7, 12, 14, 16, 29, 30, 32, 39, 42, 47, 50, 52, 57, 64, 67, 68, 77, 78, 82, 97, 98, 99] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 5, 2, 8, 3, 11, 4, 13, 6, 17, 7, 18, 12, 19, 14, 20, 16, 21, 29, 22, 30, 23, 32, 24, 39, 25, 42, 33, 47, 34, 50, 35, 52, 36, 57, 37, 64, 38, 67, 40, 68, 41, 77, 43, 78, 44, 82, 49, 97, 54, 98, 56, 99, 58, 60, 61, 62, 63, 66, 70, 72, 73, 75, 76, 79, 80, 81, 83, 84, 85, 86, 88, 89, 90, 91, 92, 93, 96, 9, 10, 15, 26, 27, 28, 31, 45, 46, 48, 51, 53, 55, 59, 65, 69, 71, 74, 87, 94, 95, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "all that jazz" =============== +============ Value of Rand Index = 0.6084848484848485 ================================= +============ Partial average Rand Index = 0.545128205128205 ====== +============ Value of Adjusted Rand Index = 0.1745203985765854 ================================= +============ Partial average of Adjusted Rand Index = 0.07278880007931218 ================================= +============ Value of Jaccard Index = 0.3625 ================================= +============ Partial average of Jaccard Index = 0.4488380519085259 ====== +============ Precision = 0.358974358974359, Recall = 0.6666666666666666, F1 = 0.4666666666666667 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 39.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 40 : "ten little indians" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 5, 8, 9, 10, 11, 15, 18, 20, 23, 24, 25, 26, 28, 29, 30, 31, 33, 36, 37, 40, 41, 43, 44, 45, 46, 48, 50, 53, 54, 55, 56, 57, 58, 60, 61, 63, 64, 66, 67, 68, 70, 74, 77, 78, 80, 81, 83, 85, 87, 91, 92, 93, 94, 95, 96, 99] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 5, 8, 9, 10, 11, 15, 18, 20, 23, 24, 25, 26, 28, 29, 30, 31, 33, 36, 37, 40, 41, 43, 44, 45, 46, 48, 50, 53, 54, 55, 56, 57, 58, 60, 61, 63, 64, 66, 67, 68, 70, 74, 77, 78, 80, 81, 83, 85, 87, 91, 92, 93, 94, 95, 96, 99, 2, 3, 4, 6, 7, 12, 13, 14, 16, 17, 19, 21, 22, 27, 32, 34, 35, 38, 39, 42, 47, 49, 51, 52, 59, 62, 65, 69, 71, 72, 73, 75, 76, 79, 82, 84, 86, 88, 89, 90, 97, 98, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "ten little indians" =============== +============ Value of Rand Index = 0.5454545454545454 ================================= +============ Partial average Rand Index = 0.5451363636363636 ====== +============ Value of Adjusted Rand Index = 0.08939664399401168 ================================= +============ Partial average of Adjusted Rand Index = 0.07320399617717967 ================================= +============ Value of Jaccard Index = 0.22865958176208434 ================================= +============ Partial average of Jaccard Index = 0.44333359015486484 ====== +============ Precision = 0.3157894736842105, Recall = 0.26865671641791045, F1 = 0.29032258064516125 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 57.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 41 : "speed of light" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 5 snippet clusters: ==================== +The cluster 3 contains the snippets: [3, 4, 5, 6, 9, 10, 11, 12, 14, 16, 17, 23, 24, 27, 30, 32, 33, 36, 38, 40, 42, 43, 44, 45, 46, 47, 48, 50, 51, 53, 56, 60, 61, 64, 66, 68, 69, 70, 71, 81, 84, 86, 87, 88, 89, 93, 95, 97, 100] +The cluster 1 contains the snippets: [1, 2, 13, 15, 18, 19, 20, 21, 22, 25, 28, 29, 31, 34, 35, 37, 39, 41, 49, 54, 55, 57, 59, 62, 65, 67, 72, 73, 74, 76, 77, 78, 79, 80, 82, 83, 85, 91, 94, 96, 98, 99] +The cluster 4 contains the snippets: [8, 26, 52, 63, 90] +The cluster 5 contains the snippets: [58, 75, 92] +The cluster 2 contains the snippets: [7] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 7, 3, 8, 58, 2, 4, 26, 75, 13, 5, 52, 92, 15, 6, 63, 18, 9, 90, 19, 10, 20, 11, 21, 12, 22, 14, 25, 16, 28, 17, 29, 23, 31, 24, 34, 27, 35, 30, 37, 32, 39, 33, 41, 36, 49, 38, 54, 40, 55, 42, 57, 43, 59, 44, 62, 45, 65, 46, 67, 47, 72, 48, 73, 50, 74, 51, 76, 53, 77, 56, 78, 60, 79, 61, 80, 64, 82, 66, 83, 68, 85, 69, 91, 70, 94, 71, 96, 81, 98, 84, 99, 86, 87, 88, 89, 93, 95, 97, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "speed of light" =============== +============ Value of Rand Index = 0.518989898989899 ================================= +============ Partial average Rand Index = 0.5444986449864498 ====== +============ Value of Adjusted Rand Index = 0.030310135877278533 ================================= +============ Partial average of Adjusted Rand Index = 0.07215780446254792 ================================= +============ Value of Jaccard Index = 0.29888103651354536 ================================= +============ Partial average of Jaccard Index = 0.43981035713922295 ====== +============ Precision = 0.42, Recall = 0.9545454545454546, F1 = 0.5833333333333334 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 5 ============ +============ average size of the created clusters: 20.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 42 : "ray of light" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 5, 6, 11, 12, 15, 18, 21, 22, 23, 24, 25, 26, 27, 29, 30, 32, 33, 34, 37, 39, 42, 43, 45, 46, 50, 52, 53, 54, 57, 60, 61, 63, 64, 65, 66, 67, 68, 70, 73, 74, 75, 83, 85, 86, 89, 95, 96, 97, 99] +The cluster 2 contains the snippets: [7, 8, 9, 13, 16, 17, 19, 28, 31, 35, 36, 40, 41, 44, 48, 51, 55, 71, 72, 76, 77, 78, 79, 80, 81, 82, 87, 88, 90, 91, 92, 93, 94, 98, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 7, 2, 8, 3, 9, 5, 13, 6, 16, 11, 17, 12, 19, 15, 28, 18, 31, 21, 35, 22, 36, 23, 40, 24, 41, 25, 44, 26, 48, 27, 51, 29, 55, 30, 71, 32, 72, 33, 76, 34, 77, 37, 78, 39, 79, 42, 80, 43, 81, 45, 82, 46, 87, 50, 88, 52, 90, 53, 91, 54, 92, 57, 93, 60, 94, 61, 98, 63, 100, 64, 65, 66, 67, 68, 70, 73, 74, 75, 83, 85, 86, 89, 95, 96, 97, 99, 4, 10, 14, 20, 38, 47, 49, 56, 58, 59, 62, 69, 84] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "ray of light" =============== +============ Value of Rand Index = 0.536969696969697 ================================= +============ Partial average Rand Index = 0.5443193843193844 ====== +============ Value of Adjusted Rand Index = 0.042542364213326696 ================================= +============ Partial average of Adjusted Rand Index = 0.07145267493280458 ================================= +============ Value of Jaccard Index = 0.27742749054224464 ================================= +============ Partial average of Jaccard Index = 0.43594409841072346 ====== +============ Precision = 0.40229885057471265, Recall = 0.8333333333333334, F1 = 0.5426356589147286 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 43.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 43 : "soul food" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 5, 7, 8, 9, 10, 11, 12, 13, 14, 17, 20, 24, 25, 26, 27, 30, 33, 35, 37, 38, 39, 41, 42, 43, 45, 46, 47, 48, 49, 50, 52, 53, 58, 60, 61, 64, 65, 67, 69, 70, 71, 72, 74, 76, 78, 80, 82, 85, 88, 91, 93, 94, 95, 96, 97, 98] +The cluster 2 contains the snippets: [3, 6, 18, 19, 21, 22, 23, 28, 34, 36, 40, 44, 51, 55, 56, 63, 68, 73, 75, 77, 79, 81, 83, 84, 86, 87, 90, 92, 100] +The cluster 3 contains the snippets: [15, 31, 32, 54, 62, 66, 99] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 3, 15, 2, 6, 31, 4, 18, 32, 5, 19, 54, 7, 21, 62, 8, 22, 66, 9, 23, 99, 10, 28, 11, 34, 12, 36, 13, 40, 14, 44, 17, 51, 20, 55, 24, 56, 25, 63, 26, 68, 27, 73, 30, 75, 33, 77, 35, 79, 37, 81, 38, 83, 39, 84, 41, 86, 42, 87, 43, 90, 45, 92, 46, 100, 47, 48, 49, 50, 52, 53, 58, 60, 61, 64, 65, 67, 69, 70, 71, 72, 74, 76, 78, 80, 82, 85, 88, 91, 93, 94, 95, 96, 97, 98, 16, 29, 57, 59, 89] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "soul food" =============== +============ Value of Rand Index = 0.555959595959596 ================================= +============ Partial average Rand Index = 0.5445900869156683 ====== +============ Value of Adjusted Rand Index = 0.14746453753656577 ================================= +============ Partial average of Adjusted Rand Index = 0.07322039266777576 ================================= +============ Value of Jaccard Index = 0.4078663793103448 ================================= +============ Partial average of Jaccard Index = 0.4352911281990867 ====== +============ Precision = 0.8, Recall = 0.8085106382978723, F1 = 0.8042328042328043 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 31.666666666666668 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 44 : "volcanic rock" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 2 contains the snippets: [1, 2, 4, 5, 6, 8, 10, 13, 15, 16, 17, 18, 19, 22, 23, 24, 31, 32, 33, 36, 37, 38, 39, 41, 43, 44, 45, 47, 48, 49, 54, 55, 56, 57, 58, 59, 60, 61, 65, 66, 67, 71, 72, 73, 75, 79, 80, 81, 82, 83, 84, 89, 90, 91, 92, 93, 94, 95] +The cluster 1 contains the snippets: [3, 7, 9, 11, 12, 14, 20, 21, 25, 26, 27, 28, 29, 30, 34, 35, 40, 42, 46, 50, 51, 53, 62, 63, 64, 68, 69, 70, 74, 76, 77, 85, 86, 87, 88, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 1, 7, 2, 9, 4, 11, 5, 12, 6, 14, 8, 20, 10, 21, 13, 25, 15, 26, 16, 27, 17, 28, 18, 29, 19, 30, 22, 34, 23, 35, 24, 40, 31, 42, 32, 46, 33, 50, 36, 51, 37, 53, 38, 62, 39, 63, 41, 64, 43, 68, 44, 69, 45, 70, 47, 74, 48, 76, 49, 77, 54, 85, 55, 86, 56, 87, 57, 88, 58, 97, 59, 98, 60, 99, 61, 100, 65, 66, 67, 71, 72, 73, 75, 79, 80, 81, 82, 83, 84, 89, 90, 91, 92, 93, 94, 95, 52, 78, 96] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "volcanic rock" =============== +============ Value of Rand Index = 0.5187878787878788 ================================= +============ Partial average Rand Index = 0.5440036730945821 ====== +============ Value of Adjusted Rand Index = 0.061476926750641744 ================================= +============ Partial average of Adjusted Rand Index = 0.07295349571511361 ================================= +============ Value of Jaccard Index = 0.4851955910957424 ================================= +============ Partial average of Jaccard Index = 0.4364253205376471 ====== +============ Precision = 0.9690721649484536, Recall = 0.9894736842105263, F1 = 0.9791666666666666 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 48.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 45 : "storm in a teacup" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "storm in a teacup" =============== +============ Value of Rand Index = 0.5145454545454545 ================================= +============ Partial average Rand Index = 0.5433490460157127 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.07133230692144443 ================================= +============ Value of Jaccard Index = 0.5145454545454545 ================================= +============ Partial average of Jaccard Index = 0.43816132351559833 ====== +============ Precision = 0.07, Recall = 0.23333333333333334, F1 = 0.1076923076923077 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 46 : "double negative" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 3, 4, 15, 25, 29, 31, 34, 35, 41, 45, 46, 47, 48, 50, 51, 55, 57, 58, 62, 67, 69, 72, 74, 78, 81, 85, 88, 89, 95, 96, 97, 99, 100] +The cluster 2 contains the snippets: [2, 14, 39, 43, 54, 60, 66, 68, 70, 83, 84] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 14, 4, 39, 15, 43, 25, 54, 29, 60, 31, 66, 34, 68, 35, 70, 41, 83, 45, 84, 46, 47, 48, 50, 51, 55, 57, 58, 62, 67, 69, 72, 74, 78, 81, 85, 88, 89, 95, 96, 97, 99, 100, 5, 6, 7, 8, 9, 10, 11, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 32, 33, 36, 37, 38, 40, 42, 44, 49, 52, 53, 56, 59, 61, 63, 64, 65, 71, 73, 75, 76, 77, 79, 80, 82, 86, 87, 90, 91, 92, 93, 94, 98] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "double negative" =============== +============ Value of Rand Index = 0.5862626262626263 ================================= +============ Partial average Rand Index = 0.5442819499341239 ====== +============ Value of Adjusted Rand Index = 0.058838363942063286 ================================= +============ Partial average of Adjusted Rand Index = 0.07106069946537094 ================================= +============ Value of Jaccard Index = 0.237243947858473 ================================= +============ Partial average of Jaccard Index = 0.43379355447957385 ====== +============ Precision = 0.5777777777777777, Recall = 0.3466666666666667, F1 = 0.4333333333333333 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 22.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 47 : "the whole truth" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 3, 4, 5, 7, 8, 9, 10, 12, 14, 15, 16, 17, 18, 21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 72, 73, 74, 75, 77, 78, 79, 80, 83, 84, 85, 86, 88, 89, 90, 91, 93, 94, 95, 97, 98, 99, 100] +The cluster 2 contains the snippets: [11, 19, 20, 35, 81, 82, 87, 92, 96] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 11, 3, 19, 4, 20, 5, 35, 7, 81, 8, 82, 9, 87, 10, 92, 12, 96, 14, 15, 16, 17, 18, 21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 72, 73, 74, 75, 77, 78, 79, 80, 83, 84, 85, 86, 88, 89, 90, 91, 93, 94, 95, 97, 98, 99, 100, 2, 6, 13, 23, 28, 34, 36, 38, 71, 76] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the whole truth" =============== +============ Value of Rand Index = 0.7212121212121212 ================================= +============ Partial average Rand Index = 0.548046421663443 ====== +============ Value of Adjusted Rand Index = 0.3564577169201128 ================================= +============ Partial average of Adjusted Rand Index = 0.07713297643249309 ================================= +============ Value of Jaccard Index = 0.670487106017192 ================================= +============ Partial average of Jaccard Index = 0.43882958749101253 ====== +============ Precision = 0.05555555555555555, Recall = 0.3333333333333333, F1 = 0.09523809523809525 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 45.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 48 : "james bond" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100] +The cluster 3 contains the snippets: [29, 37, 88] +The cluster 2 contains the snippets: [61] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 61, 29, 2, 37, 3, 88, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 94] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "james bond" =============== +============ Value of Rand Index = 0.4783838383838384 ================================= +============ Partial average Rand Index = 0.5465951178451179 ====== +============ Value of Adjusted Rand Index = -3.2599121889922956E-4 ================================= +============ Partial average of Adjusted Rand Index = 0.07551924793975576 ================================= +============ Value of Jaccard Index = 0.44899701237729406 ================================= +============ Partial average of Jaccard Index = 0.43904140884281007 ====== +============ Precision = 0.5555555555555556, Recall = 0.3691275167785235, F1 = 0.44354838709677424 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 33.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 49 : "survival of the fittest" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 8, 15, 17, 19, 21, 22, 25, 26, 27, 28, 29, 30, 31, 32, 35, 36, 39, 40, 42, 46, 48, 50, 52, 55, 56, 58, 59, 62, 63, 65, 68, 71, 72, 73, 77, 78, 80, 82, 84, 85, 86, 87, 88, 89, 90, 93, 95, 97, 99, 100] +The cluster 2 contains the snippets: [10, 11, 12, 13, 14, 18, 20, 23, 33, 37, 44, 49, 51, 53, 60, 64, 74, 79, 83, 91, 92, 96] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 10, 2, 11, 3, 12, 4, 13, 5, 14, 6, 18, 8, 20, 15, 23, 17, 33, 19, 37, 21, 44, 22, 49, 25, 51, 26, 53, 27, 60, 28, 64, 29, 74, 30, 79, 31, 83, 32, 91, 35, 92, 36, 96, 39, 40, 42, 46, 48, 50, 52, 55, 56, 58, 59, 62, 63, 65, 68, 71, 72, 73, 77, 78, 80, 82, 84, 85, 86, 87, 88, 89, 90, 93, 95, 97, 99, 100, 7, 9, 16, 24, 34, 38, 41, 43, 45, 47, 54, 57, 61, 66, 67, 69, 70, 75, 76, 81, 94, 98] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "survival of the fittest" =============== +============ Value of Rand Index = 0.5127272727272727 ================================= +============ Partial average Rand Index = 0.5459039373325089 ====== +============ Value of Adjusted Rand Index = 0.00273801429647735 ================================= +============ Partial average of Adjusted Rand Index = 0.07403391664091334 ================================= +============ Value of Jaccard Index = 0.2684258416742493 ================================= +============ Partial average of Jaccard Index = 0.43555945849243144 ====== +============ Precision = 0.1794871794871795, Recall = 0.4, F1 = 0.24778761061946902 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 39.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 50 : "mark forster" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "mark forster" =============== +============ Value of Rand Index = 0.46646464646464647 ================================= +============ Partial average Rand Index = 0.5443151515151516 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.07255323830809507 ================================= +============ Value of Jaccard Index = 0.46646464646464647 ================================= +============ Partial average of Jaccard Index = 0.43617756225187576 ====== +============ Precision = 0.38, Recall = 0.8837209302325582, F1 = 0.5314685314685315 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 51 : "rain or shine" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 6, 7, 9, 10, 11, 12, 13, 18, 19, 23, 25, 26, 34, 37, 43, 45, 47, 48, 49, 53, 54, 56, 58, 59, 60, 62, 64, 67, 68, 70, 72, 73, 74, 75, 76, 78, 79, 80, 81, 84, 85, 86, 89, 90, 92, 94, 96, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 3, 6, 7, 9, 10, 11, 12, 13, 18, 19, 23, 25, 26, 34, 37, 43, 45, 47, 48, 49, 53, 54, 56, 58, 59, 60, 62, 64, 67, 68, 70, 72, 73, 74, 75, 76, 78, 79, 80, 81, 84, 85, 86, 89, 90, 92, 94, 96, 100, 1, 4, 5, 8, 14, 15, 16, 17, 20, 21, 22, 24, 27, 28, 29, 30, 31, 32, 33, 35, 36, 38, 39, 40, 41, 42, 44, 46, 50, 51, 52, 55, 57, 61, 63, 65, 66, 69, 71, 77, 82, 83, 87, 88, 91, 93, 95, 97, 98, 99] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "rain or shine" =============== +============ Value of Rand Index = 0.49717171717171715 ================================= +============ Partial average Rand Index = 0.543390770449594 ====== +============ Value of Adjusted Rand Index = 6.546976504928194E-4 ================================= +============ Partial average of Adjusted Rand Index = 0.07114346300108326 ================================= +============ Value of Jaccard Index = 0.44970152553614856 ================================= +============ Partial average of Jaccard Index = 0.4364427380025478 ====== +============ Precision = 0.08, Recall = 0.4, F1 = 0.13333333333333333 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 50.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 52 : "another day in paradise" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 6, 7, 11, 14, 15, 17, 21, 22, 26, 27, 31, 32, 37, 50, 51, 54, 59, 60, 64, 65, 72, 73, 75, 77, 78, 79, 84, 87, 88, 91, 92, 93, 98] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 6, 7, 11, 14, 15, 17, 21, 22, 26, 27, 31, 32, 37, 50, 51, 54, 59, 60, 64, 65, 72, 73, 75, 77, 78, 79, 84, 87, 88, 91, 92, 93, 98, 3, 4, 5, 8, 9, 10, 12, 13, 16, 18, 19, 20, 23, 24, 25, 28, 29, 30, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 52, 53, 55, 56, 57, 58, 61, 62, 63, 66, 67, 68, 69, 70, 71, 74, 76, 80, 81, 82, 83, 85, 86, 89, 90, 94, 95, 96, 97, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "another day in paradise" =============== +============ Value of Rand Index = 0.6674747474747474 ================================= +============ Partial average Rand Index = 0.545777000777001 ====== +============ Value of Adjusted Rand Index = 0.35237285239073673 ================================= +============ Partial average of Adjusted Rand Index = 0.07655172048934583 ================================= +============ Value of Jaccard Index = 0.44876088412592097 ================================= +============ Partial average of Jaccard Index = 0.43667962542799726 ====== +============ Precision = 0.6, Recall = 0.42857142857142855, F1 = 0.5 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 35.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 53 : "tree of knowledge" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 4, 6, 7, 8, 10, 12, 13, 15, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 32, 33, 35, 36, 38, 39, 40, 43, 45, 46, 47, 48, 50, 52, 53, 54, 55, 56, 57, 58, 60, 61, 63, 64, 65, 66, 67, 69, 72, 74, 76, 77, 78, 79, 80, 83, 84, 85, 86, 87, 88, 89, 93, 94, 95, 97, 98] +The cluster 2 contains the snippets: [11, 18, 42, 44, 51, 70, 82] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 11, 4, 18, 6, 42, 7, 44, 8, 51, 10, 70, 12, 82, 13, 15, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 32, 33, 35, 36, 38, 39, 40, 43, 45, 46, 47, 48, 50, 52, 53, 54, 55, 56, 57, 58, 60, 61, 63, 64, 65, 66, 67, 69, 72, 74, 76, 77, 78, 79, 80, 83, 84, 85, 86, 87, 88, 89, 93, 94, 95, 97, 98, 2, 3, 5, 9, 14, 16, 17, 27, 30, 31, 34, 37, 41, 49, 59, 62, 68, 71, 73, 75, 81, 90, 91, 92, 96, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "tree of knowledge" =============== +============ Value of Rand Index = 0.4987878787878788 ================================= +============ Partial average Rand Index = 0.5448904135696591 ====== +============ Value of Adjusted Rand Index = -0.003380509811861151 ================================= +============ Partial average of Adjusted Rand Index = 0.07504356520064381 ================================= +============ Value of Jaccard Index = 0.34813452443510245 ================================= +============ Partial average of Jaccard Index = 0.4350089631451125 ====== +============ Precision = 0.273972602739726, Recall = 0.6666666666666666, F1 = 0.3883495145631068 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 36.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 54 : "indy 500" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "indy 500" =============== +============ Value of Rand Index = 0.7018181818181818 ================================= +============ Partial average Rand Index = 0.5477964833520391 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.07365386954878003 ================================= +============ Value of Jaccard Index = 0.7018181818181818 ================================= +============ Partial average of Jaccard Index = 0.4399498746020212 ====== +============ Precision = 0.82, Recall = 1.0, F1 = 0.9010989010989011 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 55 : "amarillo by morning" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "amarillo by morning" =============== +============ Value of Rand Index = 0.611919191919192 ================================= +============ Partial average Rand Index = 0.5489623507805328 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.07231470828425676 ================================= +============ Value of Jaccard Index = 0.611919191919192 ================================= +============ Partial average of Jaccard Index = 0.4430765894623334 ====== +============ Precision = 0.75, Recall = 0.974025974025974, F1 = 0.8474576271186441 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 56 : "queen of the night" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 30, 33, 34, 35, 36, 37, 38, 40, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 57, 58, 59, 60, 61, 63, 64, 65, 66, 67, 68, 69, 70, 71, 73, 74, 75, 76, 77, 78, 79, 81, 82, 83, 84, 86, 87, 88, 89, 90, 92, 95, 96, 97, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 30, 33, 34, 35, 36, 37, 38, 40, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 57, 58, 59, 60, 61, 63, 64, 65, 66, 67, 68, 69, 70, 71, 73, 74, 75, 76, 77, 78, 79, 81, 82, 83, 84, 86, 87, 88, 89, 90, 92, 95, 96, 97, 99, 100, 8, 9, 11, 24, 27, 28, 29, 31, 32, 39, 41, 43, 54, 62, 72, 80, 85, 91, 93, 94, 98] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "queen of the night" =============== +============ Value of Rand Index = 0.4111111111111111 ================================= +============ Partial average Rand Index = 0.5465007215007217 ====== +============ Value of Adjusted Rand Index = -0.11890299932769287 ================================= +============ Partial average of Adjusted Rand Index = 0.0689001063626148 ================================= +============ Value of Jaccard Index = 0.29640357229061065 ================================= +============ Partial average of Jaccard Index = 0.4404574284414098 ====== +============ Precision = 0.1518987341772152, Recall = 0.3157894736842105, F1 = 0.20512820512820512 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 79.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 57 : "cassius marcellus clay" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "cassius marcellus clay" =============== +============ Value of Rand Index = 0.3997979797979798 ================================= +============ Partial average Rand Index = 0.5439269891901473 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.06769133256677945 ================================= +============ Value of Jaccard Index = 0.3997979797979798 ================================= +============ Partial average of Jaccard Index = 0.43974410478099873 ====== +============ Precision = 0.41, Recall = 0.7884615384615384, F1 = 0.5394736842105263 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 58 : "space opera" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 5, 10, 25, 65] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "space opera" =============== +============ Value of Rand Index = 0.36848484848484847 ================================= +============ Partial average Rand Index = 0.5409021246952284 ====== +============ Value of Adjusted Rand Index = -0.0013559978237477333 ================================= +============ Partial average of Adjusted Rand Index = 0.06650086135314967 ================================= +============ Value of Jaccard Index = 0.334610472541507 ================================= +============ Partial average of Jaccard Index = 0.43793145594928334 ====== +============ Precision = 0.5, Recall = 0.676056338028169, F1 = 0.5748502994011976 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 96.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 59 : "alpha dog" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 6, 8, 10, 12, 24, 38, 40, 45, 50, 51, 58, 66, 70, 73, 74, 75, 85, 86, 90, 94, 98] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 4, 6, 8, 10, 12, 24, 38, 40, 45, 50, 51, 58, 66, 70, 73, 74, 75, 85, 86, 90, 94, 98, 3, 5, 7, 9, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 41, 42, 43, 44, 46, 47, 48, 49, 52, 53, 54, 55, 56, 57, 59, 60, 61, 62, 63, 64, 65, 67, 68, 69, 71, 72, 76, 77, 78, 79, 80, 81, 82, 83, 84, 87, 88, 89, 91, 92, 93, 95, 96, 97, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "alpha dog" =============== +============ Value of Rand Index = 0.7844444444444445 ================================= +============ Partial average Rand Index = 0.5450299606231811 ====== +============ Value of Adjusted Rand Index = 0.5198996107228949 ================================= +============ Partial average of Adjusted Rand Index = 0.07418558591873857 ================================= +============ Value of Jaccard Index = 0.7058985667034179 ================================= +============ Partial average of Jaccard Index = 0.4424732713857941 ====== +============ Precision = 0.6666666666666666, Recall = 0.64, F1 = 0.6530612244897959 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 24.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 60 : "bullet in the head" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "bullet in the head" =============== +============ Value of Rand Index = 0.33515151515151514 ================================= +============ Partial average Rand Index = 0.5415319865319866 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.07294915948675959 ================================= +============ Value of Jaccard Index = 0.33515151515151514 ================================= +============ Partial average of Jaccard Index = 0.44068457544855616 ====== +============ Precision = 0.33, Recall = 0.55, F1 = 0.4125 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 61 : "jump cut" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 5, 7, 8, 10, 12, 17, 20, 21, 22, 23, 24, 25, 29, 30, 31, 33, 34, 37, 39, 41, 42, 43, 44, 45, 46, 47, 50, 51, 52, 53, 55, 56, 58, 59, 60, 62, 64, 65, 67, 72, 73, 74, 77, 79, 81, 82, 83, 84, 85, 86, 87, 88, 89, 92, 93, 94, 95, 97] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 4, 5, 7, 8, 10, 12, 17, 20, 21, 22, 23, 24, 25, 29, 30, 31, 33, 34, 37, 39, 41, 42, 43, 44, 45, 46, 47, 50, 51, 52, 53, 55, 56, 58, 59, 60, 62, 64, 65, 67, 72, 73, 74, 77, 79, 81, 82, 83, 84, 85, 86, 87, 88, 89, 92, 93, 94, 95, 97, 3, 6, 9, 11, 13, 14, 15, 16, 18, 19, 26, 27, 28, 32, 35, 36, 38, 40, 48, 49, 54, 57, 61, 63, 66, 68, 69, 70, 71, 75, 76, 78, 80, 90, 91, 96, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "jump cut" =============== +============ Value of Rand Index = 0.5341414141414141 ================================= +============ Partial average Rand Index = 0.5414108296075512 ====== +============ Value of Adjusted Rand Index = 0.07262845228835206 ================================= +============ Partial average of Adjusted Rand Index = 0.07294390199170374 ================================= +============ Value of Jaccard Index = 0.3173475429248076 ================================= +============ Partial average of Jaccard Index = 0.43866265688259304 ====== +============ Precision = 0.4262295081967213, Recall = 0.5306122448979592, F1 = 0.4727272727272728 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 61.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 62 : "family reunion" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 4, 5, 6, 7, 8, 9, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 26, 27, 29, 30, 31, 32, 33, 36, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 51, 53, 54, 55, 56, 57, 58, 59, 60, 61, 63, 64, 65, 67, 68, 70, 73, 74, 75, 76, 77, 78, 80, 81, 82, 83, 84, 85, 87, 90, 91, 93, 94, 95, 96, 98, 100] +The cluster 2 contains the snippets: [10, 62, 71, 79, 86, 88, 92, 99] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 10, 3, 62, 4, 71, 5, 79, 6, 86, 7, 88, 8, 92, 9, 99, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 26, 27, 29, 30, 31, 32, 33, 36, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 51, 53, 54, 55, 56, 57, 58, 59, 60, 61, 63, 64, 65, 67, 68, 70, 73, 74, 75, 76, 77, 78, 80, 81, 82, 83, 84, 85, 87, 90, 91, 93, 94, 95, 96, 98, 100, 1, 12, 20, 25, 28, 34, 35, 37, 43, 50, 52, 66, 69, 72, 89, 97] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "family reunion" =============== +============ Value of Rand Index = 0.56 ================================= +============ Partial average Rand Index = 0.5417106549364616 ====== +============ Value of Adjusted Rand Index = 0.13222481937951555 ================================= +============ Partial average of Adjusted Rand Index = 0.07390004582053941 ================================= +============ Value of Jaccard Index = 0.4181138124499065 ================================= +============ Partial average of Jaccard Index = 0.43833122390787227 ====== +============ Precision = 0.6309523809523809, Recall = 0.8153846153846154, F1 = 0.7114093959731543 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 42.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 63 : "rookie of the year" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "rookie of the year" =============== +============ Value of Rand Index = 0.5927272727272728 ================================= +============ Partial average Rand Index = 0.5425204425204427 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.07272702922021339 ================================= +============ Value of Jaccard Index = 0.5927272727272728 ================================= +============ Partial average of Jaccard Index = 0.44078195484151356 ====== +============ Precision = 0.75, Recall = 0.9146341463414634, F1 = 0.8241758241758242 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 64 : "junk mail" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 6, 8, 10, 12, 13, 15, 16, 17, 18, 20, 22, 24, 25, 26, 27, 28, 30, 31, 33, 35, 38, 40, 41, 43, 44, 45, 47, 48, 49, 50, 51, 52, 55, 56, 58, 60, 62, 63, 64, 65, 67, 68, 69, 70, 72, 73, 75, 78, 79, 80, 81, 82, 83, 84, 86, 87, 89, 90, 94, 95, 96, 97] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 6, 8, 10, 12, 13, 15, 16, 17, 18, 20, 22, 24, 25, 26, 27, 28, 30, 31, 33, 35, 38, 40, 41, 43, 44, 45, 47, 48, 49, 50, 51, 52, 55, 56, 58, 60, 62, 63, 64, 65, 67, 68, 69, 70, 72, 73, 75, 78, 79, 80, 81, 82, 83, 84, 86, 87, 89, 90, 94, 95, 96, 97, 4, 5, 7, 9, 11, 14, 19, 21, 23, 29, 32, 34, 36, 37, 39, 42, 46, 53, 54, 57, 59, 61, 66, 71, 74, 76, 77, 85, 88, 91, 92, 93, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "junk mail" =============== +============ Value of Rand Index = 0.6234343434343435 ================================= +============ Partial average Rand Index = 0.5437847222222224 ====== +============ Value of Adjusted Rand Index = 0.20907593928586068 ================================= +============ Partial average of Adjusted Rand Index = 0.07485748093998913 ================================= +============ Value of Jaccard Index = 0.4826533444351929 ================================= +============ Partial average of Jaccard Index = 0.4414361953039148 ====== +============ Precision = 0.676923076923077, Recall = 0.4230769230769231, F1 = 0.5207100591715975 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 65.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 65 : "little brother" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [3, 4, 6, 8, 9, 10, 12, 13, 14, 15, 16, 23, 25, 27, 28, 29, 30, 32, 33, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 48, 50, 52, 54, 56, 58, 59, 60, 64, 68, 70, 73, 77, 79, 80, 81, 82, 84, 86, 87, 89, 90, 91, 93, 96, 97, 99, 100] +The cluster 2 contains the snippets: [1, 2, 5, 7, 11, 17, 19, 20, 21, 22, 24, 31, 43, 47, 49, 51, 53, 55, 61, 62, 65, 66, 67, 69, 71, 72, 74, 75, 76, 78, 83, 85, 88, 92, 95, 98] +The cluster 3 contains the snippets: [18, 26, 34, 35, 57, 94] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 1, 18, 4, 2, 26, 6, 5, 34, 8, 7, 35, 9, 11, 57, 10, 17, 94, 12, 19, 13, 20, 14, 21, 15, 22, 16, 24, 23, 31, 25, 43, 27, 47, 28, 49, 29, 51, 30, 53, 32, 55, 33, 61, 36, 62, 37, 65, 38, 66, 39, 67, 40, 69, 41, 71, 42, 72, 44, 74, 45, 75, 46, 76, 48, 78, 50, 83, 52, 85, 54, 88, 56, 92, 58, 95, 59, 98, 60, 64, 68, 70, 73, 77, 79, 80, 81, 82, 84, 86, 87, 89, 90, 91, 93, 96, 97, 99, 100, 63] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "little brother" =============== +============ Value of Rand Index = 0.5193939393939394 ================================= +============ Partial average Rand Index = 0.5434094794094797 ====== +============ Value of Adjusted Rand Index = 0.02625237585638743 ================================= +============ Partial average of Adjusted Rand Index = 0.07410971009254912 ================================= +============ Value of Jaccard Index = 0.2959455460195324 ================================= +============ Partial average of Jaccard Index = 0.43919787762261653 ====== +============ Precision = 0.26262626262626265, Recall = 0.6842105263157895, F1 = 0.3795620437956205 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 33.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 66 : "lost in space" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 20, 21, 22, 23, 25, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 52, 53, 54, 55, 56, 57, 59, 60, 62, 63, 65, 66, 67, 68, 69, 70, 71, 72, 73, 75, 76, 77, 78, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99] +The cluster 2 contains the snippets: [15, 19, 46, 79, 92] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 15, 2, 19, 3, 46, 4, 79, 5, 92, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 20, 21, 22, 23, 25, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 52, 53, 54, 55, 56, 57, 59, 60, 62, 63, 65, 66, 67, 68, 69, 70, 71, 72, 73, 75, 76, 77, 78, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 24, 29, 51, 58, 61, 64, 74, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "lost in space" =============== +============ Value of Rand Index = 0.4496969696969697 ================================= +============ Partial average Rand Index = 0.5419895928986841 ====== +============ Value of Adjusted Rand Index = 0.0375200235264351 ================================= +============ Partial average of Adjusted Rand Index = 0.07355532090215344 ================================= +============ Value of Jaccard Index = 0.3393160320155227 ================================= +============ Partial average of Jaccard Index = 0.43768451632553934 ====== +============ Precision = 0.41304347826086957, Recall = 0.6785714285714286, F1 = 0.5135135135135135 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 46.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 67 : "the game of life" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33, 35, 37, 38, 39, 40, 41, 42, 43, 45, 46, 47, 48, 49, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 67, 68, 69, 70, 71, 72, 73, 74, 77, 78, 79, 80, 81, 84, 85, 86, 87, 88, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33, 35, 37, 38, 39, 40, 41, 42, 43, 45, 46, 47, 48, 49, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 67, 68, 69, 70, 71, 72, 73, 74, 77, 78, 79, 80, 81, 84, 85, 86, 87, 88, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 5, 21, 29, 34, 36, 44, 50, 51, 64, 66, 75, 76, 82, 83, 89, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the game of life" =============== +============ Value of Rand Index = 0.44686868686868686 ================================= +============ Partial average Rand Index = 0.5405698778833109 ====== +============ Value of Adjusted Rand Index = -0.06251522851474117 ================================= +============ Partial average of Adjusted Rand Index = 0.07152441717951322 ================================= +============ Value of Jaccard Index = 0.3629595160539786 ================================= +============ Partial average of Jaccard Index = 0.4365692178140235 ====== +============ Precision = 0.27380952380952384, Recall = 0.6216216216216216, F1 = 0.38016528925619836 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 84.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 68 : "field of fire" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 3 contains the snippets: [1, 5, 8, 9, 16, 18, 20, 21, 22, 23, 28, 30, 31, 32, 33, 34, 35, 37, 38, 40, 41, 43, 44, 46, 47, 48, 50, 55, 56, 57, 58, 60, 67, 70, 71, 75, 76, 77, 79, 80, 82, 83, 84, 85, 88, 91, 92, 94, 95, 96, 97, 98, 100] +The cluster 1 contains the snippets: [2, 4, 6, 10, 12, 13, 14, 15, 19, 27, 36, 42, 45, 49, 51, 52, 53, 54, 62, 63, 64, 65, 66, 68, 69, 72, 73, 74, 78, 81, 86, 87, 89, 90, 93, 99] +The cluster 2 contains the snippets: [25, 59] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 25, 1, 4, 59, 5, 6, 8, 10, 9, 12, 16, 13, 18, 14, 20, 15, 21, 19, 22, 27, 23, 36, 28, 42, 30, 45, 31, 49, 32, 51, 33, 52, 34, 53, 35, 54, 37, 62, 38, 63, 40, 64, 41, 65, 43, 66, 44, 68, 46, 69, 47, 72, 48, 73, 50, 74, 55, 78, 56, 81, 57, 86, 58, 87, 60, 89, 67, 90, 70, 93, 71, 99, 75, 76, 77, 79, 80, 82, 83, 84, 85, 88, 91, 92, 94, 95, 96, 97, 98, 100, 3, 7, 11, 17, 24, 26, 29, 39, 61] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "field of fire" =============== +============ Value of Rand Index = 0.5509090909090909 ================================= +============ Partial average Rand Index = 0.5407219251336901 ====== +============ Value of Adjusted Rand Index = 0.026586131582509106 ================================= +============ Partial average of Adjusted Rand Index = 0.0708635600383808 ================================= +============ Value of Jaccard Index = 0.2119815668202765 ================================= +============ Partial average of Jaccard Index = 0.43326645824058607 ====== +============ Precision = 0.3076923076923077, Recall = 0.5, F1 = 0.380952380952381 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 30.333333333333332 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 69 : "citizen of the world" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 48, 49, 50, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 70, 72, 73, 75, 77, 79, 80, 81, 82, 83, 84, 86, 87, 88, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 4, 5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 48, 49, 50, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 70, 72, 73, 75, 77, 79, 80, 81, 82, 83, 84, 86, 87, 88, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 3, 9, 21, 22, 40, 47, 51, 69, 71, 74, 76, 78, 85, 94, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "citizen of the world" =============== +============ Value of Rand Index = 0.6882828282828283 ================================= +============ Partial average Rand Index = 0.5428604889474457 ====== +============ Value of Adjusted Rand Index = 0.06606255133872378 ================================= +============ Partial average of Adjusted Rand Index = 0.0707939802021539 ================================= +============ Value of Jaccard Index = 0.6785416666666667 ================================= +============ Partial average of Jaccard Index = 0.43682117140618143 ====== +============ Precision = 0.047058823529411764, Recall = 0.5714285714285714, F1 = 0.08695652173913043 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 85.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 70 : "bad to the bone" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "bad to the bone" =============== +============ Value of Rand Index = 0.4581818181818182 ================================= +============ Partial average Rand Index = 0.5416507936507938 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.06978263762783742 ================================= +============ Value of Jaccard Index = 0.4581818181818182 ================================= +============ Partial average of Jaccard Index = 0.43712632350297626 ====== +============ Precision = 0.25, Recall = 0.6756756756756757, F1 = 0.36496350364963503 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 71 : "cats and dogs" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 51, 52, 53, 54, 55, 56, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 51, 52, 53, 54, 55, 56, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 1, 16, 24, 42, 50, 57] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "cats and dogs" =============== +============ Value of Rand Index = 0.7284848484848485 ================================= +============ Partial average Rand Index = 0.5442822592118368 ====== +============ Value of Adjusted Rand Index = 0.02563507713722283 ================================= +============ Partial average of Adjusted Rand Index = 0.06916084100120903 ================================= +============ Value of Jaccard Index = 0.7206982543640897 ================================= +============ Partial average of Jaccard Index = 0.44112029436017497 ====== +============ Precision = 0.11702127659574468, Recall = 0.9166666666666666, F1 = 0.20754716981132076 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 94.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 72 : "division by zero" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 5, 7, 11, 12, 14, 15, 17, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 31, 32, 35, 37, 40, 42, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 63, 64, 65, 66, 67, 68, 70, 71, 73, 74, 75, 79, 81, 85, 86, 87, 88, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 4, 5, 7, 11, 12, 14, 15, 17, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 31, 32, 35, 37, 40, 42, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 63, 64, 65, 66, 67, 68, 70, 71, 73, 74, 75, 79, 81, 85, 86, 87, 88, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 3, 6, 8, 9, 10, 13, 16, 18, 25, 30, 33, 34, 36, 38, 39, 41, 43, 44, 45, 49, 59, 60, 61, 62, 69, 72, 76, 77, 78, 80, 82, 83, 84, 89] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "division by zero" =============== +============ Value of Rand Index = 0.7004040404040404 ================================= +============ Partial average Rand Index = 0.5464506172839507 ====== +============ Value of Adjusted Rand Index = 0.3865601309130211 ================================= +============ Partial average of Adjusted Rand Index = 0.07356916447220645 ================================= +============ Value of Jaccard Index = 0.5976668475311991 ================================= +============ Partial average of Jaccard Index = 0.4432945520431059 ====== +============ Precision = 0.9696969696969697, Recall = 0.7111111111111111, F1 = 0.8205128205128205 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 66.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 73 : "hair of the dog" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "hair of the dog" =============== +============ Value of Rand Index = 0.44727272727272727 ================================= +============ Partial average Rand Index = 0.5450920160509203 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.07256136769861457 ================================= +============ Value of Jaccard Index = 0.44727272727272727 ================================= +============ Partial average of Jaccard Index = 0.4433490475941967 ====== +============ Precision = 0.15, Recall = 0.40540540540540543, F1 = 0.21897810218978103 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 74 : "freedom of the press" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "freedom of the press" =============== +============ Value of Rand Index = 0.642020202020202 ================================= +============ Partial average Rand Index = 0.5464018564018566 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.07158080867566033 ================================= +============ Value of Jaccard Index = 0.642020202020202 ================================= +============ Partial average of Jaccard Index = 0.4460337929242777 ====== +============ Precision = 0.78, Recall = 0.8125, F1 = 0.7959183673469388 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 75 : "bat boy" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 6, 9, 10, 11, 12, 13, 14, 15, 16, 19, 20, 23, 24, 25, 27, 28, 29, 30, 31, 33, 34, 36, 37, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 59, 61, 62, 63, 64, 65, 66, 68, 70, 71, 72, 73, 76, 77, 78, 79, 81, 82, 83, 85, 86, 87, 88, 89, 90, 93, 97, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 6, 9, 10, 11, 12, 13, 14, 15, 16, 19, 20, 23, 24, 25, 27, 28, 29, 30, 31, 33, 34, 36, 37, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 59, 61, 62, 63, 64, 65, 66, 68, 70, 71, 72, 73, 76, 77, 78, 79, 81, 82, 83, 85, 86, 87, 88, 89, 90, 93, 97, 100, 5, 7, 8, 17, 18, 21, 22, 26, 32, 35, 38, 41, 57, 60, 67, 69, 74, 75, 80, 84, 91, 92, 94, 95, 96, 98, 99] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "bat boy" =============== +============ Value of Rand Index = 0.5987878787878788 ================================= +============ Partial average Rand Index = 0.5471003367003369 ====== +============ Value of Adjusted Rand Index = 0.2163895614051988 ================================= +============ Partial average of Adjusted Rand Index = 0.0735115920453875 ================================= +============ Value of Jaccard Index = 0.4209912536443149 ================================= +============ Partial average of Jaccard Index = 0.44569989240054486 ====== +============ Precision = 0.6301369863013698, Recall = 0.71875, F1 = 0.6715328467153284 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 73.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 76 : "fast food nation" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 12, 14, 16, 17, 18, 19, 21, 23, 25, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 42, 44, 45, 47, 48, 49, 50, 52, 53, 55, 57, 59, 61, 62, 64, 65, 67, 69, 70, 71, 73, 74, 77, 79, 80, 81, 83, 84, 85, 86, 90, 91, 92, 93, 94, 95, 96, 97, 98] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 12, 14, 16, 17, 18, 19, 21, 23, 25, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 42, 44, 45, 47, 48, 49, 50, 52, 53, 55, 57, 59, 61, 62, 64, 65, 67, 69, 70, 71, 73, 74, 77, 79, 80, 81, 83, 84, 85, 86, 90, 91, 92, 93, 94, 95, 96, 97, 98, 10, 11, 13, 15, 20, 22, 24, 29, 30, 37, 41, 43, 46, 51, 54, 56, 58, 60, 63, 66, 68, 72, 75, 76, 78, 82, 87, 88, 89, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "fast food nation" =============== +============ Value of Rand Index = 0.601010101010101 ================================= +============ Partial average Rand Index = 0.5478096757044127 ====== +============ Value of Adjusted Rand Index = 0.2109254361154005 ================================= +============ Partial average of Adjusted Rand Index = 0.07531966894104554 ================================= +============ Value of Jaccard Index = 0.42302074203914697 ================================= +============ Partial average of Jaccard Index = 0.4454014825273686 ====== +============ Precision = 0.6666666666666666, Recall = 0.5111111111111111, F1 = 0.5786163522012578 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 69.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 77 : "the da vinci code" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 71, 72, 73, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 71, 72, 73, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 23, 70, 74] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the da vinci code" =============== +============ Value of Rand Index = 0.3115151515151515 ================================= +============ Partial average Rand Index = 0.5447409156500067 ====== +============ Value of Adjusted Rand Index = -0.00764971238990862 ================================= +============ Partial average of Adjusted Rand Index = 0.07424214450817601 ================================= +============ Value of Jaccard Index = 0.2832807570977918 ================================= +============ Partial average of Jaccard Index = 0.44329601856075074 ====== +============ Precision = 0.36082474226804123, Recall = 0.5, F1 = 0.41916167664670656 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 97.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 78 : "civil war" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +The cluster 2 contains the snippets: [14] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 14, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "civil war" =============== +============ Value of Rand Index = 0.4385858585858586 ================================= +============ Partial average Rand Index = 0.5433799533799535 ====== +============ Value of Adjusted Rand Index = -0.006840282306566421 ================================= +============ Partial average of Adjusted Rand Index = 0.07320262621567931 ================================= +============ Value of Jaccard Index = 0.4333197389885807 ================================= +============ Partial average of Jaccard Index = 0.44316811754059476 ====== +============ Precision = 0.54, Recall = 0.8852459016393442, F1 = 0.670807453416149 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 50.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 79 : "trip the light fantastic" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 3, 5, 6, 8, 11, 15, 16, 17, 24, 25, 29, 32, 33, 42, 45, 47, 59, 69, 75, 76, 82, 84, 87, 94, 95, 97] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 3, 5, 6, 8, 11, 15, 16, 17, 24, 25, 29, 32, 33, 42, 45, 47, 59, 69, 75, 76, 82, 84, 87, 94, 95, 97, 2, 4, 7, 9, 10, 12, 13, 14, 18, 19, 20, 21, 22, 23, 26, 27, 28, 30, 31, 34, 35, 36, 37, 38, 39, 40, 41, 43, 44, 46, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63, 64, 65, 66, 67, 68, 70, 71, 72, 73, 74, 77, 78, 79, 80, 81, 83, 85, 86, 88, 89, 90, 91, 92, 93, 96, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "trip the light fantastic" =============== +============ Value of Rand Index = 0.6834343434343434 ================================= +============ Partial average Rand Index = 0.5451527937603887 ====== +============ Value of Adjusted Rand Index = 0.34958349495952673 ================================= +============ Partial average of Adjusted Rand Index = 0.07670111822509512 ================================= +============ Value of Jaccard Index = 0.5732570806100218 ================================= +============ Partial average of Jaccard Index = 0.4448148132756508 ====== +============ Precision = 0.4074074074074074, Recall = 0.4230769230769231, F1 = 0.4150943396226415 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 27.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 80 : "ace of spades" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 3, 5, 8, 13, 14, 16, 18, 20, 25, 26, 35, 36, 48, 51, 55, 56, 58, 62, 64, 66, 67, 68, 69, 80, 87, 88, 90, 92, 94, 97] +The cluster 2 contains the snippets: [2, 7, 19, 21, 33, 34, 38, 39, 44, 45, 47, 49, 50, 54, 57, 59, 70, 71, 74, 75, 76, 78, 79, 81, 85, 96, 98] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 7, 5, 19, 8, 21, 13, 33, 14, 34, 16, 38, 18, 39, 20, 44, 25, 45, 26, 47, 35, 49, 36, 50, 48, 54, 51, 57, 55, 59, 56, 70, 58, 71, 62, 74, 64, 75, 66, 76, 67, 78, 68, 79, 69, 81, 80, 85, 87, 96, 88, 98, 90, 92, 94, 97, 4, 6, 9, 10, 11, 12, 15, 17, 22, 23, 24, 27, 28, 29, 30, 31, 32, 37, 40, 41, 42, 43, 46, 52, 53, 60, 61, 63, 65, 72, 73, 77, 82, 83, 84, 86, 89, 91, 93, 95, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "ace of spades" =============== +============ Value of Rand Index = 0.5987878787878788 ================================= +============ Partial average Rand Index = 0.5458232323232324 ====== +============ Value of Adjusted Rand Index = 0.17033911050144238 ================================= +============ Partial average of Adjusted Rand Index = 0.07787159312854945 ================================= +============ Value of Jaccard Index = 0.3251783893985729 ================================= +============ Partial average of Jaccard Index = 0.44331935797718736 ====== +============ Precision = 0.27586206896551724, Recall = 0.47058823529411764, F1 = 0.34782608695652173 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 29.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 81 : "charles de gaulle" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99] +The cluster 2 contains the snippets: [100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 100, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 73] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "charles de gaulle" =============== +============ Value of Rand Index = 0.2577777777777778 ================================= +============ Partial average Rand Index = 0.542267115600449 ====== +============ Value of Adjusted Rand Index = 0.0023272064821659158 ================================= +============ Partial average of Adjusted Rand Index = 0.07693894637982866 ================================= +============ Value of Jaccard Index = 0.2337851929092805 ================================= +============ Partial average of Jaccard Index = 0.4407325164331391 ====== +============ Precision = 0.3434343434343434, Recall = 0.4657534246575342, F1 = 0.3953488372093023 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 49.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 82 : "dive bomber" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 5, 6, 7, 8, 9, 10, 11, 12, 15, 16, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 52, 53, 54, 55, 57, 59, 60, 61, 62, 64, 65, 67, 68, 70, 71, 72, 73, 74, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 5, 6, 7, 8, 9, 10, 11, 12, 15, 16, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 52, 53, 54, 55, 57, 59, 60, 61, 62, 64, 65, 67, 68, 70, 71, 72, 73, 74, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 4, 13, 14, 19, 28, 46, 56, 58, 63, 66, 69, 75, 84] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "dive bomber" =============== +============ Value of Rand Index = 0.4985858585858586 ================================= +============ Partial average Rand Index = 0.5417344173441736 ====== +============ Value of Adjusted Rand Index = 0.12736547603573817 ================================= +============ Partial average of Adjusted Rand Index = 0.07755390405855928 ================================= +============ Value of Jaccard Index = 0.3868577075098814 ================================= +============ Partial average of Jaccard Index = 0.44007550656822125 ====== +============ Precision = 0.5747126436781609, Recall = 0.6944444444444444, F1 = 0.6289308176100629 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 87.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 83 : "catch a fire" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 5, 15, 21, 25, 26, 27, 28, 29, 30, 33, 37, 38, 40, 45, 47, 49, 53, 54, 55, 56, 61, 64, 65, 66, 68, 69, 71, 74, 75, 76, 78, 79, 80, 81, 82, 84, 86, 89, 90, 91, 92, 93, 95] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 3, 5, 15, 21, 25, 26, 27, 28, 29, 30, 33, 37, 38, 40, 45, 47, 49, 53, 54, 55, 56, 61, 64, 65, 66, 68, 69, 71, 74, 75, 76, 78, 79, 80, 81, 82, 84, 86, 89, 90, 91, 92, 93, 95, 1, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 22, 23, 24, 31, 32, 34, 35, 36, 39, 41, 42, 43, 44, 46, 48, 50, 51, 52, 57, 58, 59, 60, 62, 63, 67, 70, 72, 73, 77, 83, 85, 87, 88, 94, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "catch a fire" =============== +============ Value of Rand Index = 0.5305050505050505 ================================= +============ Partial average Rand Index = 0.5415991237677986 ====== +============ Value of Adjusted Rand Index = 0.06101010101010101 ================================= +============ Partial average of Adjusted Rand Index = 0.0773545811302646 ================================= +============ Value of Jaccard Index = 0.41253791708796766 ================================= +============ Partial average of Jaccard Index = 0.43974372838171216 ====== +============ Precision = 0.6888888888888889, Recall = 0.34831460674157305, F1 = 0.4626865671641791 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 45.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 84 : "middle ages" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 26, 82, 85] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "middle ages" =============== +============ Value of Rand Index = 0.5923232323232324 ================================= +============ Partial average Rand Index = 0.5422029822029822 ====== +============ Value of Adjusted Rand Index = 0.08989727759103339 ================================= +============ Partial average of Adjusted Rand Index = 0.07750389894527375 ================================= +============ Value of Jaccard Index = 0.5726387124099958 ================================= +============ Partial average of Jaccard Index = 0.441325811524906 ====== +============ Precision = 0.7319587628865979, Recall = 0.9342105263157895, F1 = 0.8208092485549132 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 97.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 85 : "the marquise of o" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the marquise of o" =============== +============ Value of Rand Index = 0.3527272727272727 ================================= +============ Partial average Rand Index = 0.5399738562091505 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.076592088369447 ================================= +============ Value of Jaccard Index = 0.3527272727272727 ================================= +============ Partial average of Jaccard Index = 0.4402834757743456 ====== +============ Precision = 0.46, Recall = 0.6571428571428571, F1 = 0.5411764705882354 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 86 : "sean fallon" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "sean fallon" =============== +============ Value of Rand Index = 0.8317171717171717 ================================= +============ Partial average Rand Index = 0.5433662203429647 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.0757014826907325 ================================= +============ Value of Jaccard Index = 0.8317171717171717 ================================= +============ Partial average of Jaccard Index = 0.444835030378332 ====== +============ Precision = 0.07, Recall = 0.7777777777777778, F1 = 0.12844036697247707 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 87 : "tower of babel" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 4, 5, 6, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 31, 32, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 67, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 97, 98, 100] +The cluster 2 contains the snippets: [1, 3, 7, 9, 27, 29, 30, 33, 38, 54, 65, 68, 96] +The cluster 3 contains the snippets: [84] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 1, 84, 4, 3, 5, 7, 6, 9, 8, 27, 10, 29, 11, 30, 12, 33, 13, 38, 14, 54, 15, 65, 16, 68, 17, 96, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 31, 32, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 67, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 97, 98, 100, 66, 82, 99] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "tower of babel" =============== +============ Value of Rand Index = 0.4074747474747475 ================================= +============ Partial average Rand Index = 0.5418042493904563 ====== +============ Value of Adjusted Rand Index = 0.056714532366360176 ================================= +============ Partial average of Adjusted Rand Index = 0.07548324188240638 ================================= +============ Value of Jaccard Index = 0.20038167938931298 ================================= +============ Partial average of Jaccard Index = 0.4420252217462743 ====== +============ Precision = 0.25773195876288657, Recall = 0.390625, F1 = 0.3105590062111801 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 32.333333333333336 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 88 : "special edition" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 2 contains the snippets: [1, 2, 3, 4, 7, 9, 10, 14, 19, 23, 25, 26, 27, 30, 32, 35, 36, 37, 40, 41, 42, 46, 47, 48, 49, 50, 51, 52, 54, 57, 61, 64, 67, 68, 70, 71, 72, 73, 75, 76, 78, 80, 81, 82, 83, 84, 85, 86, 87, 88, 91, 92, 93, 95, 96, 97, 98] +The cluster 1 contains the snippets: [5, 6, 8, 11, 12, 13, 15, 16, 17, 18, 20, 21, 22, 24, 28, 29, 31, 33, 34, 38, 39, 43, 44, 45, 53, 55, 56, 58, 59, 60, 62, 63, 65, 66, 69, 74, 77, 79, 89, 90, 94, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [5, 1, 6, 2, 8, 3, 11, 4, 12, 7, 13, 9, 15, 10, 16, 14, 17, 19, 18, 23, 20, 25, 21, 26, 22, 27, 24, 30, 28, 32, 29, 35, 31, 36, 33, 37, 34, 40, 38, 41, 39, 42, 43, 46, 44, 47, 45, 48, 53, 49, 55, 50, 56, 51, 58, 52, 59, 54, 60, 57, 62, 61, 63, 64, 65, 67, 66, 68, 69, 70, 74, 71, 77, 72, 79, 73, 89, 75, 90, 76, 94, 78, 99, 80, 100, 81, 82, 83, 84, 85, 86, 87, 88, 91, 92, 93, 95, 96, 97, 98] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "special edition" =============== +============ Value of Rand Index = 0.49777777777777776 ================================= +============ Partial average Rand Index = 0.541303948576676 ====== +============ Value of Adjusted Rand Index = -0.013105488537698905 ================================= +============ Partial average of Adjusted Rand Index = 0.07447655176399609 ================================= +============ Value of Jaccard Index = 0.4843393486828459 ================================= +============ Partial average of Jaccard Index = 0.4425060640978263 ====== +============ Precision = 0.02, Recall = 0.6666666666666666, F1 = 0.038834951456310676 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 50.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 89 : "the colour of magic" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 28, 29, 31, 33, 34, 35, 36, 37, 38, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 57, 59, 60, 62, 63, 64, 65, 66, 67, 69, 70, 72, 73, 75, 77, 78, 81, 82, 83, 85, 86, 88, 89, 90, 91, 92, 93, 94, 96, 97, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 28, 29, 31, 33, 34, 35, 36, 37, 38, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 57, 59, 60, 62, 63, 64, 65, 66, 67, 69, 70, 72, 73, 75, 77, 78, 81, 82, 83, 85, 86, 88, 89, 90, 91, 92, 93, 94, 96, 97, 99, 100, 3, 22, 26, 27, 30, 32, 39, 40, 54, 58, 61, 68, 71, 74, 76, 79, 80, 84, 87, 95, 98] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the colour of magic" =============== +============ Value of Rand Index = 0.49818181818181817 ================================= +============ Partial average Rand Index = 0.5408194302576327 ====== +============ Value of Adjusted Rand Index = 0.07420311671539559 ================================= +============ Partial average of Adjusted Rand Index = 0.07447347946007923 ================================= +============ Value of Jaccard Index = 0.3402390438247012 ================================= +============ Partial average of Jaccard Index = 0.441356996454308 ====== +============ Precision = 0.5063291139240507, Recall = 0.5970149253731343, F1 = 0.547945205479452 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 79.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 90 : "iron butterly" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "iron butterly" =============== +============ Value of Rand Index = 0.4595959595959596 ================================= +============ Partial average Rand Index = 0.5399169472502807 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.07364599635496724 ================================= +============ Value of Jaccard Index = 0.4595959595959596 ================================= +============ Partial average of Jaccard Index = 0.4415596516003263 ====== +============ Precision = 0.55, Recall = 0.9166666666666666, F1 = 0.6874999999999999 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 91 : "reign of terror" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 88, 89, 90, 92, 93, 94, 95, 97, 98, 99, 100] +The cluster 3 contains the snippets: [23, 53, 63, 65, 66, 67, 68] +The cluster 2 contains the snippets: [43, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 43, 23, 2, 64, 53, 3, 63, 4, 65, 5, 66, 6, 67, 7, 68, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 88, 89, 90, 92, 93, 94, 95, 97, 98, 99, 100, 32, 84, 91, 96] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "reign of terror" =============== +============ Value of Rand Index = 0.46989898989898987 ================================= +============ Partial average Rand Index = 0.5391475191475191 ====== +============ Value of Adjusted Rand Index = -0.012301337966708887 ================================= +============ Partial average of Adjusted Rand Index = 0.07270152015363014 ================================= +============ Value of Jaccard Index = 0.3928736695974086 ================================= +============ Partial average of Jaccard Index = 0.44102464080908543 ====== +============ Precision = 0.3020833333333333, Recall = 0.7631578947368421, F1 = 0.43283582089552236 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 32.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 92 : "heavy rotation" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 27, 40, 89] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "heavy rotation" =============== +============ Value of Rand Index = 0.4402020202020202 ================================= +============ Partial average Rand Index = 0.5380720245937638 ====== +============ Value of Adjusted Rand Index = -0.03349537134162147 ================================= +============ Partial average of Adjusted Rand Index = 0.07154720611563828 ================================= +============ Value of Jaccard Index = 0.4270057899090157 ================================= +============ Partial average of Jaccard Index = 0.4408722619949543 ====== +============ Precision = 0.2268041237113402, Recall = 0.5641025641025641, F1 = 0.32352941176470584 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 97.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 93 : "the edge of heaven" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [48, 50, 55, 57, 90, 92, 96, 99] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [48, 50, 55, 57, 90, 92, 96, 99, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 49, 51, 52, 53, 54, 56, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 91, 93, 94, 95, 97, 98, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the edge of heaven" =============== +============ Value of Rand Index = 0.5133333333333333 ================================= +============ Partial average Rand Index = 0.537806017160856 ====== +============ Value of Adjusted Rand Index = 0.08192084958285689 ================================= +============ Partial average of Adjusted Rand Index = 0.07165875066904923 ================================= +============ Value of Jaccard Index = 0.4577987846049966 ================================= +============ Partial average of Jaccard Index = 0.441054267614417 ====== +============ Precision = 0.375, Recall = 0.058823529411764705, F1 = 0.10169491525423728 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 8.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 94 : "top of the pops" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "top of the pops" =============== +============ Value of Rand Index = 0.49656565656565654 ================================= +============ Partial average Rand Index = 0.5373672899204816 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.07089642353427211 ================================= +============ Value of Jaccard Index = 0.49656565656565654 ================================= +============ Partial average of Jaccard Index = 0.4416448143053877 ====== +============ Precision = 0.62, Recall = 0.9393939393939394, F1 = 0.7469879518072288 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 95 : "manor house" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 72] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "manor house" =============== +============ Value of Rand Index = 0.6585858585858586 ================================= +============ Partial average Rand Index = 0.5386432748538013 ====== +============ Value of Adjusted Rand Index = -0.016174295467710403 ================================= +============ Partial average of Adjusted Rand Index = 0.06997988965004072 ================================= +============ Value of Jaccard Index = 0.6572703305617522 ================================= +============ Partial average of Jaccard Index = 0.44391455658177054 ====== +============ Precision = 0.12121212121212122, Recall = 0.6, F1 = 0.20168067226890757 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 99.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 96 : "bus driver" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 75, 76] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "bus driver" =============== +============ Value of Rand Index = 0.4214141414141414 ================================= +============ Partial average Rand Index = 0.5374221380471381 ====== +============ Value of Adjusted Rand Index = -0.0016153769096722268 ================================= +============ Partial average of Adjusted Rand Index = 0.06923410562337703 ================================= +============ Value of Jaccard Index = 0.4078974571015092 ================================= +============ Partial average of Jaccard Index = 0.4435393784621844 ====== +============ Precision = 0.5816326530612245, Recall = 0.6263736263736264, F1 = 0.603174603174603 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 98.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 97 : "american beauty" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 8, 11, 13, 14, 16, 17, 19, 20, 21, 22, 24, 27, 28, 31, 32, 33, 35, 36, 37, 38, 39, 40, 41, 44, 45, 47, 48, 49, 52, 53, 54, 55, 57, 58, 60, 61, 62, 63, 66, 67, 68, 69, 71, 75, 76, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 93, 95, 96, 97, 98, 99, 100] +The cluster 2 contains the snippets: [10, 18, 30, 59, 72, 77, 78] +The cluster 3 contains the snippets: [46, 56, 94] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 10, 46, 2, 18, 56, 3, 30, 94, 4, 59, 5, 72, 6, 77, 8, 78, 11, 13, 14, 16, 17, 19, 20, 21, 22, 24, 27, 28, 31, 32, 33, 35, 36, 37, 38, 39, 40, 41, 44, 45, 47, 48, 49, 52, 53, 54, 55, 57, 58, 60, 61, 62, 63, 66, 67, 68, 69, 71, 75, 76, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 93, 95, 96, 97, 98, 99, 100, 7, 9, 12, 15, 23, 25, 26, 29, 34, 42, 43, 50, 51, 64, 65, 70, 73, 74, 92] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "american beauty" =============== +============ Value of Rand Index = 0.47535353535353536 ================================= +============ Partial average Rand Index = 0.5367822555451424 ====== +============ Value of Adjusted Rand Index = -0.054019617408872116 ================================= +============ Partial average of Adjusted Rand Index = 0.06796344868490024 ================================= +============ Value of Jaccard Index = 0.3413644433172711 ================================= +============ Partial average of Jaccard Index = 0.4424860286153299 ====== +============ Precision = 0.32098765432098764, Recall = 0.8125, F1 = 0.4601769911504424 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 27.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 98 : "soldier of fortune" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 4, 8, 9, 10, 12, 15, 16, 19, 21, 26, 27, 28, 31, 32, 34, 35, 38, 39, 40, 41, 42, 43, 45, 49, 50, 52, 53, 54, 55, 56, 57, 61, 63, 72, 74, 75, 77, 81, 82, 84, 86, 87, 89, 90, 91, 95, 96, 98, 99, 100] +The cluster 2 contains the snippets: [1, 5, 11, 23, 33, 37, 44, 46, 48, 58, 62, 64, 68, 70, 78, 80, 83, 85, 92, 93, 94] +The cluster 3 contains the snippets: [7, 20, 24] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 1, 7, 3, 5, 20, 4, 11, 24, 8, 23, 9, 33, 10, 37, 12, 44, 15, 46, 16, 48, 19, 58, 21, 62, 26, 64, 27, 68, 28, 70, 31, 78, 32, 80, 34, 83, 35, 85, 38, 92, 39, 93, 40, 94, 41, 42, 43, 45, 49, 50, 52, 53, 54, 55, 56, 57, 61, 63, 72, 74, 75, 77, 81, 82, 84, 86, 87, 89, 90, 91, 95, 96, 98, 99, 100, 6, 13, 14, 17, 18, 22, 25, 29, 30, 36, 47, 51, 59, 60, 65, 66, 67, 69, 71, 73, 76, 79, 88, 97] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "soldier of fortune" =============== +============ Value of Rand Index = 0.6323232323232323 ================================= +============ Partial average Rand Index = 0.5377571634714493 ====== +============ Value of Adjusted Rand Index = 0.1571212448670845 ================================= +============ Partial average of Adjusted Rand Index = 0.0688732221153307 ================================= +============ Value of Jaccard Index = 0.26106374340235483 ================================= +============ Partial average of Jaccard Index = 0.44063478080703417 ====== +============ Precision = 0.39473684210526316, Recall = 0.5357142857142857, F1 = 0.45454545454545453 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 25.333333333333332 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 99 : "fight night" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 4, 5, 6, 7, 9, 10, 14, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 33, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 49, 51, 52, 53, 54, 56, 57, 58, 59, 60, 62, 63, 67, 68, 70, 71, 74, 76, 78, 79, 80, 82, 84, 86, 87, 89, 90, 91, 93, 95, 98, 99, 100] +The cluster 2 contains the snippets: [1, 3, 8, 11, 13, 16, 27, 31, 32, 34, 35, 39, 48, 55, 61, 64, 65, 66, 72, 73, 75, 77, 81, 83, 94, 96, 97] +The cluster 4 contains the snippets: [15, 50, 88] +The cluster 3 contains the snippets: [69, 85] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 1, 69, 15, 4, 3, 85, 50, 5, 8, 88, 6, 11, 7, 13, 9, 16, 10, 27, 14, 31, 17, 32, 18, 34, 19, 35, 20, 39, 21, 48, 22, 55, 23, 61, 24, 64, 25, 65, 26, 66, 28, 72, 29, 73, 30, 75, 33, 77, 36, 81, 37, 83, 38, 94, 40, 96, 41, 97, 42, 43, 44, 45, 46, 47, 49, 51, 52, 53, 54, 56, 57, 58, 59, 60, 62, 63, 67, 68, 70, 71, 74, 76, 78, 79, 80, 82, 84, 86, 87, 89, 90, 91, 93, 95, 98, 99, 100, 12, 92] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "fight night" =============== +============ Value of Rand Index = 0.5078787878787879 ================================= +============ Partial average Rand Index = 0.5374553616977861 ====== +============ Value of Adjusted Rand Index = 0.016725821421517833 ================================= +============ Partial average of Adjusted Rand Index = 0.06834648069418107 ================================= +============ Value of Jaccard Index = 0.32144846796657384 ================================= +============ Partial average of Jaccard Index = 0.43943087865713054 ====== +============ Precision = 0.6326530612244898, Recall = 0.8378378378378378, F1 = 0.7209302325581396 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 24.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 100 : "magic lantern" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 5, 6, 7, 11, 12, 13, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 28, 29, 31, 33, 35, 37, 39, 40, 41, 42, 43, 44, 45, 47, 49, 50, 51, 52, 53, 54, 56, 57, 58, 59, 60, 61, 63, 65, 66, 67, 68, 70, 71, 72, 75, 78, 79, 81, 84, 85, 86, 88, 90, 92, 93, 95, 96, 97, 98, 99, 100] +The cluster 2 contains the snippets: [8, 27, 30, 36, 38, 46, 62, 64, 69, 73, 77, 87, 89] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 8, 2, 27, 3, 30, 5, 36, 6, 38, 7, 46, 11, 62, 12, 64, 13, 69, 15, 73, 17, 77, 18, 87, 19, 89, 20, 21, 23, 24, 25, 26, 28, 29, 31, 33, 35, 37, 39, 40, 41, 42, 43, 44, 45, 47, 49, 50, 51, 52, 53, 54, 56, 57, 58, 59, 60, 61, 63, 65, 66, 67, 68, 70, 71, 72, 75, 78, 79, 81, 84, 85, 86, 88, 90, 92, 93, 95, 96, 97, 98, 99, 100, 4, 9, 10, 14, 16, 22, 32, 34, 48, 55, 74, 76, 80, 82, 83, 91, 94] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "magic lantern" =============== +============ Value of Rand Index = 0.45151515151515154 ================================= +============ Partial average Rand Index = 0.5365959595959597 ====== +============ Value of Adjusted Rand Index = -0.11939888257100302 ================================= +============ Partial average of Adjusted Rand Index = 0.06646902706152923 ================================= +============ Value of Jaccard Index = 0.3697771587743733 ================================= +============ Partial average of Jaccard Index = 0.43873434145830303 ====== +============ Precision = 0.0963855421686747, Recall = 0.42105263157894735, F1 = 0.15686274509803924 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 41.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 101 : "train of thought" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 2 contains the snippets: [2, 3, 4, 5, 6, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 28, 29, 30, 33, 35, 36, 37, 39, 40, 41, 42, 43, 44, 47, 49, 51, 53, 56, 57, 61, 62, 63, 64, 65, 67, 68, 70, 71, 72, 73, 74, 75, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 90, 92, 93, 94, 96, 98, 99, 100] +The cluster 1 contains the snippets: [7, 26, 27, 38, 52, 59, 66, 87, 95] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [7, 2, 26, 3, 27, 4, 38, 5, 52, 6, 59, 8, 66, 9, 87, 10, 95, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 28, 29, 30, 33, 35, 36, 37, 39, 40, 41, 42, 43, 44, 47, 49, 51, 53, 56, 57, 61, 62, 63, 64, 65, 67, 68, 70, 71, 72, 73, 74, 75, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 90, 92, 93, 94, 96, 98, 99, 100, 1, 13, 25, 31, 32, 34, 45, 46, 48, 50, 54, 55, 58, 60, 69, 76, 77, 88, 91, 97] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "train of thought" =============== +============ Value of Rand Index = 0.4894949494949495 ================================= +============ Partial average Rand Index = 0.5361296129612962 ====== +============ Value of Adjusted Rand Index = -0.021190035344208855 ================================= +============ Partial average of Adjusted Rand Index = 0.06560111555256153 ================================= +============ Value of Jaccard Index = 0.3225201072386059 ================================= +============ Partial average of Jaccard Index = 0.43758370547592973 ====== +============ Precision = 0.37499999999999994, Recall = 0.7317073170731707, F1 = 0.4958677685950413 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 40.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 102 : "heart to heart" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 8, 9, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 29, 30, 31, 32, 33, 34, 36, 37, 38, 40, 41, 42, 44, 46, 48, 50, 51, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 64, 65, 66, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 89, 91, 92, 93, 94, 95, 96, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 8, 9, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 29, 30, 31, 32, 33, 34, 36, 37, 38, 40, 41, 42, 44, 46, 48, 50, 51, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 64, 65, 66, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 89, 91, 92, 93, 94, 95, 96, 98, 99, 100, 5, 6, 7, 10, 13, 15, 24, 27, 28, 35, 39, 43, 45, 47, 49, 52, 63, 67, 83, 87, 88, 90, 97] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "heart to heart" =============== +============ Value of Rand Index = 0.5547474747474748 ================================= +============ Partial average Rand Index = 0.5363121410180235 ====== +============ Value of Adjusted Rand Index = -0.09546857293072615 ================================= +============ Partial average of Adjusted Rand Index = 0.06402200095958811 ================================= +============ Value of Jaccard Index = 0.535315201349357 ================================= +============ Partial average of Jaccard Index = 0.43854185739625745 ====== +============ Precision = 0.05194805194805195, Recall = 0.4444444444444444, F1 = 0.09302325581395349 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 77.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 103 : "bed of roses" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [6, 8, 9, 14, 17, 18, 25, 37, 40, 44, 45, 59, 61, 63, 67, 69, 72, 73, 82, 86, 88, 89, 97] +The cluster 2 contains the snippets: [1, 4, 5, 12, 32, 53, 68, 84, 98, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [6, 1, 8, 4, 9, 5, 14, 12, 17, 32, 18, 53, 25, 68, 37, 84, 40, 98, 44, 100, 45, 59, 61, 63, 67, 69, 72, 73, 82, 86, 88, 89, 97, 2, 3, 7, 10, 11, 13, 15, 16, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 38, 39, 41, 42, 43, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 60, 62, 64, 65, 66, 70, 71, 74, 75, 76, 77, 78, 79, 80, 81, 83, 85, 87, 90, 91, 92, 93, 94, 95, 96, 99] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "bed of roses" =============== +============ Value of Rand Index = 0.7355555555555555 ================================= +============ Partial average Rand Index = 0.5382465431009121 ====== +============ Value of Adjusted Rand Index = 0.4734520976346118 ================================= +============ Partial average of Adjusted Rand Index = 0.06799705044186989 ================================= +============ Value of Jaccard Index = 0.523306627822287 ================================= +============ Partial average of Jaccard Index = 0.4393648163324325 ====== +============ Precision = 0.6363636363636364, Recall = 0.4666666666666667, F1 = 0.5384615384615385 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 16.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 104 : "food for thought" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 2 contains the snippets: [4, 6, 8, 10, 12, 16, 20, 21, 24, 25, 29, 36, 41, 42, 45, 47, 50, 51, 52, 53, 54, 56, 57, 59, 62, 64, 65, 68, 69, 71, 73, 75, 80, 81, 82, 84, 85, 87, 89, 93, 94, 95, 96, 97, 99] +The cluster 1 contains the snippets: [19, 23, 31, 32, 33, 34, 35, 38, 40, 43, 44, 55, 60, 61, 74, 90, 91, 98, 100] +The cluster 3 contains the snippets: [13, 18, 27, 58, 67, 70, 72, 76, 77, 88, 92] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [19, 4, 13, 23, 6, 18, 31, 8, 27, 32, 10, 58, 33, 12, 67, 34, 16, 70, 35, 20, 72, 38, 21, 76, 40, 24, 77, 43, 25, 88, 44, 29, 92, 55, 36, 60, 41, 61, 42, 74, 45, 90, 47, 91, 50, 98, 51, 100, 52, 53, 54, 56, 57, 59, 62, 64, 65, 68, 69, 71, 73, 75, 80, 81, 82, 84, 85, 87, 89, 93, 94, 95, 96, 97, 99, 1, 2, 3, 5, 7, 9, 11, 14, 15, 17, 22, 26, 28, 30, 37, 39, 46, 48, 49, 63, 66, 78, 79, 83, 86] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "food for thought" =============== +============ Value of Rand Index = 0.39636363636363636 ================================= +============ Partial average Rand Index = 0.5368822843822845 ====== +============ Value of Adjusted Rand Index = 0.01979073458690184 ================================= +============ Partial average of Adjusted Rand Index = 0.06753352817403366 ================================= +============ Value of Jaccard Index = 0.29859154929577464 ================================= +============ Partial average of Jaccard Index = 0.43801122722631075 ====== +============ Precision = 0.06666666666666667, Recall = 0.45454545454545453, F1 = 0.11627906976744184 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 25.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 105 : "burden of proof" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 5, 6, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 83, 84, 85, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +The cluster 2 contains the snippets: [4, 7, 9, 59] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 4, 2, 7, 3, 9, 5, 59, 6, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 83, 84, 85, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 55, 71, 81, 86] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "burden of proof" =============== +============ Value of Rand Index = 0.6050505050505051 ================================= +============ Partial average Rand Index = 0.5375315055315056 ====== +============ Value of Adjusted Rand Index = 0.1674823586008285 ================================= +============ Partial average of Adjusted Rand Index = 0.06848542179714599 ================================= +============ Value of Jaccard Index = 0.5561861520998865 ================================= +============ Partial average of Jaccard Index = 0.4391367027012972 ====== +============ Precision = 0.7083333333333334, Recall = 0.9444444444444444, F1 = 0.8095238095238096 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 48.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 106 : "dial tone" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 15, 16, 17, 18, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 34, 37, 39, 40, 41, 42, 44, 45, 46, 47, 48, 50, 51, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 86, 87, 88, 89, 90, 91, 92, 93, 94, 96, 97, 98, 99] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 15, 16, 17, 18, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 34, 37, 39, 40, 41, 42, 44, 45, 46, 47, 48, 50, 51, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 86, 87, 88, 89, 90, 91, 92, 93, 94, 96, 97, 98, 99, 3, 13, 14, 19, 26, 33, 35, 36, 38, 43, 49, 52, 63, 85, 95, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "dial tone" =============== +============ Value of Rand Index = 0.5709090909090909 ================================= +============ Partial average Rand Index = 0.5378463884124263 ====== +============ Value of Adjusted Rand Index = 0.03349961059791437 ================================= +============ Partial average of Adjusted Rand Index = 0.06815536697451173 ================================= +============ Value of Jaccard Index = 0.5179300953245575 ================================= +============ Partial average of Jaccard Index = 0.43988003659396946 ====== +============ Precision = 0.7738095238095238, Recall = 0.8333333333333334, F1 = 0.8024691358024691 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 84.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 107 : "stranger in town" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 6, 9, 10, 19, 20, 21, 22, 23, 38, 41, 42, 44, 47, 50, 51, 52, 56, 57, 58, 61, 67, 71, 72, 73, 84, 88, 89, 94, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 6, 9, 10, 19, 20, 21, 22, 23, 38, 41, 42, 44, 47, 50, 51, 52, 56, 57, 58, 61, 67, 71, 72, 73, 84, 88, 89, 94, 100, 5, 7, 8, 11, 12, 13, 14, 15, 16, 17, 18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 43, 45, 46, 48, 49, 53, 54, 55, 59, 60, 62, 63, 64, 65, 66, 68, 69, 70, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 90, 91, 92, 93, 95, 96, 97, 98, 99] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "stranger in town" =============== +============ Value of Rand Index = 0.6248484848484849 ================================= +============ Partial average Rand Index = 0.5386594921174361 ====== +============ Value of Adjusted Rand Index = 0.2700509955398557 ================================= +============ Partial average of Adjusted Rand Index = 0.0700422420078327 ================================= +============ Value of Jaccard Index = 0.42185554171855544 ================================= +============ Partial average of Jaccard Index = 0.43971158337083477 ====== +============ Precision = 0.5757575757575758, Recall = 0.4318181818181818, F1 = 0.49350649350649356 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 33.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 108 : "beer for my horses" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 10, 11, 12, 16, 19, 23, 24, 25, 26, 29, 30, 32, 33, 35, 36, 39, 40, 42, 43, 47, 48, 49, 52, 53, 54, 55, 56, 58, 60, 61, 62, 64, 65, 70, 71, 72, 74, 82, 84, 85, 86, 88, 89, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 10, 11, 12, 16, 19, 23, 24, 25, 26, 29, 30, 32, 33, 35, 36, 39, 40, 42, 43, 47, 48, 49, 52, 53, 54, 55, 56, 58, 60, 61, 62, 64, 65, 70, 71, 72, 74, 82, 84, 85, 86, 88, 89, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 7, 8, 9, 13, 14, 15, 17, 18, 20, 21, 22, 27, 28, 31, 34, 37, 38, 41, 44, 45, 46, 50, 51, 57, 59, 63, 66, 67, 68, 69, 73, 75, 76, 77, 78, 79, 80, 81, 83, 87, 90] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "beer for my horses" =============== +============ Value of Rand Index = 0.6698989898989899 ================================= +============ Partial average Rand Index = 0.5398746726524506 ====== +============ Value of Adjusted Rand Index = 0.32522688082623546 ================================= +============ Partial average of Adjusted Rand Index = 0.07240506273763272 ================================= +============ Value of Jaccard Index = 0.456781914893617 ================================= +============ Partial average of Jaccard Index = 0.4398696419960457 ====== +============ Precision = 0.6949152542372882, Recall = 0.4939759036144578, F1 = 0.5774647887323943 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 59.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 109 : "peter and the wolf" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 43, 44, 45, 46, 47, 49, 50, 51, 52, 53, 54, 55, 56, 58, 59, 60, 61, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 43, 44, 45, 46, 47, 49, 50, 51, 52, 53, 54, 55, 56, 58, 59, 60, 61, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 94, 95, 96, 97, 98, 99, 100, 10, 14, 18, 41, 48, 57, 62, 75, 92, 93] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "peter and the wolf" =============== +============ Value of Rand Index = 0.4036363636363636 ================================= +============ Partial average Rand Index = 0.5386247799091838 ====== +============ Value of Adjusted Rand Index = -0.07076436061465406 ================================= +============ Partial average of Adjusted Rand Index = 0.0710915817894466 ================================= +============ Value of Jaccard Index = 0.3464688952844808 ================================= +============ Partial average of Jaccard Index = 0.4390127544115359 ====== +============ Precision = 0.28888888888888886, Recall = 0.6190476190476191, F1 = 0.3939393939393939 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 90.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 110 : "gorky park" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 5, 6, 7, 8, 10, 11, 12, 14, 16, 25, 29, 35, 36, 37, 38, 39, 40, 42, 43, 44, 46, 47, 49, 50, 52, 55, 56, 60, 61, 64, 70, 71, 74, 78, 79, 80, 81, 82, 83, 84, 85, 89, 91, 92, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 5, 6, 7, 8, 10, 11, 12, 14, 16, 25, 29, 35, 36, 37, 38, 39, 40, 42, 43, 44, 46, 47, 49, 50, 52, 55, 56, 60, 61, 64, 70, 71, 74, 78, 79, 80, 81, 82, 83, 84, 85, 89, 91, 92, 94, 95, 96, 97, 98, 99, 100, 4, 9, 13, 15, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 34, 41, 45, 48, 51, 53, 54, 57, 58, 59, 62, 63, 65, 66, 67, 68, 69, 72, 73, 75, 76, 77, 86, 87, 88, 90, 93] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "gorky park" =============== +============ Value of Rand Index = 0.5135353535353535 ================================= +============ Partial average Rand Index = 0.5383966942148762 ====== +============ Value of Adjusted Rand Index = 0.023956176118245385 ================================= +============ Partial average of Adjusted Rand Index = 0.0706630781015266 ================================= +============ Value of Jaccard Index = 0.21049180327868852 ================================= +============ Partial average of Jaccard Index = 0.4369352912194191 ====== +============ Precision = 0.2962962962962963, Recall = 0.17582417582417584, F1 = 0.2206896551724138 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 54.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 111 : "neutron star" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "neutron star" =============== +============ Value of Rand Index = 0.8317171717171717 ================================= +============ Partial average Rand Index = 0.5410392210392212 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.07002647379430564 ================================= +============ Value of Jaccard Index = 0.8317171717171717 ================================= +============ Partial average of Jaccard Index = 0.4404918847374169 ====== +============ Precision = 0.91, Recall = 0.978494623655914, F1 = 0.9430051813471503 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 112 : "death by chocolate" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "death by chocolate" =============== +============ Value of Rand Index = 0.6951515151515152 ================================= +============ Partial average Rand Index = 0.5424152236652239 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.0694012374211422 ================================= +============ Value of Jaccard Index = 0.6951515151515152 ================================= +============ Partial average of Jaccard Index = 0.4427656314375428 ====== +============ Precision = 0.82, Recall = 0.9647058823529412, F1 = 0.8864864864864864 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 100.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 113 : "before the storm" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 5, 12, 14, 15, 16, 17, 19, 21, 22, 25, 28, 29, 30, 31, 32, 34, 37, 38, 39, 40, 42, 46, 47, 49, 50, 51, 52, 53, 54, 56, 57, 58, 59, 60, 61, 63, 64, 65, 67, 68, 70, 72, 73, 74, 76, 80, 81, 82, 84, 85, 87, 88, 89, 90, 92, 93, 94, 97, 98, 99, 100] +The cluster 2 contains the snippets: [1, 4, 6, 7, 8, 10, 13, 23, 24, 26, 27, 36, 41, 43, 44, 45, 48, 55, 62, 66, 69, 75, 77, 83, 86, 91, 95] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 1, 3, 4, 5, 6, 12, 7, 14, 8, 15, 10, 16, 13, 17, 23, 19, 24, 21, 26, 22, 27, 25, 36, 28, 41, 29, 43, 30, 44, 31, 45, 32, 48, 34, 55, 37, 62, 38, 66, 39, 69, 40, 75, 42, 77, 46, 83, 47, 86, 49, 91, 50, 95, 51, 52, 53, 54, 56, 57, 58, 59, 60, 61, 63, 64, 65, 67, 68, 70, 72, 73, 74, 76, 80, 81, 82, 84, 85, 87, 88, 89, 90, 92, 93, 94, 97, 98, 99, 100, 9, 11, 18, 20, 33, 35, 71, 78, 79, 96] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "before the storm" =============== +============ Value of Rand Index = 0.6016161616161616 ================================= +============ Partial average Rand Index = 0.5429391257709844 ====== +============ Value of Adjusted Rand Index = 0.2235591547789998 ================================= +============ Partial average of Adjusted Rand Index = 0.07076546677829139 ================================= +============ Value of Jaccard Index = 0.4868592245641426 ================================= +============ Partial average of Jaccard Index = 0.44315584022627375 ====== +============ Precision = 0.1111111111111111, Recall = 0.5263157894736842, F1 = 0.1834862385321101 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 45.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 114 : "music of the spheres" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 10, 11, 12, 14, 15, 17, 19, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 37, 39, 41, 42, 43, 44, 45, 47, 49, 51, 53, 54, 57, 58, 60, 61, 63, 64, 68, 69, 72, 73, 74, 75, 76, 78, 79, 80, 81, 82, 83, 84, 86, 87, 88, 90, 93, 95, 96, 100] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 10, 11, 12, 14, 15, 17, 19, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 37, 39, 41, 42, 43, 44, 45, 47, 49, 51, 53, 54, 57, 58, 60, 61, 63, 64, 68, 69, 72, 73, 74, 75, 76, 78, 79, 80, 81, 82, 83, 84, 86, 87, 88, 90, 93, 95, 96, 100, 6, 7, 8, 9, 13, 16, 18, 20, 25, 34, 35, 36, 38, 40, 46, 48, 50, 52, 55, 56, 59, 62, 65, 66, 67, 70, 71, 77, 85, 89, 91, 92, 94, 97, 98, 99] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "music of the spheres" =============== +============ Value of Rand Index = 0.47878787878787876 ================================= +============ Partial average Rand Index = 0.5423763955342904 ====== +============ Value of Adjusted Rand Index = -0.04356037206346958 ================================= +============ Partial average of Adjusted Rand Index = 0.06976260854283735 ================================= +============ Value of Jaccard Index = 0.3333333333333333 ================================= +============ Partial average of Jaccard Index = 0.4421924849026515 ====== +============ Precision = 0.234375, Recall = 0.4838709677419355, F1 = 0.3157894736842105 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 64.0 ============ +=========================================================================== + +[ INFO ] WSIEvaluator - + +=========== Final average value of S-recall@K: ============= +1 0.2894 +2 0.4199 +3 0.4896 +4 0.5369 +5 0.5808 +6 0.6104 +7 0.6400 +8 0.6554 +9 0.6797 +10 0.7056 +11 0.7089 +12 0.7211 +13 0.7276 +14 0.7417 +15 0.7497 +16 0.7531 +17 0.7564 +18 0.7613 +19 0.7688 +20 0.7723 +21 0.7769 +22 0.7820 +23 0.7892 +24 0.7945 +25 0.8019 +26 0.8049 +27 0.8154 +28 0.8202 +29 0.8239 +30 0.8311 +31 0.8355 +32 0.8364 +33 0.8420 +34 0.8438 +35 0.8469 +36 0.8583 +37 0.8605 +38 0.8613 +39 0.8624 +40 0.8633 +41 0.8642 +42 0.8649 +43 0.8660 +44 0.8699 +45 0.8734 +46 0.8751 +47 0.8761 +48 0.8813 +49 0.8813 +50 0.8843 +51 0.8843 +52 0.8889 +53 0.8965 +54 0.8980 +55 0.9015 +56 0.9083 +57 0.9098 +58 0.9173 +59 0.9216 +60 0.9216 +61 0.9227 +62 0.9227 +63 0.9265 +64 0.9317 +65 0.9324 +66 0.9324 +67 0.9383 +68 0.9383 +69 0.9412 +70 0.9434 +71 0.9456 +72 0.9464 +73 0.9493 +74 0.9510 +75 0.9510 +76 0.9532 +77 0.9567 +78 0.9576 +79 0.9576 +80 0.9635 +81 0.9652 +82 0.9652 +83 0.9652 +84 0.9703 +85 0.9718 +86 0.9718 +87 0.9736 +88 0.9736 +89 0.9776 +90 0.9776 +91 0.9798 +92 0.9825 +93 0.9825 +94 0.9861 +95 0.9923 +96 0.9932 +97 0.9932 +98 0.9941 +99 0.9991 +100 1.0000 + +=========== Final average value of S-precision@r: ============= +0.4000 0.5724 +0.4500 0.4059 +0.5000 0.3601 +0.5500 0.2690 +0.6000 0.2250 +0.6500 0.2192 +0.7000 0.1764 +0.7500 0.1668 +0.8000 0.1529 +0.8500 0.1419 +0.9000 0.1237 +0.9500 0.1271 +1.0000 0.0658 + +=========== Final average value of F1: ===================== +average F1 = 0.5140040577013422 + +=========== Final average value of Rand Index: ============= +average Rand Index = 0.5423763955342904 + +=========== Final average value of Adjusted Rand Index: ==== +average Adj Rand Index = 0.06976260854283735 + +=========== Final average value of Jaccard Index: ========== +average Jaccard Index = 0.4421924849026515 + +================ Statistics: ==================================== +============ average number of created clusters: 1.6666666666666667 +============ average cluster size: 64.38794903926483 + +[ WARN ] WSIEvaluator - Simulation started at: 03:01 and completed at 03:01 +Execution time: 6.652 sec diff --git a/results/try5.log b/results/try5.log new file mode 100644 index 0000000..b682a93 --- /dev/null +++ b/results/try5.log @@ -0,0 +1,3347 @@ +[ INFO ] Configuration - Loading /eval.properties FROM /home/students/zimmermann/Courses/ws17/fsem/absinth/WSI-Evaluator/config/eval.properties +[ INFO ] WSIEvaluator - Run started at 11:45 +[ INFO ] Dataset - Loading the datasets/dataset/ +[ INFO ] Dataset - Loading the topics data datasets/dataset/ +[ INFO ] Dataset - Loading the subtopics data +[ INFO ] Dataset - Loading the snippets data +[ INFO ] Dataset - Loading the relations data +[ INFO ] Dataset - Loading the relations data +[ INFO ] WSIEvaluator - +=================================================== +Starting the evaluation +=================================================== +[ INFO ] WSIEvaluator - +=================================================== +subtopic-recall@K default: 100 +=================================================== +[ WARN ] WSIEvaluator - +============= Query 1 : "aetna" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 3, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 3, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 58, 59, 60, 61, 62, 63, 64, 2, 4, 18, 34, 45, 53, 57] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "aetna" =============== +============ Value of Rand Index = 0.7321428571428571 ================================= +============ Partial average Rand Index = 0.7321428571428571 ====== +============ Value of Adjusted Rand Index = 0.06449633666582427 ================================= +============ Partial average of Adjusted Rand Index = 0.06449633666582427 ================================= +============ Value of Jaccard Index = 0.7215059308922125 ================================= +============ Partial average of Jaccard Index = 0.7215059308922125 ====== +============ Precision = 0.9298245614035088, Recall = 0.828125, F1 = 0.8760330578512396 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 57.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 2 : "kangaroo" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 5 snippet clusters: ==================== +The cluster 1 contains the snippets: [3, 6, 8, 9, 14, 16, 17, 21, 23, 24, 28, 29, 31, 32, 33, 35, 36, 38, 40, 42, 43, 45, 46, 47, 49, 53, 54, 55, 58, 59, 60, 61] +The cluster 4 contains the snippets: [1, 2, 5, 7, 10, 11, 12, 15, 18, 19, 20, 22, 25, 27, 30, 37, 39, 41, 44, 50, 51, 56, 57, 64] +The cluster 2 contains the snippets: [4, 26, 48, 62] +The cluster 3 contains the snippets: [13, 63] +The cluster 5 contains the snippets: [34] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 4, 13, 1, 34, 6, 26, 63, 2, 8, 48, 5, 9, 62, 7, 14, 10, 16, 11, 17, 12, 21, 15, 23, 18, 24, 19, 28, 20, 29, 22, 31, 25, 32, 27, 33, 30, 35, 37, 36, 39, 38, 41, 40, 44, 42, 50, 43, 51, 45, 56, 46, 57, 47, 64, 49, 53, 54, 55, 58, 59, 60, 61, 52] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "kangaroo" =============== +============ Value of Rand Index = 0.6215277777777778 ================================= +============ Partial average Rand Index = 0.6768353174603174 ====== +============ Value of Adjusted Rand Index = 0.1503753750436354 ================================= +============ Partial average of Adjusted Rand Index = 0.10743585585472984 ================================= +============ Value of Jaccard Index = 0.26137463697967084 ================================= +============ Partial average of Jaccard Index = 0.49144028393594164 ====== +============ Precision = 0.5079365079365079, Recall = 0.5, F1 = 0.5039370078740157 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 5 ============ +============ average size of the created clusters: 12.6 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 3 : "mustang" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 6 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 5, 6, 7, 8, 9, 10, 11, 14, 16, 18, 20, 21, 23, 24, 27, 28, 29, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 43, 44, 46, 47, 48, 50, 51, 53, 54, 56, 58, 60, 61, 62, 63, 64] +The cluster 2 contains the snippets: [12, 13, 19, 22, 25, 30, 42, 45, 49, 55] +The cluster 3 contains the snippets: [3, 15, 40, 59] +The cluster 6 contains the snippets: [17, 26] +The cluster 5 contains the snippets: [57] +The cluster 4 contains the snippets: [52] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 12, 3, 52, 57, 17, 2, 13, 15, 26, 4, 19, 40, 5, 22, 59, 6, 25, 7, 30, 8, 42, 9, 45, 10, 49, 11, 55, 14, 16, 18, 20, 21, 23, 24, 27, 28, 29, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 43, 44, 46, 47, 48, 50, 51, 53, 54, 56, 58, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "mustang" =============== +============ Value of Rand Index = 0.5972222222222222 ================================= +============ Partial average Rand Index = 0.6502976190476191 ====== +============ Value of Adjusted Rand Index = 0.22903187217596813 ================================= +============ Partial average of Adjusted Rand Index = 0.1479678612951426 ================================= +============ Value of Jaccard Index = 0.30300429184549355 ================================= +============ Partial average of Jaccard Index = 0.42862828657245894 ====== +============ Precision = 0.53125, Recall = 0.53125, F1 = 0.53125 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 6 ============ +============ average size of the created clusters: 10.666666666666666 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 4 : "brett butler" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "brett butler" =============== +============ Value of Rand Index = 0.5049603174603174 ================================= +============ Partial average Rand Index = 0.6139632936507937 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.11097589597135696 ================================= +============ Value of Jaccard Index = 0.5049603174603174 ================================= +============ Partial average of Jaccard Index = 0.4477112942944236 ====== +============ Precision = 0.671875, Recall = 0.671875, F1 = 0.671875 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 64.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 5 : "poison ivy" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 2 contains the snippets: [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 32, 33, 34, 35, 37, 39, 40, 42, 44, 45, 49, 51, 53, 54, 56, 57, 59, 60, 61, 63] +The cluster 1 contains the snippets: [3, 17, 28, 31, 36, 38, 41, 43, 46, 47, 48, 52, 62] +The cluster 3 contains the snippets: [55] +The cluster 4 contains the snippets: [58] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 2, 55, 58, 17, 4, 28, 5, 31, 6, 36, 7, 38, 8, 41, 9, 43, 10, 46, 11, 47, 12, 48, 13, 52, 14, 62, 15, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 32, 33, 34, 35, 37, 39, 40, 42, 44, 45, 49, 51, 53, 54, 56, 57, 59, 60, 61, 63, 1, 16, 50, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "poison ivy" =============== +============ Value of Rand Index = 0.6770833333333334 ================================= +============ Partial average Rand Index = 0.6265873015873017 ====== +============ Value of Adjusted Rand Index = 0.346397260519569 ================================= +============ Partial average of Adjusted Rand Index = 0.15806016888099936 ================================= +============ Value of Jaccard Index = 0.5534979423868313 ================================= +============ Partial average of Jaccard Index = 0.4688686239129051 ====== +============ Precision = 0.8, Recall = 0.75, F1 = 0.7741935483870969 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 15.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 6 : "lakota" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 26, 27, 29, 30, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 56, 58, 59, 60, 62, 63, 64] +The cluster 2 contains the snippets: [1, 17, 24, 28, 52, 57, 61] +The cluster 3 contains the snippets: [25, 33] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 1, 25, 3, 17, 33, 4, 24, 5, 28, 6, 52, 7, 57, 8, 61, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 26, 27, 29, 30, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 56, 58, 59, 60, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "lakota" =============== +============ Value of Rand Index = 0.3566468253968254 ================================= +============ Partial average Rand Index = 0.5815972222222222 ====== +============ Value of Adjusted Rand Index = -0.01306611164233784 ================================= +============ Partial average of Adjusted Rand Index = 0.12953912212710983 ================================= +============ Value of Jaccard Index = 0.20478234212139793 ================================= +============ Partial average of Jaccard Index = 0.42485424361432056 ====== +============ Precision = 0.375, Recall = 0.375, F1 = 0.375 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 21.333333333333332 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 7 : "cerberus" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 8 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 4, 8, 12, 14, 17, 18, 21, 22, 23, 25, 28, 29, 34, 35, 40, 42, 44, 45, 46, 47, 50, 51, 52, 55, 57, 58, 59, 62, 64] +The cluster 7 contains the snippets: [1, 5, 6, 11, 13, 15, 16, 20, 30, 36, 43] +The cluster 6 contains the snippets: [26, 27, 31, 33, 37, 38, 39, 41, 53, 63] +The cluster 2 contains the snippets: [10, 32, 54, 61] +The cluster 5 contains the snippets: [7, 48] +The cluster 8 contains the snippets: [19, 60] +The cluster 4 contains the snippets: [56] +The cluster 3 contains the snippets: [9] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 10, 9, 56, 7, 26, 1, 19, 3, 32, 48, 27, 5, 60, 4, 54, 31, 6, 8, 61, 33, 11, 12, 37, 13, 14, 38, 15, 17, 39, 16, 18, 41, 20, 21, 53, 30, 22, 63, 36, 23, 43, 25, 28, 29, 34, 35, 40, 42, 44, 45, 46, 47, 50, 51, 52, 55, 57, 58, 59, 62, 64, 24, 49] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "cerberus" =============== +============ Value of Rand Index = 0.6458333333333334 ================================= +============ Partial average Rand Index = 0.5907738095238095 ====== +============ Value of Adjusted Rand Index = 0.11089588377723969 ================================= +============ Partial average of Adjusted Rand Index = 0.12687580236284265 ================================= +============ Value of Jaccard Index = 0.2153846153846154 ================================= +============ Partial average of Jaccard Index = 0.394930011010077 ====== +============ Precision = 0.6129032258064516, Recall = 0.59375, F1 = 0.6031746031746031 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 8 ============ +============ average size of the created clusters: 7.75 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 8 : "mighty mouse" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 5, 7, 9, 10, 11, 13, 14, 15, 19, 20, 22, 23, 24, 28, 30, 32, 33, 34, 35, 38, 41, 42, 43, 44, 46, 50, 53, 55, 57, 58, 60, 61, 63, 64] +The cluster 2 contains the snippets: [4, 17, 18, 31, 37, 39, 47, 51, 52, 56, 59, 62] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 4, 2, 17, 5, 18, 7, 31, 9, 37, 10, 39, 11, 47, 13, 51, 14, 52, 15, 56, 19, 59, 20, 62, 22, 23, 24, 28, 30, 32, 33, 34, 35, 38, 41, 42, 43, 44, 46, 50, 53, 55, 57, 58, 60, 61, 63, 64, 3, 6, 8, 12, 16, 21, 25, 26, 27, 29, 36, 40, 45, 48, 49, 54] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "mighty mouse" =============== +============ Value of Rand Index = 0.6170634920634921 ================================= +============ Partial average Rand Index = 0.5940600198412699 ====== +============ Value of Adjusted Rand Index = 0.2059169278996865 ================================= +============ Partial average of Adjusted Rand Index = 0.13675594305494815 ================================= +============ Value of Jaccard Index = 0.3588039867109635 ================================= +============ Partial average of Jaccard Index = 0.39041425797268786 ====== +============ Precision = 0.625, Recall = 0.46875, F1 = 0.5357142857142857 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 24.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 9 : "lord of the flies" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 3, 4, 5, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 48, 49, 50, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63] +The cluster 2 contains the snippets: [19] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 19, 3, 4, 5, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 48, 49, 50, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 2, 6, 7, 22, 33, 47, 51, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "lord of the flies" =============== +============ Value of Rand Index = 0.5798611111111112 ================================= +============ Partial average Rand Index = 0.5924823633156966 ====== +============ Value of Adjusted Rand Index = 0.18089192995652018 ================================= +============ Partial average of Adjusted Rand Index = 0.14165994159956727 ================================= +============ Value of Jaccard Index = 0.48914354644149577 ================================= +============ Partial average of Jaccard Index = 0.4013841789136665 ====== +============ Precision = 0.7321428571428571, Recall = 0.640625, F1 = 0.6833333333333332 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 28.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 10 : "sense and sensibility" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 4, 30] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "sense and sensibility" =============== +============ Value of Rand Index = 0.42857142857142855 ================================= +============ Partial average Rand Index = 0.5760912698412698 ====== +============ Value of Adjusted Rand Index = -0.04138208115709125 ================================= +============ Partial average of Adjusted Rand Index = 0.1233557393239014 ================================= +============ Value of Jaccard Index = 0.4152284263959391 ================================= +============ Partial average of Jaccard Index = 0.4027686036618937 ====== +============ Precision = 0.6290322580645161, Recall = 0.609375, F1 = 0.6190476190476191 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 62.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 11 : "century 21" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 3 contains the snippets: [1, 2, 6, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 64] +The cluster 2 contains the snippets: [3, 4, 7, 31, 40, 47] +The cluster 4 contains the snippets: [5, 10] +The cluster 1 contains the snippets: [32] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [32, 3, 1, 5, 4, 2, 10, 7, 6, 31, 8, 40, 9, 47, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 64, 24, 63] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "century 21" =============== +============ Value of Rand Index = 0.8611111111111112 ================================= +============ Partial average Rand Index = 0.6020021645021644 ====== +============ Value of Adjusted Rand Index = 0.6481030555337366 ================================= +============ Partial average of Adjusted Rand Index = 0.17106004079752274 ================================= +============ Value of Jaccard Index = 0.826946847960445 ================================= +============ Partial average of Jaccard Index = 0.44133026223448935 ====== +============ Precision = 0.967741935483871, Recall = 0.9375, F1 = 0.9523809523809523 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 15.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 12 : "one tree hill" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 5, 7, 8, 9, 11, 12, 13, 15, 16, 17, 18, 22, 23, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 41, 42, 43, 45, 47, 52, 56, 57, 58] +The cluster 3 contains the snippets: [10, 14, 19, 20, 24, 25, 26, 37, 39, 40, 44, 46, 48, 49, 50, 53, 59, 60, 61, 62, 63, 64] +The cluster 2 contains the snippets: [51, 54, 55] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 51, 10, 2, 54, 14, 3, 55, 19, 5, 20, 7, 24, 8, 25, 9, 26, 11, 37, 12, 39, 13, 40, 15, 44, 16, 46, 17, 48, 18, 49, 22, 50, 23, 53, 27, 59, 28, 60, 29, 61, 30, 62, 31, 63, 32, 64, 33, 34, 35, 36, 38, 41, 42, 43, 45, 47, 52, 56, 57, 58, 4, 6, 21] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "one tree hill" =============== +============ Value of Rand Index = 0.5079365079365079 ================================= +============ Partial average Rand Index = 0.5941633597883597 ====== +============ Value of Adjusted Rand Index = 0.0845968993312552 ================================= +============ Partial average of Adjusted Rand Index = 0.1638547790086671 ================================= +============ Value of Jaccard Index = 0.41784037558685444 ================================= +============ Partial average of Jaccard Index = 0.43937277168051975 ====== +============ Precision = 0.8852459016393442, Recall = 0.84375, F1 = 0.864 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 20.333333333333332 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 13 : "stone cold" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64] +The cluster 2 contains the snippets: [61] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 61, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 47, 48] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "stone cold" =============== +============ Value of Rand Index = 0.5451388888888888 ================================= +============ Partial average Rand Index = 0.5903922466422465 ====== +============ Value of Adjusted Rand Index = 0.05507019993743642 ================================= +============ Partial average of Adjusted Rand Index = 0.1554867344647263 ================================= +============ Value of Jaccard Index = 0.5176223040504997 ================================= +============ Partial average of Jaccard Index = 0.44539196647821044 ====== +============ Precision = 0.7096774193548387, Recall = 0.6875, F1 = 0.6984126984126984 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 31.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 14 : "flight 93" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 11, 30, 34, 54] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "flight 93" =============== +============ Value of Rand Index = 0.37648809523809523 ================================= +============ Partial average Rand Index = 0.5751133786848072 ====== +============ Value of Adjusted Rand Index = -0.028561408977556126 ================================= +============ Partial average of Adjusted Rand Index = 0.14234043850456327 ================================= +============ Value of Jaccard Index = 0.3313829787234043 ================================= +============ Partial average of Jaccard Index = 0.4372484673528671 ====== +============ Precision = 0.45, Recall = 0.421875, F1 = 0.435483870967742 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 60.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 15 : "monte carlo" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 7 snippet clusters: ==================== +The cluster 6 contains the snippets: [1, 2, 6, 7, 9, 10, 12, 13, 14, 20, 21, 22, 25, 27, 28, 30, 33, 35, 37, 38, 39, 40, 42, 43, 47, 48, 52, 53, 54, 56, 57, 60, 61, 62, 63] +The cluster 1 contains the snippets: [11, 15, 19, 23, 24, 34, 49, 51, 64] +The cluster 7 contains the snippets: [8, 36, 46, 50, 59] +The cluster 4 contains the snippets: [17, 26, 31, 45] +The cluster 5 contains the snippets: [3, 18, 41, 44] +The cluster 3 contains the snippets: [4, 29, 32, 55] +The cluster 2 contains the snippets: [5, 16, 58] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [11, 5, 4, 17, 3, 1, 8, 15, 16, 29, 26, 18, 2, 36, 19, 58, 32, 31, 41, 6, 46, 23, 55, 45, 44, 7, 50, 24, 9, 59, 34, 10, 49, 12, 51, 13, 64, 14, 20, 21, 22, 25, 27, 28, 30, 33, 35, 37, 38, 39, 40, 42, 43, 47, 48, 52, 53, 54, 56, 57, 60, 61, 62, 63] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "monte carlo" =============== +============ Value of Rand Index = 0.6731150793650794 ================================= +============ Partial average Rand Index = 0.5816468253968253 ====== +============ Value of Adjusted Rand Index = 0.1271775492666826 ================================= +============ Partial average of Adjusted Rand Index = 0.1413295792220379 ================================= +============ Value of Jaccard Index = 0.1721105527638191 ================================= +============ Partial average of Jaccard Index = 0.4195726063802639 ====== +============ Precision = 0.359375, Recall = 0.359375, F1 = 0.359375 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 7 ============ +============ average size of the created clusters: 9.142857142857142 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 16 : "prince of persia" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 15, 29, 61] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "prince of persia" =============== +============ Value of Rand Index = 0.21478174603174602 ================================= +============ Partial average Rand Index = 0.5587177579365079 ====== +============ Value of Adjusted Rand Index = 0.005887432294528613 ================================= +============ Partial average of Adjusted Rand Index = 0.13286444503906858 ================================= +============ Value of Jaccard Index = 0.14663072776280323 ================================= +============ Partial average of Jaccard Index = 0.4025137389666726 ====== +============ Precision = 0.2459016393442623, Recall = 0.234375, F1 = 0.24 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 61.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 17 : "guild wars" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14, 16, 17, 18, 20, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14, 16, 17, 18, 20, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 1, 11, 12, 15, 19, 21, 25, 41, 50, 51, 61] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "guild wars" =============== +============ Value of Rand Index = 0.49702380952380953 ================================= +============ Partial average Rand Index = 0.5550887021475257 ====== +============ Value of Adjusted Rand Index = -0.00385291925173026 ================================= +============ Partial average of Adjusted Rand Index = 0.12482224713960981 ================================= +============ Value of Jaccard Index = 0.4121739130434783 ================================= +============ Partial average of Jaccard Index = 0.40308198450060234 ====== +============ Precision = 0.6037735849056604, Recall = 0.5, F1 = 0.5470085470085471 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 53.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 18 : "silent hill" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 5, 25, 26, 35] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "silent hill" =============== +============ Value of Rand Index = 0.29365079365079366 ================================= +============ Partial average Rand Index = 0.5405643738977073 ====== +============ Value of Adjusted Rand Index = 0.0010689470871191838 ================================= +============ Partial average of Adjusted Rand Index = 0.11794706380336034 ================================= +============ Value of Jaccard Index = 0.22185792349726777 ================================= +============ Partial average of Jaccard Index = 0.3930139811115282 ====== +============ Precision = 0.4166666666666667, Recall = 0.390625, F1 = 0.40322580645161293 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 60.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 19 : "kawasaki" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 0 snippet clusters: ==================== + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "kawasaki" =============== +============ Value of Rand Index = 0.25992063492063494 ================================= +============ Partial average Rand Index = 0.5257936507936508 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.11173932360318349 ================================= +============ Value of Jaccard Index = 0.25992063492063494 ================================= +============ Partial average of Jaccard Index = 0.3860090681541128 ====== +============ Precision = 0.0, Recall = 0.0, F1 = 0.0 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 0 ============ +============ average size of the created clusters: 0.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 20 : "battle of the bulge" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 2 contains the snippets: [1, 2, 4, 5, 7, 8, 10, 14, 19, 22, 23, 24, 27, 30, 34, 36, 37, 38, 39, 41, 44, 45, 46, 47, 48, 55, 56, 57, 59, 62, 63] +The cluster 1 contains the snippets: [3, 6, 11, 12, 13, 15, 16, 17, 18, 20, 21, 26, 28, 29, 31, 32, 33, 35, 40, 42, 43, 49, 50, 51, 52, 53, 54, 58, 60, 61] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 1, 6, 2, 11, 4, 12, 5, 13, 7, 15, 8, 16, 10, 17, 14, 18, 19, 20, 22, 21, 23, 26, 24, 28, 27, 29, 30, 31, 34, 32, 36, 33, 37, 35, 38, 40, 39, 42, 41, 43, 44, 49, 45, 50, 46, 51, 47, 52, 48, 53, 55, 54, 56, 58, 57, 60, 59, 61, 62, 63, 9, 25, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "battle of the bulge" =============== +============ Value of Rand Index = 0.5267857142857143 ================================= +============ Partial average Rand Index = 0.5258432539682539 ====== +============ Value of Adjusted Rand Index = 0.030220885660433263 ================================= +============ Partial average of Adjusted Rand Index = 0.10766340170604598 ================================= +============ Value of Jaccard Index = 0.2750759878419453 ================================= +============ Partial average of Jaccard Index = 0.3804624141385044 ====== +============ Precision = 0.5737704918032787, Recall = 0.546875, F1 = 0.5599999999999999 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 30.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 21 : "dead or alive" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 5, 6, 7, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 27, 28, 29, 32, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 57, 58, 59, 60, 61, 63, 64] +The cluster 2 contains the snippets: [4, 8, 10, 23, 24, 62] +The cluster 3 contains the snippets: [9] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 4, 9, 2, 8, 3, 10, 5, 23, 6, 24, 7, 62, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 27, 28, 29, 32, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 57, 58, 59, 60, 61, 63, 64, 21, 25, 26, 30, 31, 33, 38, 53, 56] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "dead or alive" =============== +============ Value of Rand Index = 0.6235119047619048 ================================= +============ Partial average Rand Index = 0.530494142101285 ====== +============ Value of Adjusted Rand Index = 0.2505554184152061 ================================= +============ Partial average of Adjusted Rand Index = 0.11446778345410122 ================================= +============ Value of Jaccard Index = 0.47978067169294036 ================================= +============ Partial average of Jaccard Index = 0.3851918549744299 ====== +============ Precision = 0.7636363636363637, Recall = 0.65625, F1 = 0.7058823529411765 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 18.333333333333332 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 22 : "babel fish" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "babel fish" =============== +============ Value of Rand Index = 0.24404761904761904 ================================= +============ Partial average Rand Index = 0.5174738455988456 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.1092647023880057 ================================= +============ Value of Jaccard Index = 0.24404761904761904 ================================= +============ Partial average of Jaccard Index = 0.37877620788684757 ====== +============ Precision = 0.328125, Recall = 0.328125, F1 = 0.328125 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 64.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 23 : "queen" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 2 contains the snippets: [3, 5, 8, 10, 13, 16, 17, 18, 22, 24, 26, 27, 28, 31, 35, 36, 39, 40, 45, 46, 47, 48, 49, 50, 52, 54, 55, 56, 57, 58, 60, 62, 63] +The cluster 3 contains the snippets: [2, 4, 7, 9, 15, 19, 20, 23, 29, 32, 34, 38, 51, 53, 59] +The cluster 1 contains the snippets: [1, 42, 43, 44, 61, 64] +The cluster 4 contains the snippets: [11, 12, 33, 41] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 3, 2, 11, 42, 5, 4, 12, 43, 8, 7, 33, 44, 10, 9, 41, 61, 13, 15, 64, 16, 19, 17, 20, 18, 23, 22, 29, 24, 32, 26, 34, 27, 38, 28, 51, 31, 53, 35, 59, 36, 39, 40, 45, 46, 47, 48, 49, 50, 52, 54, 55, 56, 57, 58, 60, 62, 63, 6, 14, 21, 25, 30, 37] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "queen" =============== +============ Value of Rand Index = 0.5868055555555556 ================================= +============ Partial average Rand Index = 0.5204882677708764 ====== +============ Value of Adjusted Rand Index = 0.03594604648599494 ================================= +============ Partial average of Adjusted Rand Index = 0.10607693474009222 ================================= +============ Value of Jaccard Index = 0.19980787704130643 ================================= +============ Partial average of Jaccard Index = 0.3709949761109545 ====== +============ Precision = 0.5344827586206896, Recall = 0.484375, F1 = 0.5081967213114754 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 14.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 24 : "noggin" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 3, 4, 5, 6, 7, 8, 9, 10, 11, 15, 17, 18, 20, 23, 25, 26, 27, 29, 30, 32, 35, 36, 37, 42, 43, 44, 47, 48, 49, 56, 57, 61, 63, 64] +The cluster 2 contains the snippets: [2, 14, 24, 28, 33, 38, 39, 45, 46, 50, 51, 58, 60] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 14, 4, 24, 5, 28, 6, 33, 7, 38, 8, 39, 9, 45, 10, 46, 11, 50, 15, 51, 17, 58, 18, 60, 20, 23, 25, 26, 27, 29, 30, 32, 35, 36, 37, 42, 43, 44, 47, 48, 49, 56, 57, 61, 63, 64, 12, 13, 16, 19, 21, 22, 31, 34, 40, 41, 52, 53, 54, 55, 59, 62] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "noggin" =============== +============ Value of Rand Index = 0.6121031746031746 ================================= +============ Partial average Rand Index = 0.5243055555555556 ====== +============ Value of Adjusted Rand Index = 0.1843369043221278 ================================= +============ Partial average of Adjusted Rand Index = 0.10933776680601032 ================================= +============ Value of Jaccard Index = 0.33503401360544216 ================================= +============ Partial average of Jaccard Index = 0.36949660267322487 ====== +============ Precision = 0.6458333333333334, Recall = 0.484375, F1 = 0.5535714285714286 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 24.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 25 : "romeo and juliet" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +The cluster 2 contains the snippets: [53] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 53, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "romeo and juliet" =============== +============ Value of Rand Index = 0.42956349206349204 ================================= +============ Partial average Rand Index = 0.520515873015873 ====== +============ Value of Adjusted Rand Index = 0.03881314318549862 ================================= +============ Partial average of Adjusted Rand Index = 0.10651678186118986 ================================= +============ Value of Jaccard Index = 0.4117647058823529 ================================= +============ Partial average of Jaccard Index = 0.37118732680159006 ====== +============ Precision = 0.640625, Recall = 0.640625, F1 = 0.640625 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 32.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 26 : "yellow" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 6 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 9, 11, 13, 16, 18, 19, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 35, 36, 38, 39, 41, 43, 44, 45, 46, 47, 50, 52, 54, 55, 56, 57, 58, 59, 60] +The cluster 4 contains the snippets: [1, 4, 8, 12, 20, 21, 34, 49, 61, 64] +The cluster 6 contains the snippets: [6, 10, 14, 32, 40, 42, 48, 62] +The cluster 5 contains the snippets: [3, 7, 15, 17] +The cluster 2 contains the snippets: [37, 63] +The cluster 3 contains the snippets: [53] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 37, 53, 1, 3, 6, 9, 63, 4, 7, 10, 11, 8, 15, 14, 13, 12, 17, 32, 16, 20, 40, 18, 21, 42, 19, 34, 48, 22, 49, 62, 23, 61, 24, 64, 25, 26, 27, 28, 29, 30, 31, 33, 35, 36, 38, 39, 41, 43, 44, 45, 46, 47, 50, 52, 54, 55, 56, 57, 58, 59, 60, 5, 51] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "yellow" =============== +============ Value of Rand Index = 0.5674603174603174 ================================= +============ Partial average Rand Index = 0.5223214285714285 ====== +============ Value of Adjusted Rand Index = 0.1333623206410336 ================================= +============ Partial average of Adjusted Rand Index = 0.10754930258349155 ================================= +============ Value of Jaccard Index = 0.33435114503816793 ================================= +============ Partial average of Jaccard Index = 0.3697705505799199 ====== +============ Precision = 0.7580645161290323, Recall = 0.734375, F1 = 0.7460317460317459 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 6 ============ +============ average size of the created clusters: 10.333333333333334 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 27 : "bermuda triangle" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 3 contains the snippets: [1, 2, 5, 6, 7, 8, 11, 13, 14, 18, 19, 22, 23, 24, 25, 27, 32, 34, 35, 37, 38, 42, 43, 47, 54, 56, 58, 59, 60, 61] +The cluster 1 contains the snippets: [3, 4, 9, 10, 12, 16, 17, 20, 26, 28, 29, 30, 31, 33, 36, 39, 45, 46, 50, 51, 55, 57] +The cluster 2 contains the snippets: [49, 53, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 49, 1, 4, 53, 2, 9, 64, 5, 10, 6, 12, 7, 16, 8, 17, 11, 20, 13, 26, 14, 28, 18, 29, 19, 30, 22, 31, 23, 33, 24, 36, 25, 39, 27, 45, 32, 46, 34, 50, 35, 51, 37, 55, 38, 57, 42, 43, 47, 54, 56, 58, 59, 60, 61, 15, 21, 40, 41, 44, 48, 52, 62, 63] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "bermuda triangle" =============== +============ Value of Rand Index = 0.59375 ================================= +============ Partial average Rand Index = 0.5249669312169312 ====== +============ Value of Adjusted Rand Index = 0.15262817551963045 ================================= +============ Partial average of Adjusted Rand Index = 0.10921889047001519 ================================= +============ Value of Jaccard Index = 0.3157894736842105 ================================= +============ Partial average of Jaccard Index = 0.36777125143563444 ====== +============ Precision = 0.6909090909090909, Recall = 0.59375, F1 = 0.6386554621848739 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 18.333333333333332 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 28 : "black planet" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 15, 16, 18, 19, 20, 22, 24, 25, 27, 28, 30, 31, 32, 33, 34, 35, 37, 41, 43, 44, 45, 46, 47, 49, 50, 51, 53, 54, 55, 56, 58, 60, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 15, 16, 18, 19, 20, 22, 24, 25, 27, 28, 30, 31, 32, 33, 34, 35, 37, 41, 43, 44, 45, 46, 47, 49, 50, 51, 53, 54, 55, 56, 58, 60, 62, 63, 64, 11, 12, 14, 17, 21, 23, 26, 29, 36, 38, 39, 40, 42, 48, 52, 57, 59, 61] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "black planet" =============== +============ Value of Rand Index = 0.466765873015873 ================================= +============ Partial average Rand Index = 0.5228883219954648 ====== +============ Value of Adjusted Rand Index = -0.008746941921646151 ================================= +============ Partial average of Adjusted Rand Index = 0.10500582502745585 ================================= +============ Value of Jaccard Index = 0.2706919945725916 ================================= +============ Partial average of Jaccard Index = 0.36430413511909715 ====== +============ Precision = 0.4782608695652174, Recall = 0.34375, F1 = 0.4 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 46.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 29 : "chase" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 8 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 4, 14, 21, 23, 25, 29, 30, 31, 34, 35, 37, 41, 42, 48, 50, 51, 52, 56, 60, 63] +The cluster 5 contains the snippets: [1, 3, 5, 11, 15, 17, 20, 24, 28, 33, 39, 43, 44, 61] +The cluster 3 contains the snippets: [9, 13, 16, 18, 19, 26, 27, 40, 49, 58, 64] +The cluster 2 contains the snippets: [7, 22, 47, 53, 57, 62] +The cluster 8 contains the snippets: [6, 12, 36, 54, 55, 59] +The cluster 7 contains the snippets: [45, 46] +The cluster 6 contains the snippets: [10] +The cluster 4 contains the snippets: [8] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 7, 9, 8, 1, 10, 45, 6, 4, 22, 13, 3, 46, 12, 14, 47, 16, 5, 36, 21, 53, 18, 11, 54, 23, 57, 19, 15, 55, 25, 62, 26, 17, 59, 29, 27, 20, 30, 40, 24, 31, 49, 28, 34, 58, 33, 35, 64, 39, 37, 43, 41, 44, 42, 61, 48, 50, 51, 52, 56, 60, 63, 32, 38] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "chase" =============== +============ Value of Rand Index = 0.6016865079365079 ================================= +============ Partial average Rand Index = 0.525605500821018 ====== +============ Value of Adjusted Rand Index = 0.10323464110506936 ================================= +============ Partial average of Adjusted Rand Index = 0.10494474971978734 ================================= +============ Value of Jaccard Index = 0.20337301587301587 ================================= +============ Partial average of Jaccard Index = 0.3587547861795771 ====== +============ Precision = 0.6612903225806451, Recall = 0.640625, F1 = 0.6507936507936509 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 8 ============ +============ average size of the created clusters: 7.75 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 30 : "ice age" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 26, 28, 29, 30, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +The cluster 2 contains the snippets: [3, 5, 17, 27, 31, 37, 39] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 3, 2, 5, 4, 17, 6, 27, 7, 31, 8, 37, 9, 39, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 26, 28, 29, 30, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 25] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "ice age" =============== +============ Value of Rand Index = 0.3655753968253968 ================================= +============ Partial average Rand Index = 0.520271164021164 ====== +============ Value of Adjusted Rand Index = 0.05436322934423203 ================================= +============ Partial average of Adjusted Rand Index = 0.10325869904060217 ================================= +============ Value of Jaccard Index = 0.20559006211180125 ================================= +============ Partial average of Jaccard Index = 0.3536492953773179 ====== +============ Precision = 0.3492063492063492, Recall = 0.34375, F1 = 0.3464566929133858 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 31.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 31 : "ghost" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 8 snippet clusters: ==================== +The cluster 1 contains the snippets: [6, 14, 16, 17, 20, 24, 26, 27, 28, 34, 40, 41, 44, 53, 54, 57, 58, 59, 61, 62, 63] +The cluster 2 contains the snippets: [3, 5, 12, 18, 22, 23, 29, 30, 32, 38, 39, 43, 45, 46, 48, 55] +The cluster 3 contains the snippets: [1, 4, 10, 13, 19, 21, 25, 47, 51, 56] +The cluster 5 contains the snippets: [2, 11, 49, 52, 64] +The cluster 6 contains the snippets: [7, 15, 33, 37, 42] +The cluster 7 contains the snippets: [31, 35, 36] +The cluster 8 contains the snippets: [8, 9, 50] +The cluster 4 contains the snippets: [60] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [6, 3, 1, 60, 2, 7, 31, 8, 14, 5, 4, 11, 15, 35, 9, 16, 12, 10, 49, 33, 36, 50, 17, 18, 13, 52, 37, 20, 22, 19, 64, 42, 24, 23, 21, 26, 29, 25, 27, 30, 47, 28, 32, 51, 34, 38, 56, 40, 39, 41, 43, 44, 45, 53, 46, 54, 48, 57, 55, 58, 59, 61, 62, 63] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "ghost" =============== +============ Value of Rand Index = 0.7088293650793651 ================================= +============ Partial average Rand Index = 0.5263536866359446 ====== +============ Value of Adjusted Rand Index = 0.007254790107714515 ================================= +============ Partial average of Adjusted Rand Index = 0.10016179875244452 ================================= +============ Value of Jaccard Index = 0.09969325153374232 ================================= +============ Partial average of Jaccard Index = 0.34545716493075096 ====== +============ Precision = 0.40625, Recall = 0.40625, F1 = 0.40625 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 8 ============ +============ average size of the created clusters: 8.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 32 : "sisters of mercy" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 5, 6, 7, 9, 10, 11, 12, 14, 15, 17, 18, 20, 21, 23, 24, 25, 26, 28, 30, 31, 34, 35, 37, 38, 41, 42, 43, 44, 45, 46, 47, 49, 50, 51, 52, 53, 54, 55, 58, 59, 60, 61, 62, 63, 64] +The cluster 2 contains the snippets: [2, 3, 8, 13, 16, 19, 27, 29, 32, 33, 36, 39, 40, 48, 57] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 5, 3, 6, 8, 7, 13, 9, 16, 10, 19, 11, 27, 12, 29, 14, 32, 15, 33, 17, 36, 18, 39, 20, 40, 21, 48, 23, 57, 24, 25, 26, 28, 30, 31, 34, 35, 37, 38, 41, 42, 43, 44, 45, 46, 47, 49, 50, 51, 52, 53, 54, 55, 58, 59, 60, 61, 62, 63, 64, 4, 22, 56] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "sisters of mercy" =============== +============ Value of Rand Index = 0.9156746031746031 ================================= +============ Partial average Rand Index = 0.5385199652777778 ====== +============ Value of Adjusted Rand Index = 0.8305612658070143 ================================= +============ Partial average of Adjusted Rand Index = 0.12298678209789984 ================================= +============ Value of Jaccard Index = 0.8556876061120543 ================================= +============ Partial average of Jaccard Index = 0.3614018662176666 ====== +============ Precision = 0.9016393442622951, Recall = 0.859375, F1 = 0.88 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 30.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 33 : "indiana university" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 6, 10, 11, 13, 14, 15, 16, 19, 22, 23, 24, 25, 26, 27, 28, 34, 38, 39, 40, 43, 44, 46, 48, 49, 50, 51, 53, 55, 58, 59, 60, 62, 63] +The cluster 2 contains the snippets: [4, 7, 8, 9, 12, 17, 18, 20, 21, 29, 30, 31, 32, 33, 35, 36, 37, 41, 42, 47, 52, 54, 56, 57, 61, 64] +The cluster 3 contains the snippets: [5] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 4, 5, 2, 7, 3, 8, 6, 9, 10, 12, 11, 17, 13, 18, 14, 20, 15, 21, 16, 29, 19, 30, 22, 31, 23, 32, 24, 33, 25, 35, 26, 36, 27, 37, 28, 41, 34, 42, 38, 47, 39, 52, 40, 54, 43, 56, 44, 57, 46, 61, 48, 64, 49, 50, 51, 53, 55, 58, 59, 60, 62, 63, 45] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "indiana university" =============== +============ Value of Rand Index = 0.5079365079365079 ================================= +============ Partial average Rand Index = 0.5375931938431939 ====== +============ Value of Adjusted Rand Index = 0.037609731543301175 ================================= +============ Partial average of Adjusted Rand Index = 0.12039959874776049 ================================= +============ Value of Jaccard Index = 0.41440377804014167 ================================= +============ Partial average of Jaccard Index = 0.36300798475774165 ====== +============ Precision = 0.8571428571428571, Recall = 0.84375, F1 = 0.8503937007874015 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 21.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 34 : "fandango" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 6, 7, 8, 12, 15, 16, 17, 18, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 58, 59, 60, 61, 62, 64] +The cluster 2 contains the snippets: [5, 11, 13, 21, 57] +The cluster 3 contains the snippets: [9, 19, 20] +The cluster 4 contains the snippets: [10, 56, 63] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 5, 9, 10, 2, 11, 19, 56, 3, 13, 20, 63, 4, 21, 6, 57, 7, 8, 12, 15, 16, 17, 18, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 58, 59, 60, 61, 62, 64, 14, 44, 45, 46, 47, 48] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "fandango" =============== +============ Value of Rand Index = 0.7068452380952381 ================================= +============ Partial average Rand Index = 0.5425711951447247 ====== +============ Value of Adjusted Rand Index = 0.41518695075117995 ================================= +============ Partial average of Adjusted Rand Index = 0.12906981498315517 ================================= +============ Value of Jaccard Index = 0.5599404318689502 ================================= +============ Partial average of Jaccard Index = 0.3688001155551302 ====== +============ Precision = 0.7931034482758621, Recall = 0.71875, F1 = 0.7540983606557378 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 14.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 35 : "nickelodeon" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 46, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +The cluster 2 contains the snippets: [45, 50] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 45, 2, 50, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 46, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 28] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "nickelodeon" =============== +============ Value of Rand Index = 0.5401785714285714 ================================= +============ Partial average Rand Index = 0.5425028344671203 ====== +============ Value of Adjusted Rand Index = 0.018336537552396816 ================================= +============ Partial average of Adjusted Rand Index = 0.12590600705656207 ================================= +============ Value of Jaccard Index = 0.5176899063475546 ================================= +============ Partial average of Jaccard Index = 0.37305410957777085 ====== +============ Precision = 0.7301587301587301, Recall = 0.71875, F1 = 0.7244094488188977 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 31.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 36 : "soul food" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 15, 16, 17, 18, 19, 24, 27, 28, 29, 31, 35, 36, 37, 38, 39, 41, 42, 46, 47, 49, 51, 53, 54, 55, 56, 57, 59, 61, 62, 64] +The cluster 3 contains the snippets: [12, 13, 14, 23, 26, 32, 34, 40, 43, 44, 45, 48, 50, 52, 60, 63] +The cluster 2 contains the snippets: [20, 22, 30, 33, 58] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 20, 12, 2, 22, 13, 3, 30, 14, 4, 33, 23, 5, 58, 26, 6, 32, 7, 34, 8, 40, 9, 43, 10, 44, 11, 45, 15, 48, 16, 50, 17, 52, 18, 60, 19, 63, 24, 27, 28, 29, 31, 35, 36, 37, 38, 39, 41, 42, 46, 47, 49, 51, 53, 54, 55, 56, 57, 59, 61, 62, 64, 21, 25] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "soul food" =============== +============ Value of Rand Index = 0.5208333333333334 ================================= +============ Partial average Rand Index = 0.5419009038800707 ====== +============ Value of Adjusted Rand Index = 0.0370750549584215 ================================= +============ Partial average of Adjusted Rand Index = 0.12343848060939148 ================================= +============ Value of Jaccard Index = 0.31971830985915495 ================================= +============ Partial average of Jaccard Index = 0.37157255958558705 ====== +============ Precision = 0.6451612903225806, Recall = 0.625, F1 = 0.634920634920635 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 20.666666666666668 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 37 : "judas" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [3, 6, 9, 10, 12, 13, 14, 15, 18, 20, 21, 22, 23, 24, 29, 30, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 46, 47, 48, 49, 55, 56, 58, 59, 64] +The cluster 2 contains the snippets: [1, 2, 4, 5, 7, 8, 11, 16, 17, 19, 25, 26, 27, 28, 31, 32, 38, 42, 45, 50, 52, 53, 54, 57, 60, 61, 62, 63] +The cluster 3 contains the snippets: [51] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 1, 51, 6, 2, 9, 4, 10, 5, 12, 7, 13, 8, 14, 11, 15, 16, 18, 17, 20, 19, 21, 25, 22, 26, 23, 27, 24, 28, 29, 31, 30, 32, 33, 38, 34, 42, 35, 45, 36, 50, 37, 52, 39, 53, 40, 54, 41, 57, 43, 60, 44, 61, 46, 62, 47, 63, 48, 49, 55, 56, 58, 59, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "judas" =============== +============ Value of Rand Index = 0.5808531746031746 ================================= +============ Partial average Rand Index = 0.5429536679536681 ====== +============ Value of Adjusted Rand Index = 0.13862185159490875 ================================= +============ Partial average of Adjusted Rand Index = 0.12384884198737844 ================================= +============ Value of Jaccard Index = 0.1748046875 ================================= +============ Partial average of Jaccard Index = 0.3662545089886793 ====== +============ Precision = 0.3125, Recall = 0.3125, F1 = 0.3125 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 21.333333333333332 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 38 : "jungle fever" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 5, 7, 8, 10, 13, 15, 16, 17, 18, 20, 22, 24, 25, 26, 30, 32, 33, 34, 35, 37, 40, 41, 42, 43, 46, 48, 50, 52, 58, 61, 62, 63] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 4, 5, 7, 8, 10, 13, 15, 16, 17, 18, 20, 22, 24, 25, 26, 30, 32, 33, 34, 35, 37, 40, 41, 42, 43, 46, 48, 50, 52, 58, 61, 62, 63, 3, 6, 9, 11, 12, 14, 19, 21, 23, 27, 28, 29, 31, 36, 38, 39, 44, 45, 47, 49, 51, 53, 54, 55, 56, 57, 59, 60, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "jungle fever" =============== +============ Value of Rand Index = 0.5793650793650794 ================================= +============ Partial average Rand Index = 0.5439118629908105 ====== +============ Value of Adjusted Rand Index = 0.15677243379484165 ================================= +============ Partial average of Adjusted Rand Index = 0.12471525229810117 ================================= +============ Value of Jaccard Index = 0.326984126984127 ================================= +============ Partial average of Jaccard Index = 0.36522107788329644 ====== +============ Precision = 0.5714285714285714, Recall = 0.3125, F1 = 0.404040404040404 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 35.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 39 : "bald eagle" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 5, 6, 8, 9, 10, 11, 12, 13, 16, 17, 18, 19, 21, 22, 27, 28, 29, 31, 32, 34, 35, 37, 39, 41, 43, 44, 45, 46, 51, 53, 54, 56, 57, 58, 59, 60, 61, 64] +The cluster 2 contains the snippets: [4, 7, 14, 15, 20, 23, 24, 25, 26, 30, 33, 36, 42, 47, 48, 49, 50, 52, 55, 62, 63] +The cluster 3 contains the snippets: [38, 40] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 4, 38, 2, 7, 40, 3, 14, 5, 15, 6, 20, 8, 23, 9, 24, 10, 25, 11, 26, 12, 30, 13, 33, 16, 36, 17, 42, 18, 47, 19, 48, 21, 49, 22, 50, 27, 52, 28, 55, 29, 62, 31, 63, 32, 34, 35, 37, 39, 41, 43, 44, 45, 46, 51, 53, 54, 56, 57, 58, 59, 60, 61, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "bald eagle" =============== +============ Value of Rand Index = 0.5882936507936508 ================================= +============ Partial average Rand Index = 0.5450498575498577 ====== +============ Value of Adjusted Rand Index = 0.16706572459129343 ================================= +============ Partial average of Adjusted Rand Index = 0.12580116184408047 ================================= +============ Value of Jaccard Index = 0.5080023710729105 ================================= +============ Partial average of Jaccard Index = 0.36888213668303005 ====== +============ Precision = 0.859375, Recall = 0.859375, F1 = 0.859375 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 21.333333333333332 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 40 : "boomerang" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 10 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 6, 7, 9, 19, 22, 23, 27, 29, 31, 35, 40, 44, 49, 51, 52, 55, 56, 60] +The cluster 3 contains the snippets: [8, 12, 14, 15, 34, 36, 37, 42, 57] +The cluster 2 contains the snippets: [4, 17, 18, 21, 24, 33, 62] +The cluster 6 contains the snippets: [3, 11, 26, 38, 43, 48] +The cluster 4 contains the snippets: [13, 16, 28, 45, 54] +The cluster 9 contains the snippets: [32, 39, 41, 47] +The cluster 7 contains the snippets: [46, 53, 64] +The cluster 10 contains the snippets: [10, 30, 58] +The cluster 5 contains the snippets: [5, 61] +The cluster 8 contains the snippets: [63] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 4, 8, 13, 5, 3, 46, 63, 32, 10, 6, 17, 12, 16, 61, 11, 53, 39, 30, 7, 18, 14, 28, 26, 64, 41, 58, 9, 21, 15, 45, 38, 47, 19, 24, 34, 54, 43, 22, 33, 36, 48, 23, 62, 37, 27, 42, 29, 57, 31, 35, 40, 44, 49, 51, 52, 55, 56, 60, 1, 20, 25, 50, 59] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "boomerang" =============== +============ Value of Rand Index = 0.685515873015873 ================================= +============ Partial average Rand Index = 0.548561507936508 ====== +============ Value of Adjusted Rand Index = 0.01469010175763184 ================================= +============ Partial average of Adjusted Rand Index = 0.12302338534191923 ================================= +============ Value of Jaccard Index = 0.10451977401129943 ================================= +============ Partial average of Jaccard Index = 0.36227307761623684 ====== +============ Precision = 0.559322033898305, Recall = 0.515625, F1 = 0.5365853658536586 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 10 ============ +============ average size of the created clusters: 5.9 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 41 : "far cry" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 2 contains the snippets: [1, 3, 4, 5, 6, 9, 10, 12, 13, 15, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 63, 64] +The cluster 1 contains the snippets: [14, 16, 43, 45, 53] +The cluster 3 contains the snippets: [8, 11] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [14, 1, 8, 16, 3, 11, 43, 4, 45, 5, 53, 6, 9, 10, 12, 13, 15, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 63, 64, 2, 7, 25, 29, 61, 62] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "far cry" =============== +============ Value of Rand Index = 0.6865079365079365 ================================= +============ Partial average Rand Index = 0.5519260549748356 ====== +============ Value of Adjusted Rand Index = 0.21245424415233788 ================================= +============ Partial average of Adjusted Rand Index = 0.12520462580070993 ================================= +============ Value of Jaccard Index = 0.6535087719298246 ================================= +============ Partial average of Jaccard Index = 0.3693763872336414 ====== +============ Precision = 0.9310344827586207, Recall = 0.84375, F1 = 0.8852459016393444 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 19.333333333333332 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 42 : "harry potter" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +The cluster 2 contains the snippets: [7, 32, 53] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 7, 2, 32, 3, 53, 4, 5, 6, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "harry potter" =============== +============ Value of Rand Index = 0.30853174603174605 ================================= +============ Partial average Rand Index = 0.5461309523809526 ====== +============ Value of Adjusted Rand Index = 8.085109106307142E-4 ================================= +============ Partial average of Adjusted Rand Index = 0.12224281354142232 ================================= +============ Value of Jaccard Index = 0.25890483785220625 ================================= +============ Partial average of Jaccard Index = 0.36674611224836917 ====== +============ Precision = 0.390625, Recall = 0.390625, F1 = 0.390625 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 32.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 43 : "atom" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 0 snippet clusters: ==================== + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "atom" =============== +============ Value of Rand Index = 0.33134920634920634 ================================= +============ Partial average Rand Index = 0.5411360280546329 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.11939995741255204 ================================= +============ Value of Jaccard Index = 0.33134920634920634 ================================= +============ Partial average of Jaccard Index = 0.3659229283902491 ====== +============ Precision = 0.0, Recall = 0.0, F1 = 0.0 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 0 ============ +============ average size of the created clusters: 0.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 44 : "eros" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 0 snippet clusters: ==================== + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "eros" =============== +============ Value of Rand Index = 0.21626984126984128 ================================= +============ Partial average Rand Index = 0.5337527056277058 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.11668632201681221 ================================= +============ Value of Jaccard Index = 0.21626984126984128 ================================= +============ Partial average of Jaccard Index = 0.3625217218647853 ====== +============ Precision = 0.0, Recall = 0.0, F1 = 0.0 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 0 ============ +============ average size of the created clusters: 0.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 45 : "magic" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 8 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 8, 9, 10, 11, 12, 15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 35, 37, 39, 41, 42, 43, 44, 45, 46, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 59, 60, 61, 62, 63, 64] +The cluster 4 contains the snippets: [13, 21, 38] +The cluster 7 contains the snippets: [14, 40, 58] +The cluster 6 contains the snippets: [22, 32] +The cluster 5 contains the snippets: [34] +The cluster 2 contains the snippets: [7] +The cluster 3 contains the snippets: [36] +The cluster 8 contains the snippets: [47] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 7, 36, 13, 34, 22, 14, 47, 2, 21, 32, 40, 3, 38, 58, 4, 5, 6, 8, 9, 10, 11, 12, 15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 35, 37, 39, 41, 42, 43, 44, 45, 46, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "magic" =============== +============ Value of Rand Index = 0.3933531746031746 ================================= +============ Partial average Rand Index = 0.5306327160493829 ====== +============ Value of Adjusted Rand Index = 0.02647842478247893 ================================= +============ Partial average of Adjusted Rand Index = 0.11468170207827147 ================================= +============ Value of Jaccard Index = 0.12455261274158912 ================================= +============ Partial average of Jaccard Index = 0.35723351943982534 ====== +============ Precision = 0.34375, Recall = 0.34375, F1 = 0.34375 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 8 ============ +============ average size of the created clusters: 8.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 46 : "carrot top" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [11, 22, 44, 47] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [11, 22, 44, 47, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 45, 46, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "carrot top" =============== +============ Value of Rand Index = 0.6949404761904762 ================================= +============ Partial average Rand Index = 0.5342046238785372 ====== +============ Value of Adjusted Rand Index = 0.29931640625000006 ================================= +============ Partial average of Adjusted Rand Index = 0.11869549999504816 ================================= +============ Value of Jaccard Index = 0.6554621848739496 ================================= +============ Partial average of Jaccard Index = 0.36371675129708886 ====== +============ Precision = 0.75, Recall = 0.046875, F1 = 0.08823529411764706 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 4.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 47 : "mannequin" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 4, 5, 9, 10, 12, 14, 21, 22, 28, 29, 30, 31, 34, 35, 36, 38, 39, 40, 43, 46, 47, 51, 54, 55, 58, 59, 61, 62, 63] +The cluster 3 contains the snippets: [1, 11, 17, 18, 26, 27, 32, 37, 42, 49, 52, 60, 64] +The cluster 4 contains the snippets: [6, 13, 15, 16, 20, 23, 33, 41, 48, 53] +The cluster 2 contains the snippets: [8, 19, 24, 44, 50, 56] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 8, 1, 6, 3, 19, 11, 13, 4, 24, 17, 15, 5, 44, 18, 16, 9, 50, 26, 20, 10, 56, 27, 23, 12, 32, 33, 14, 37, 41, 21, 42, 48, 22, 49, 53, 28, 52, 29, 60, 30, 64, 31, 34, 35, 36, 38, 39, 40, 43, 46, 47, 51, 54, 55, 58, 59, 61, 62, 63, 7, 25, 45, 57] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "mannequin" =============== +============ Value of Rand Index = 0.6483134920634921 ================================= +============ Partial average Rand Index = 0.5366324721377915 ====== +============ Value of Adjusted Rand Index = 0.11788491446345256 ================================= +============ Partial average of Adjusted Rand Index = 0.11867825349437593 ================================= +============ Value of Jaccard Index = 0.2165745856353591 ================================= +============ Partial average of Jaccard Index = 0.3605860669213074 ====== +============ Precision = 0.48333333333333334, Recall = 0.453125, F1 = 0.46774193548387094 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 15.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 48 : "the last supper" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the last supper" =============== +============ Value of Rand Index = 0.27331349206349204 ================================= +============ Partial average Rand Index = 0.5311466600529102 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.11620578987990976 ================================= +============ Value of Jaccard Index = 0.27331349206349204 ================================= +============ Partial average of Jaccard Index = 0.3587678882784362 ====== +============ Precision = 0.46875, Recall = 0.46875, F1 = 0.46875 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 64.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 49 : "bausch" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 7, 8, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 44, 46, 47, 49, 50, 51, 52, 53, 56, 57, 58, 59, 60, 61, 62, 63, 64] +The cluster 2 contains the snippets: [3, 9, 10, 11, 15, 30, 32, 36, 45, 48, 54, 55] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 3, 2, 9, 4, 10, 7, 11, 8, 15, 12, 30, 13, 32, 14, 36, 16, 45, 17, 48, 18, 54, 19, 55, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 44, 46, 47, 49, 50, 51, 52, 53, 56, 57, 58, 59, 60, 61, 62, 63, 64, 5, 6] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "bausch" =============== +============ Value of Rand Index = 0.65625 ================================= +============ Partial average Rand Index = 0.5336997894395854 ====== +============ Value of Adjusted Rand Index = 0.36617924066069263 ================================= +============ Partial average of Adjusted Rand Index = 0.12130728887543599 ================================= +============ Value of Jaccard Index = 0.48475836431226765 ================================= +============ Partial average of Jaccard Index = 0.3613391224832084 ====== +============ Precision = 0.7419354838709677, Recall = 0.71875, F1 = 0.7301587301587302 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 31.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 50 : "coyote ugly" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 3, 5, 6, 7, 8, 9, 10, 11, 12, 13, 18, 19, 21, 25, 29, 30, 31, 32, 33, 34, 40, 41, 42, 44, 45, 46, 47, 50, 52, 53, 54, 55, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 3, 5, 6, 7, 8, 9, 10, 11, 12, 13, 18, 19, 21, 25, 29, 30, 31, 32, 33, 34, 40, 41, 42, 44, 45, 46, 47, 50, 52, 53, 54, 55, 58, 59, 60, 61, 62, 63, 64, 2, 4, 14, 15, 16, 17, 20, 22, 23, 24, 26, 27, 28, 35, 36, 37, 38, 39, 43, 48, 49, 51, 56, 57] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "coyote ugly" =============== +============ Value of Rand Index = 0.49255952380952384 ================================= +============ Partial average Rand Index = 0.532876984126984 ====== +============ Value of Adjusted Rand Index = -0.009776733254994147 ================================= +============ Partial average of Adjusted Rand Index = 0.11868560843282738 ================================= +============ Value of Jaccard Index = 0.31342281879194633 ================================= +============ Partial average of Jaccard Index = 0.3603807964093831 ====== +============ Precision = 0.55, Recall = 0.34375, F1 = 0.42307692307692313 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 40.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 51 : "stand by me" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [3, 5, 7, 8, 9, 12, 14, 15, 16, 17, 18, 19, 21, 23, 26, 27, 28, 29, 31, 32, 33, 34, 36, 37, 40, 41, 45, 47, 48, 51, 52, 53, 54, 55, 57, 58, 60, 61, 62] +The cluster 2 contains the snippets: [1, 2, 4, 6, 10, 11, 13, 20, 22, 24, 30, 35, 38, 39, 42, 46, 49, 50, 56, 59, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 1, 5, 2, 7, 4, 8, 6, 9, 10, 12, 11, 14, 13, 15, 20, 16, 22, 17, 24, 18, 30, 19, 35, 21, 38, 23, 39, 26, 42, 27, 46, 28, 49, 29, 50, 31, 56, 32, 59, 33, 63, 34, 64, 36, 37, 40, 41, 45, 47, 48, 51, 52, 53, 54, 55, 57, 58, 60, 61, 62, 25, 43, 44] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "stand by me" =============== +============ Value of Rand Index = 0.5178571428571429 ================================= +============ Partial average Rand Index = 0.5325824774354185 ====== +============ Value of Adjusted Rand Index = 0.02324705037907674 ================================= +============ Partial average of Adjusted Rand Index = 0.11681426415726363 ================================= +============ Value of Jaccard Index = 0.24121779859484777 ================================= +============ Partial average of Jaccard Index = 0.3580442670404707 ====== +============ Precision = 0.5081967213114754, Recall = 0.484375, F1 = 0.496 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 30.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 52 : "shockwave" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 8 snippet clusters: ==================== +The cluster 6 contains the snippets: [1, 2, 3, 4, 7, 8, 13, 16, 17, 19, 21, 23, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 37, 38, 40, 42, 43, 44, 45, 46, 47, 49, 51, 52, 61, 62] +The cluster 1 contains the snippets: [6, 9, 11, 12, 14, 15, 24, 32, 36, 41, 48, 50, 55, 56, 57, 58, 60, 63] +The cluster 7 contains the snippets: [10, 18] +The cluster 8 contains the snippets: [5, 20] +The cluster 5 contains the snippets: [39] +The cluster 2 contains the snippets: [54] +The cluster 3 contains the snippets: [64] +The cluster 4 contains the snippets: [59] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [6, 54, 64, 59, 39, 1, 10, 5, 9, 2, 18, 20, 11, 3, 12, 4, 14, 7, 15, 8, 24, 13, 32, 16, 36, 17, 41, 19, 48, 21, 50, 23, 55, 25, 56, 26, 57, 27, 58, 28, 60, 29, 63, 30, 31, 33, 34, 35, 37, 38, 40, 42, 43, 44, 45, 46, 47, 49, 51, 52, 61, 62, 22, 53] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "shockwave" =============== +============ Value of Rand Index = 0.6731150793650794 ================================= +============ Partial average Rand Index = 0.5352850274725274 ====== +============ Value of Adjusted Rand Index = 0.26874021624977706 ================================= +============ Partial average of Adjusted Rand Index = 0.11973591708211967 ================================= +============ Value of Jaccard Index = 0.33028455284552843 ================================= +============ Partial average of Jaccard Index = 0.3575104263828755 ====== +============ Precision = 0.5483870967741935, Recall = 0.53125, F1 = 0.5396825396825397 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 8 ============ +============ average size of the created clusters: 7.75 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 53 : "texas rangers" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 6, 7, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 26, 30, 32, 33, 34, 35, 36, 38, 39, 40, 41, 43, 44, 45, 46, 47, 49, 50, 51, 53, 54, 57, 58, 59, 60, 61, 62, 63, 64] +The cluster 2 contains the snippets: [5, 8, 10, 24, 27, 28, 29, 31, 37, 42, 48, 52, 55, 56] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 5, 2, 8, 3, 10, 4, 24, 6, 27, 7, 28, 9, 29, 11, 31, 12, 37, 13, 42, 14, 48, 15, 52, 16, 55, 17, 56, 18, 19, 20, 21, 22, 23, 26, 30, 32, 33, 34, 35, 36, 38, 39, 40, 41, 43, 44, 45, 46, 47, 49, 50, 51, 53, 54, 57, 58, 59, 60, 61, 62, 63, 64, 25] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "texas rangers" =============== +============ Value of Rand Index = 0.71875 ================================= +============ Partial average Rand Index = 0.5387466307277629 ====== +============ Value of Adjusted Rand Index = 0.39888682745825604 ================================= +============ Partial average of Adjusted Rand Index = 0.12500291539110336 ================================= +============ Value of Jaccard Index = 0.6334841628959276 ================================= +============ Partial average of Jaccard Index = 0.3627174780151973 ====== +============ Precision = 0.8095238095238095, Recall = 0.796875, F1 = 0.8031496062992126 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 31.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 54 : "john carroll" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 5, 7, 8, 9, 10, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64] +The cluster 2 contains the snippets: [3, 6, 32, 40, 61] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 3, 2, 6, 4, 32, 5, 40, 7, 61, 8, 9, 10, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 11, 12, 18] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "john carroll" =============== +============ Value of Rand Index = 0.42857142857142855 ================================= +============ Partial average Rand Index = 0.5367063492063493 ====== +============ Value of Adjusted Rand Index = 0.06604285752202352 ================================= +============ Partial average of Adjusted Rand Index = 0.12391106246760189 ================================= +============ Value of Jaccard Index = 0.30097087378640774 ================================= +============ Partial average of Jaccard Index = 0.3615740223813309 ====== +============ Precision = 0.47540983606557374, Recall = 0.453125, F1 = 0.46399999999999997 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 30.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 55 : "courtney cox" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "courtney cox" =============== +============ Value of Rand Index = 0.5124007936507936 ================================= +============ Partial average Rand Index = 0.53626443001443 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.12165813405910005 ================================= +============ Value of Jaccard Index = 0.5124007936507936 ================================= +============ Partial average of Jaccard Index = 0.36431632731350294 ====== +============ Precision = 0.671875, Recall = 0.671875, F1 = 0.671875 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 64.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 56 : "man in black" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 4 contains the snippets: [1, 2, 4, 5, 11, 12, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 34, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 61] +The cluster 1 contains the snippets: [3, 6, 7, 8, 9, 10, 15, 26, 59, 62, 63, 64] +The cluster 2 contains the snippets: [33, 36, 53] +The cluster 3 contains the snippets: [35, 60] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 33, 35, 1, 6, 36, 60, 2, 7, 53, 4, 8, 5, 9, 11, 10, 12, 15, 13, 26, 14, 59, 16, 62, 17, 63, 19, 64, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 34, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 61, 18, 47] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "man in black" =============== +============ Value of Rand Index = 0.8774801587301587 ================================= +============ Partial average Rand Index = 0.542357568027211 ====== +============ Value of Adjusted Rand Index = 0.7537012672252614 ================================= +============ Partial average of Adjusted Rand Index = 0.13294461857992432 ================================= +============ Value of Jaccard Index = 0.7953603976801988 ================================= +============ Partial average of Jaccard Index = 0.3720135428557653 ====== +============ Precision = 0.8387096774193549, Recall = 0.8125, F1 = 0.8253968253968254 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 15.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 57 : "hoover" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +The cluster 3 contains the snippets: [15, 47] +The cluster 2 contains the snippets: [9] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 9, 15, 2, 47, 3, 4, 5, 6, 7, 8, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "hoover" =============== +============ Value of Rand Index = 0.20833333333333334 ================================= +============ Partial average Rand Index = 0.536497493734336 ====== +============ Value of Adjusted Rand Index = 0.01849030703293016 ================================= +============ Partial average of Adjusted Rand Index = 0.13093664820190687 ================================= +============ Value of Jaccard Index = 0.13213703099510604 ================================= +============ Partial average of Jaccard Index = 0.36780518299856074 ====== +============ Precision = 0.296875, Recall = 0.296875, F1 = 0.296875 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 21.333333333333332 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 58 : "apache" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 2 contains the snippets: [1, 2, 4, 6, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 43, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64] +The cluster 1 contains the snippets: [3, 5, 7, 8, 9, 42, 44] +The cluster 3 contains the snippets: [10, 17, 61] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 1, 10, 5, 2, 17, 7, 4, 61, 8, 6, 9, 11, 42, 12, 44, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 43, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "apache" =============== +============ Value of Rand Index = 0.5858134920634921 ================================= +============ Partial average Rand Index = 0.5373477695675973 ====== +============ Value of Adjusted Rand Index = 0.2913433559650825 ================================= +============ Partial average of Adjusted Rand Index = 0.13370228109437543 ================================= +============ Value of Jaccard Index = 0.426904598490048 ================================= +============ Partial average of Jaccard Index = 0.36882413843806916 ====== +============ Precision = 0.546875, Recall = 0.546875, F1 = 0.546875 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 21.333333333333332 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 59 : "fort recovery" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 5, 8, 9, 10, 12, 13, 14, 17, 18, 19, 21, 25, 26, 27, 29, 31, 32, 33, 37, 43, 44, 46, 47, 48, 49, 50, 53, 54, 55, 57, 59, 60, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 4, 5, 8, 9, 10, 12, 13, 14, 17, 18, 19, 21, 25, 26, 27, 29, 31, 32, 33, 37, 43, 44, 46, 47, 48, 49, 50, 53, 54, 55, 57, 59, 60, 63, 64, 3, 6, 7, 11, 15, 16, 20, 22, 23, 24, 28, 30, 34, 35, 36, 38, 39, 40, 41, 42, 45, 51, 52, 56, 58, 61, 62] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "fort recovery" =============== +============ Value of Rand Index = 0.5014880952380952 ================================= +============ Partial average Rand Index = 0.5367399784772668 ====== +============ Value of Adjusted Rand Index = 3.907498845511382E-4 ================================= +============ Partial average of Adjusted Rand Index = 0.13144276361624282 ================================= +============ Value of Jaccard Index = 0.39494280553883204 ================================= +============ Partial average of Jaccard Index = 0.36926682771096353 ====== +============ Precision = 0.7837837837837838, Recall = 0.453125, F1 = 0.5742574257425742 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 37.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 60 : "strongman" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63, 64] +The cluster 3 contains the snippets: [16, 32, 52, 59] +The cluster 2 contains the snippets: [28, 40] +The cluster 4 contains the snippets: [26] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 28, 16, 26, 2, 40, 32, 3, 52, 4, 59, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "strongman" =============== +============ Value of Rand Index = 0.5119047619047619 ================================= +============ Partial average Rand Index = 0.5363260582010584 ====== +============ Value of Adjusted Rand Index = 0.09923906755579849 ================================= +============ Partial average of Adjusted Rand Index = 0.13090603534856873 ================================= +============ Value of Jaccard Index = 0.4298957126303592 ================================= +============ Partial average of Jaccard Index = 0.37027730912628676 ====== +============ Precision = 0.625, Recall = 0.625, F1 = 0.625 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 16.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 61 : "lemonade stand" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "lemonade stand" =============== +============ Value of Rand Index = 0.3298611111111111 ================================= +============ Partial average Rand Index = 0.5329413869372887 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.12876003476908401 ================================= +============ Value of Jaccard Index = 0.3298611111111111 ================================= +============ Partial average of Jaccard Index = 0.36961474850308706 ====== +============ Precision = 0.375, Recall = 0.375, F1 = 0.375 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 64.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 62 : "the da vinci code" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 12, 18, 30, 35] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the da vinci code" =============== +============ Value of Rand Index = 0.37648809523809523 ================================= +============ Partial average Rand Index = 0.530417946748592 ====== +============ Value of Adjusted Rand Index = 0.0626065340909091 ================================= +============ Partial average of Adjusted Rand Index = 0.12769304282266183 ================================= +============ Value of Jaccard Index = 0.30244173140954494 ================================= +============ Partial average of Jaccard Index = 0.3685313127435138 ====== +============ Precision = 0.4666666666666667, Recall = 0.4375, F1 = 0.45161290322580644 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 60.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 63 : "sherlock holmes" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "sherlock holmes" =============== +============ Value of Rand Index = 0.18551587301587302 ================================= +============ Partial average Rand Index = 0.5249433106575965 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.12566616912706402 ================================= +============ Value of Jaccard Index = 0.18551587301587302 ================================= +============ Partial average of Jaccard Index = 0.36562630576370997 ====== +============ Precision = 0.359375, Recall = 0.359375, F1 = 0.359375 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 64.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 64 : "ten commandments" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 5, 7, 8, 9, 10, 12, 13, 19, 20, 21, 23, 28, 30, 31, 32, 33, 34, 35, 36, 39, 40, 41, 42, 43, 46, 47, 49, 51, 54, 57, 60, 61, 62, 63, 64] +The cluster 2 contains the snippets: [1, 6, 17, 18, 22, 27, 37, 45, 50, 53, 56, 59] +The cluster 3 contains the snippets: [4, 11, 14, 15, 29, 44, 55, 58] +The cluster 4 contains the snippets: [16, 24, 38, 48, 52] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 1, 4, 16, 3, 6, 11, 24, 5, 17, 14, 38, 7, 18, 15, 48, 8, 22, 29, 52, 9, 27, 44, 10, 37, 55, 12, 45, 58, 13, 50, 19, 53, 20, 56, 21, 59, 23, 28, 30, 31, 32, 33, 34, 35, 36, 39, 40, 41, 42, 43, 46, 47, 49, 51, 54, 57, 60, 61, 62, 63, 64, 25, 26] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "ten commandments" =============== +============ Value of Rand Index = 0.6056547619047619 ================================= +============ Partial average Rand Index = 0.5262044270833335 ====== +============ Value of Adjusted Rand Index = 0.16412679538129363 ================================= +============ Partial average of Adjusted Rand Index = 0.12626711641228638 ================================= +============ Value of Jaccard Index = 0.3181818181818182 ================================= +============ Partial average of Jaccard Index = 0.36488498564524297 ====== +============ Precision = 0.6451612903225806, Recall = 0.625, F1 = 0.634920634920635 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 15.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 65 : "agent orange" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 7, 9, 10, 11, 12, 13, 14, 16, 18, 19, 21, 22, 23, 24, 27, 29, 30, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 47, 48, 49, 51, 53, 55, 57, 58, 59, 61, 62, 64] +The cluster 2 contains the snippets: [8, 17, 20, 50, 54, 56, 60] +The cluster 3 contains the snippets: [6, 15, 45, 46] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 8, 6, 2, 17, 15, 3, 20, 45, 4, 50, 46, 5, 54, 7, 56, 9, 60, 10, 11, 12, 13, 14, 16, 18, 19, 21, 22, 23, 24, 27, 29, 30, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 47, 48, 49, 51, 53, 55, 57, 58, 59, 61, 62, 64, 25, 26, 28, 33, 37, 44, 52, 63] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "agent orange" =============== +============ Value of Rand Index = 0.7723214285714286 ================================= +============ Partial average Rand Index = 0.5299908424908426 ====== +============ Value of Adjusted Rand Index = 0.5413021581022025 ================================= +============ Partial average of Adjusted Rand Index = 0.13265227089982354 ================================= +============ Value of Jaccard Index = 0.661504424778761 ================================= +============ Partial average of Jaccard Index = 0.36944836163191236 ====== +============ Precision = 0.875, Recall = 0.765625, F1 = 0.8166666666666667 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 18.666666666666668 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 66 : "heron island" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 7, 8, 10, 11, 12, 13, 17, 18, 23, 24, 25, 26, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 50, 51, 53, 54, 55, 57, 58, 60, 61, 62, 63] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 7, 8, 10, 11, 12, 13, 17, 18, 23, 24, 25, 26, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 50, 51, 53, 54, 55, 57, 58, 60, 61, 62, 63, 6, 9, 14, 15, 16, 19, 20, 21, 22, 27, 28, 32, 42, 43, 44, 45, 46, 47, 48, 49, 52, 56, 59, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "heron island" =============== +============ Value of Rand Index = 0.5238095238095238 ================================= +============ Partial average Rand Index = 0.5298971861471864 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.13064238800740197 ================================= +============ Value of Jaccard Index = 0.5238095238095238 ================================= +============ Partial average of Jaccard Index = 0.371787167119452 ====== +============ Precision = 1.0, Recall = 0.625, F1 = 0.7692307692307693 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 40.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 67 : "mortal kombat" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "mortal kombat" =============== +============ Value of Rand Index = 0.2718253968253968 ================================= +============ Partial average Rand Index = 0.5260453683961149 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.1286925016192318 ================================= +============ Value of Jaccard Index = 0.2718253968253968 ================================= +============ Partial average of Jaccard Index = 0.3702952003986451 ====== +============ Precision = 0.375, Recall = 0.375, F1 = 0.375 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 64.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 68 : "marble" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 8 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 10, 12, 13, 14, 16, 17, 19, 20, 21, 22, 23, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 54, 59, 60, 61, 62, 63, 64] +The cluster 5 contains the snippets: [11, 24, 25, 27, 41] +The cluster 4 contains the snippets: [15, 26, 55, 58] +The cluster 2 contains the snippets: [18, 46, 57] +The cluster 3 contains the snippets: [9] +The cluster 6 contains the snippets: [32] +The cluster 7 contains the snippets: [8] +The cluster 8 contains the snippets: [56] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 18, 9, 15, 11, 32, 8, 56, 2, 46, 26, 24, 3, 57, 55, 25, 4, 58, 27, 5, 41, 6, 7, 10, 12, 13, 14, 16, 17, 19, 20, 21, 22, 23, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 54, 59, 60, 61, 62, 63, 64, 52] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "marble" =============== +============ Value of Rand Index = 0.49255952380952384 ================================= +============ Partial average Rand Index = 0.5255529295051357 ====== +============ Value of Adjusted Rand Index = 0.03567460807307738 ================================= +============ Partial average of Adjusted Rand Index = 0.12732459142002361 ================================= +============ Value of Jaccard Index = 0.19827586206896552 ================================= +============ Partial average of Jaccard Index = 0.3677655042467381 ====== +============ Precision = 0.4603174603174603, Recall = 0.453125, F1 = 0.4566929133858268 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 8 ============ +============ average size of the created clusters: 7.875 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 69 : "neptune" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 4, 6, 7, 8, 9, 13, 14, 16, 19, 23, 26, 27, 31, 32, 33, 36, 37, 38, 39, 40, 43, 47, 48, 53, 54, 57, 59, 60, 63, 64] +The cluster 2 contains the snippets: [3, 5, 10, 12, 15, 17, 18, 20, 21, 22, 24, 28, 29, 30, 34, 35, 41, 44, 45, 46, 49, 50, 51, 52, 58, 62] +The cluster 3 contains the snippets: [11, 25, 42, 56, 61] +The cluster 4 contains the snippets: [55] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 3, 11, 55, 2, 5, 25, 4, 10, 42, 6, 12, 56, 7, 15, 61, 8, 17, 9, 18, 13, 20, 14, 21, 16, 22, 19, 24, 23, 28, 26, 29, 27, 30, 31, 34, 32, 35, 33, 41, 36, 44, 37, 45, 38, 46, 39, 49, 40, 50, 43, 51, 47, 52, 48, 58, 53, 62, 54, 57, 59, 60, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "neptune" =============== +============ Value of Rand Index = 0.6840277777777778 ================================= +============ Partial average Rand Index = 0.5278496664366233 ====== +============ Value of Adjusted Rand Index = 0.29947304683664455 ================================= +============ Partial average of Adjusted Rand Index = 0.12981949657098915 ================================= +============ Value of Jaccard Index = 0.3343782654127482 ================================= +============ Partial average of Jaccard Index = 0.3672816312201586 ====== +============ Precision = 0.546875, Recall = 0.546875, F1 = 0.546875 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 16.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 70 : "full moon" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 28, 30, 32, 33, 34, 36, 37, 38, 39, 41, 43, 44, 45, 46, 47, 49, 50, 51, 54, 55, 57, 58, 59, 60, 61, 62, 64] +The cluster 2 contains the snippets: [6, 18, 26, 40, 42, 52, 53, 63] +The cluster 4 contains the snippets: [25, 35, 48, 56] +The cluster 3 contains the snippets: [29, 31] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 6, 29, 25, 2, 18, 31, 35, 3, 26, 48, 4, 40, 56, 5, 42, 7, 52, 8, 53, 9, 63, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 28, 30, 32, 33, 34, 36, 37, 38, 39, 41, 43, 44, 45, 46, 47, 49, 50, 51, 54, 55, 57, 58, 59, 60, 61, 62, 64, 22, 27] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "full moon" =============== +============ Value of Rand Index = 0.5287698412698413 ================================= +============ Partial average Rand Index = 0.5278628117913836 ====== +============ Value of Adjusted Rand Index = 0.08096280087527348 ================================= +============ Partial average of Adjusted Rand Index = 0.12912154377533608 ================================= +============ Value of Jaccard Index = 0.3572395128552097 ================================= +============ Partial average of Jaccard Index = 0.3671381723863736 ====== +============ Precision = 0.5483870967741935, Recall = 0.53125, F1 = 0.5396825396825397 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 15.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 71 : "dsl" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +The cluster 2 contains the snippets: [39, 42, 43, 44, 45] +The cluster 3 contains the snippets: [17, 21, 30] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 39, 17, 2, 42, 21, 3, 43, 30, 4, 44, 5, 45, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 29] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "dsl" =============== +============ Value of Rand Index = 0.5744047619047619 ================================= +============ Partial average Rand Index = 0.5285183322155156 ====== +============ Value of Adjusted Rand Index = 0.26198838792918067 ================================= +============ Partial average of Adjusted Rand Index = 0.1309929077775029 ================================= +============ Value of Jaccard Index = 0.4366382140512147 ================================= +============ Partial average of Jaccard Index = 0.36811704621263897 ====== +============ Precision = 0.6507936507936508, Recall = 0.640625, F1 = 0.6456692913385828 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 21.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 72 : "blood work" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "blood work" =============== +============ Value of Rand Index = 0.31398809523809523 ================================= +============ Partial average Rand Index = 0.5255387455908292 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.12917356183614867 ================================= +============ Value of Jaccard Index = 0.31398809523809523 ================================= +============ Partial average of Jaccard Index = 0.3673652552268814 ====== +============ Precision = 0.4375, Recall = 0.4375, F1 = 0.4375 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 64.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 73 : "medal of honor" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 25, 26, 28, 43, 49] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "medal of honor" =============== +============ Value of Rand Index = 0.4955357142857143 ================================= +============ Partial average Rand Index = 0.525127745161992 ====== +============ Value of Adjusted Rand Index = 0.05100561544998578 ================================= +============ Partial average of Adjusted Rand Index = 0.12810276805003687 ================================= +============ Value of Jaccard Index = 0.4436542669584245 ================================= +============ Partial average of Jaccard Index = 0.368410310182108 ====== +============ Precision = 0.6440677966101694, Recall = 0.59375, F1 = 0.6178861788617885 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 59.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 74 : "the wizard of oz" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 0 snippet clusters: ==================== + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "the wizard of oz" =============== +============ Value of Rand Index = 0.3159722222222222 ================================= +============ Partial average Rand Index = 0.5223013191763194 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.1263716495628742 ================================= +============ Value of Jaccard Index = 0.3159722222222222 ================================= +============ Partial average of Jaccard Index = 0.3677016873718393 ====== +============ Precision = 0.0, Recall = 0.0, F1 = 0.0 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 0 ============ +============ average size of the created clusters: 0.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 75 : "snake" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 5, 6, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 21, 25, 29, 30, 34, 36, 37, 41, 43, 44, 46, 49, 50, 51, 52, 53, 54, 59, 60, 62, 63] +The cluster 2 contains the snippets: [13, 19, 23, 24, 26, 28, 31, 32, 33, 35, 39, 42, 45, 47, 56, 61, 64] +The cluster 3 contains the snippets: [2, 3, 4, 7, 20, 27, 55, 57] +The cluster 4 contains the snippets: [22, 40] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 13, 2, 22, 5, 19, 3, 40, 6, 23, 4, 8, 24, 7, 9, 26, 20, 10, 28, 27, 11, 31, 55, 12, 32, 57, 14, 33, 15, 35, 16, 39, 17, 42, 18, 45, 21, 47, 25, 56, 29, 61, 30, 64, 34, 36, 37, 41, 43, 44, 46, 49, 50, 51, 52, 53, 54, 59, 60, 62, 63, 38, 48, 58] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "snake" =============== +============ Value of Rand Index = 0.6473214285714286 ================================= +============ Partial average Rand Index = 0.5239682539682542 ====== +============ Value of Adjusted Rand Index = 0.16916720572585192 ================================= +============ Partial average of Adjusted Rand Index = 0.12694225697838057 ================================= +============ Value of Jaccard Index = 0.2507903055848261 ================================= +============ Partial average of Jaccard Index = 0.3661428689480124 ====== +============ Precision = 0.5245901639344263, Recall = 0.5, F1 = 0.512 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 15.25 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 76 : "apple" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 7 snippet clusters: ==================== +The cluster 4 contains the snippets: [1, 4, 6, 7, 10, 11, 16, 17, 19, 20, 21, 23, 24, 28, 29, 30, 31, 32, 35, 36, 37, 38, 41, 42, 44, 45, 49, 51, 52, 56, 58, 61, 62, 64] +The cluster 6 contains the snippets: [2, 3, 18, 27, 34, 39, 50, 55, 57, 59, 60] +The cluster 1 contains the snippets: [8, 12, 13, 14, 22, 26, 33, 40, 43, 63] +The cluster 2 contains the snippets: [5, 25, 53] +The cluster 5 contains the snippets: [9] +The cluster 3 contains the snippets: [15] +The cluster 7 contains the snippets: [54] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [8, 5, 15, 1, 9, 2, 54, 12, 25, 4, 3, 13, 53, 6, 18, 14, 7, 27, 22, 10, 34, 26, 11, 39, 33, 16, 50, 40, 17, 55, 43, 19, 57, 63, 20, 59, 21, 60, 23, 24, 28, 29, 30, 31, 32, 35, 36, 37, 38, 41, 42, 44, 45, 49, 51, 52, 56, 58, 61, 62, 64, 46, 47, 48] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "apple" =============== +============ Value of Rand Index = 0.3621031746031746 ================================= +============ Partial average Rand Index = 0.521838450292398 ====== +============ Value of Adjusted Rand Index = 0.031398578355222896 ================================= +============ Partial average of Adjusted Rand Index = 0.12568510331228638 ================================= +============ Value of Jaccard Index = 0.3415258576548899 ================================= +============ Partial average of Jaccard Index = 0.36581896090468186 ====== +============ Precision = 1.0, Recall = 0.953125, F1 = 0.976 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 7 ============ +============ average size of the created clusters: 8.714285714285714 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 77 : "pizza" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 5 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 28, 29, 30, 31, 32, 33, 34, 35, 38, 39, 40, 41, 42, 44, 45, 50, 52, 54, 55, 56, 57, 59, 60, 61, 62, 63, 64] +The cluster 4 contains the snippets: [5, 24, 36, 37, 43, 46, 49, 51, 58] +The cluster 5 contains the snippets: [27, 48] +The cluster 2 contains the snippets: [53] +The cluster 3 contains the snippets: [47] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 53, 47, 5, 27, 2, 24, 48, 3, 36, 4, 37, 6, 43, 7, 46, 8, 49, 9, 51, 10, 58, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 28, 29, 30, 31, 32, 33, 34, 35, 38, 39, 40, 41, 42, 44, 45, 50, 52, 54, 55, 56, 57, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "pizza" =============== +============ Value of Rand Index = 0.626984126984127 ================================= +============ Partial average Rand Index = 0.5232039785611217 ====== +============ Value of Adjusted Rand Index = 0.03140333660451412 ================================= +============ Partial average of Adjusted Rand Index = 0.12446066478361402 ================================= +============ Value of Jaccard Index = 0.6083333333333333 ================================= +============ Partial average of Jaccard Index = 0.3689684982089501 ====== +============ Precision = 0.953125, Recall = 0.953125, F1 = 0.953125 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 5 ============ +============ average size of the created clusters: 12.8 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 78 : "shakira" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "shakira" =============== +============ Value of Rand Index = 0.96875 ================================= +============ Partial average Rand Index = 0.5289161070411073 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.12286501523510615 ================================= +============ Value of Jaccard Index = 0.96875 ================================= +============ Partial average of Jaccard Index = 0.3766580046421687 ====== +============ Precision = 0.984375, Recall = 0.984375, F1 = 0.984375 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 64.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 79 : "zero hour" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 9, 10, 11, 13, 14, 16, 17, 18, 19, 21, 23, 24, 27, 29, 30, 31, 33, 34, 37, 39, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 57, 58, 59, 61, 63, 64] +The cluster 3 contains the snippets: [8, 15, 38, 40, 42] +The cluster 4 contains the snippets: [12, 20, 28, 35, 36] +The cluster 2 contains the snippets: [22, 55, 60] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 22, 8, 12, 2, 55, 15, 20, 3, 60, 38, 28, 4, 40, 35, 5, 42, 36, 6, 7, 9, 10, 11, 13, 14, 16, 17, 18, 19, 21, 23, 24, 27, 29, 30, 31, 33, 34, 37, 39, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 57, 58, 59, 61, 63, 64, 25, 26, 32, 56, 62] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "zero hour" =============== +============ Value of Rand Index = 0.5138888888888888 ================================= +============ Partial average Rand Index = 0.5287258890898133 ====== +============ Value of Adjusted Rand Index = 0.055443363319258296 ================================= +============ Partial average of Adjusted Rand Index = 0.12201157660325998 ================================= +============ Value of Jaccard Index = 0.234375 ================================= +============ Partial average of Jaccard Index = 0.3748569539504957 ====== +============ Precision = 0.5254237288135594, Recall = 0.484375, F1 = 0.5040650406504066 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 14.75 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 80 : "soldier of fortune" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 2 contains the snippets: [2, 4, 10, 14, 16, 26, 28, 43, 44, 46, 47, 52, 54, 56, 60, 61, 62] +The cluster 1 contains the snippets: [1, 8, 12, 13, 17, 18, 20, 27, 31, 32, 36, 37, 57, 64] +The cluster 4 contains the snippets: [5, 6, 23, 33, 35, 48, 51, 58, 59] +The cluster 3 contains the snippets: [15, 24, 30, 34, 38, 45, 50, 55] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 15, 5, 8, 4, 24, 6, 12, 10, 30, 23, 13, 14, 34, 33, 17, 16, 38, 35, 18, 26, 45, 48, 20, 28, 50, 51, 27, 43, 55, 58, 31, 44, 59, 32, 46, 36, 47, 37, 52, 57, 54, 64, 56, 60, 61, 62, 3, 7, 9, 11, 19, 21, 22, 25, 29, 39, 40, 41, 42, 49, 53, 63] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "soldier of fortune" =============== +============ Value of Rand Index = 0.7673611111111112 ================================= +============ Partial average Rand Index = 0.5317088293650796 ====== +============ Value of Adjusted Rand Index = 0.1767975426792319 ================================= +============ Partial average of Adjusted Rand Index = 0.12269640117920963 ================================= +============ Value of Jaccard Index = 0.18292682926829268 ================================= +============ Partial average of Jaccard Index = 0.3724578273919681 ====== +============ Precision = 0.5, Recall = 0.375, F1 = 0.42857142857142855 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 12.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 81 : "hedonism" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 30, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 44, 46, 47, 49, 50, 51, 52, 55, 56, 58, 59, 61, 62, 63, 64] +The cluster 2 contains the snippets: [9, 29, 36, 53, 54, 57] +The cluster 3 contains the snippets: [22, 31] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 9, 22, 2, 29, 31, 3, 36, 4, 53, 5, 54, 6, 57, 7, 8, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 30, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 44, 46, 47, 49, 50, 51, 52, 55, 56, 58, 59, 61, 62, 63, 64, 16, 45, 48, 60] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "hedonism" =============== +============ Value of Rand Index = 0.5466269841269841 ================================= +============ Partial average Rand Index = 0.5318930041152266 ====== +============ Value of Adjusted Rand Index = 0.18685570649871494 ================================= +============ Partial average of Adjusted Rand Index = 0.12348849136833934 ================================= +============ Value of Jaccard Index = 0.3752563226247437 ================================= +============ Partial average of Jaccard Index = 0.3724923767158295 ====== +============ Precision = 0.5833333333333334, Recall = 0.546875, F1 = 0.564516129032258 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 20.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 82 : "steam" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 6 snippet clusters: ==================== +The cluster 4 contains the snippets: [1, 2, 3, 5, 6, 7, 9, 10, 11, 14, 17, 18, 23, 26, 27, 28, 30, 31, 32, 33, 35, 37, 40, 41, 43, 45, 49, 54, 56, 58, 59, 60, 61, 62] +The cluster 2 contains the snippets: [4, 16, 20, 21, 22, 25, 42, 44, 48, 52, 53, 57, 64] +The cluster 1 contains the snippets: [12, 13, 15, 19, 24, 34, 38, 51, 63] +The cluster 3 contains the snippets: [8, 29, 36, 47, 50] +The cluster 5 contains the snippets: [55] +The cluster 6 contains the snippets: [39] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [12, 4, 8, 1, 55, 39, 13, 16, 29, 2, 15, 20, 36, 3, 19, 21, 47, 5, 24, 22, 50, 6, 34, 25, 7, 38, 42, 9, 51, 44, 10, 63, 48, 11, 52, 14, 53, 17, 57, 18, 64, 23, 26, 27, 28, 30, 31, 32, 33, 35, 37, 40, 41, 43, 45, 49, 54, 56, 58, 59, 60, 61, 62, 46] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "steam" =============== +============ Value of Rand Index = 0.5892857142857143 ================================= +============ Partial average Rand Index = 0.5325929152148666 ====== +============ Value of Adjusted Rand Index = 0.21903822635263165 ================================= +============ Partial average of Adjusted Rand Index = 0.12465373203887949 ================================= +============ Value of Jaccard Index = 0.3830104321907601 ================================= +============ Partial average of Jaccard Index = 0.37262064568503594 ====== +============ Precision = 0.7777777777777778, Recall = 0.765625, F1 = 0.7716535433070867 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 6 ============ +============ average size of the created clusters: 10.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 83 : "jurassic park" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +The cluster 2 contains the snippets: [18, 46] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 18, 2, 46, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 11, 22, 31, 33] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "jurassic park" =============== +============ Value of Rand Index = 0.43154761904761907 ================================= +============ Partial average Rand Index = 0.5313755020080324 ====== +============ Value of Adjusted Rand Index = 0.057781025898689116 ================================= +============ Partial average of Adjusted Rand Index = 0.12384803678417841 ================================= +============ Value of Jaccard Index = 0.3436426116838488 ================================= +============ Partial average of Jaccard Index = 0.3722715127452626 ====== +============ Precision = 0.5833333333333334, Recall = 0.546875, F1 = 0.564516129032258 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 30.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 84 : "match point" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [5, 6, 7, 9, 10, 11, 14, 15, 16, 19, 20, 21, 24, 25, 27, 29, 30, 31, 34, 35, 36, 37, 38, 39, 46, 49, 51, 52, 54, 56, 57, 59, 61, 62, 63] +The cluster 2 contains the snippets: [1, 2, 3, 4, 22, 23, 26, 40, 42, 43, 47, 50, 55] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [5, 1, 6, 2, 7, 3, 9, 4, 10, 22, 11, 23, 14, 26, 15, 40, 16, 42, 19, 43, 20, 47, 21, 50, 24, 55, 25, 27, 29, 30, 31, 34, 35, 36, 37, 38, 39, 46, 49, 51, 52, 54, 56, 57, 59, 61, 62, 63, 8, 12, 13, 17, 18, 28, 32, 33, 41, 44, 45, 48, 53, 58, 60, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "match point" =============== +============ Value of Rand Index = 0.5228174603174603 ================================= +============ Partial average Rand Index = 0.5312736205593351 ====== +============ Value of Adjusted Rand Index = 0.01542610385535829 ================================= +============ Partial average of Adjusted Rand Index = 0.12255729948740673 ================================= +============ Value of Jaccard Index = 0.26508785332314744 ================================= +============ Partial average of Jaccard Index = 0.3709955167997613 ====== +============ Precision = 0.5833333333333334, Recall = 0.4375, F1 = 0.5 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 24.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 85 : "equinox" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 7 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 6, 7, 9, 10, 12, 20, 21, 22, 23, 24, 26, 27, 29, 30, 33, 35, 38, 39, 40, 45, 46, 49, 55, 61, 64] +The cluster 3 contains the snippets: [1, 11, 15, 25, 28, 37, 47, 50, 51, 53, 57, 58, 60, 62, 63] +The cluster 6 contains the snippets: [4, 17, 18, 31, 32, 34, 43, 52, 56] +The cluster 7 contains the snippets: [5, 14, 19, 42, 59] +The cluster 5 contains the snippets: [8, 48, 54] +The cluster 4 contains the snippets: [3, 13, 36] +The cluster 2 contains the snippets: [44] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 44, 1, 3, 8, 4, 5, 6, 11, 13, 48, 17, 14, 7, 15, 36, 54, 18, 19, 9, 25, 31, 42, 10, 28, 32, 59, 12, 37, 34, 20, 47, 43, 21, 50, 52, 22, 51, 56, 23, 53, 24, 57, 26, 58, 27, 60, 29, 62, 30, 63, 33, 35, 38, 39, 40, 45, 46, 49, 55, 61, 64, 16, 41] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "equinox" =============== +============ Value of Rand Index = 0.7242063492063492 ================================= +============ Partial average Rand Index = 0.533543417366947 ====== +============ Value of Adjusted Rand Index = 0.16230892369503122 ================================= +============ Partial average of Adjusted Rand Index = 0.12302496565455526 ================================= +============ Value of Jaccard Index = 0.1976911976911977 ================================= +============ Partial average of Jaccard Index = 0.36895664245730764 ====== +============ Precision = 0.532258064516129, Recall = 0.515625, F1 = 0.5238095238095237 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 7 ============ +============ average size of the created clusters: 8.857142857142858 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 86 : "veracruz" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "veracruz" =============== +============ Value of Rand Index = 0.25992063492063494 ================================= +============ Partial average Rand Index = 0.5303617571059434 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.12159444279810694 ================================= +============ Value of Jaccard Index = 0.25992063492063494 ================================= +============ Partial average of Jaccard Index = 0.36768878190455556 ====== +============ Precision = 0.40625, Recall = 0.40625, F1 = 0.40625 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 64.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 87 : "heaven and hell" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 2 contains the snippets: [1, 2, 4, 5, 7, 10, 12, 14, 17, 21, 25, 28, 35, 36, 37, 40, 41, 42, 43, 45, 48, 50, 51, 53, 55, 56, 59, 64] +The cluster 1 contains the snippets: [3, 6, 8, 11, 13, 15, 16, 18, 19, 20, 23, 24, 27, 29, 32, 33, 34, 44, 46, 49, 52, 54, 57, 58, 60, 61, 63] +The cluster 3 contains the snippets: [9, 26, 30, 31, 38, 39, 47] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 1, 9, 6, 2, 26, 8, 4, 30, 11, 5, 31, 13, 7, 38, 15, 10, 39, 16, 12, 47, 18, 14, 19, 17, 20, 21, 23, 25, 24, 28, 27, 35, 29, 36, 32, 37, 33, 40, 34, 41, 44, 42, 46, 43, 49, 45, 52, 48, 54, 50, 57, 51, 58, 53, 60, 55, 61, 56, 63, 59, 64, 22, 62] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "heaven and hell" =============== +============ Value of Rand Index = 0.6507936507936508 ================================= +============ Partial average Rand Index = 0.531746031746032 ====== +============ Value of Adjusted Rand Index = 0.15001814634216457 ================================= +============ Partial average of Adjusted Rand Index = 0.12192115203424553 ================================= +============ Value of Jaccard Index = 0.19908987485779295 ================================= +============ Partial average of Jaccard Index = 0.36575086343275376 ====== +============ Precision = 0.41935483870967744, Recall = 0.40625, F1 = 0.4126984126984127 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 20.666666666666668 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 88 : "billy the kid" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [3, 4, 5, 6, 7, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 25, 26, 27, 29, 30, 31, 32, 33, 36, 37, 38, 40, 41, 43, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 58, 59, 60, 61, 62, 63, 64] +The cluster 2 contains the snippets: [1, 2, 8, 10, 21, 24, 35, 39, 42, 44, 49, 57] +The cluster 3 contains the snippets: [28] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 1, 28, 4, 2, 5, 8, 6, 10, 7, 21, 11, 24, 12, 35, 13, 39, 14, 42, 15, 44, 16, 49, 17, 57, 18, 19, 20, 22, 25, 26, 27, 29, 30, 31, 32, 33, 36, 37, 38, 40, 41, 43, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 58, 59, 60, 61, 62, 63, 64, 9, 23, 34] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "billy the kid" =============== +============ Value of Rand Index = 0.43452380952380953 ================================= +============ Partial average Rand Index = 0.530641233766234 ====== +============ Value of Adjusted Rand Index = -0.07136563876651983 ================================= +============ Partial average of Adjusted Rand Index = 0.11972471122969136 ================================= +============ Value of Jaccard Index = 0.25147734734077476 ================================= +============ Partial average of Jaccard Index = 0.3644523007498904 ====== +============ Precision = 0.45901639344262296, Recall = 0.4375, F1 = 0.44799999999999995 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 20.333333333333332 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 89 : "dog eat dog" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 6, 7, 9, 10, 14, 18, 22, 27, 28, 32, 37, 38, 39, 42, 43, 44, 45, 49, 50, 53, 58, 59, 60, 61, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 6, 7, 9, 10, 14, 18, 22, 27, 28, 32, 37, 38, 39, 42, 43, 44, 45, 49, 50, 53, 58, 59, 60, 61, 63, 64, 2, 3, 4, 5, 8, 11, 12, 13, 15, 16, 17, 19, 20, 21, 23, 24, 25, 26, 29, 30, 31, 33, 34, 35, 36, 40, 41, 46, 47, 48, 51, 52, 54, 55, 56, 57, 62] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "dog eat dog" =============== +============ Value of Rand Index = 0.5381944444444444 ================================= +============ Partial average Rand Index = 0.5307261013019442 ====== +============ Value of Adjusted Rand Index = 0.08233886014010632 ================================= +============ Partial average of Adjusted Rand Index = 0.11930464548711177 ================================= +============ Value of Jaccard Index = 0.16276978417266186 ================================= +============ Partial average of Jaccard Index = 0.36218620505801136 ====== +============ Precision = 0.2962962962962963, Recall = 0.125, F1 = 0.1758241758241758 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 27.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 90 : "polaroid" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 2 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63] +The cluster 2 contains the snippets: [46, 50, 59] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 46, 2, 50, 3, 59, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "polaroid" =============== +============ Value of Rand Index = 0.33382936507936506 ================================= +============ Partial average Rand Index = 0.5285383597883601 ====== +============ Value of Adjusted Rand Index = 0.030987076907219142 ================================= +============ Partial average of Adjusted Rand Index = 0.11832333916955741 ================================= +============ Value of Jaccard Index = 0.2592388306674021 ================================= +============ Partial average of Jaccard Index = 0.3610423453425602 ====== +============ Precision = 0.3968253968253968, Recall = 0.390625, F1 = 0.3937007874015748 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 2 ============ +============ average size of the created clusters: 31.5 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 91 : "beauty and the beast" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 27, 30, 31, 32, 49, 50] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "beauty and the beast" =============== +============ Value of Rand Index = 0.30158730158730157 ================================= +============ Partial average Rand Index = 0.5260443921158209 ====== +============ Value of Adjusted Rand Index = 0.003286646104060249 ================================= +============ Partial average of Adjusted Rand Index = 0.11705919968532118 ================================= +============ Value of Jaccard Index = 0.18753606462781305 ================================= +============ Partial average of Jaccard Index = 0.35913568291712344 ====== +============ Precision = 0.29310344827586204, Recall = 0.265625, F1 = 0.2786885245901639 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 58.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 92 : "iron man" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 5 snippet clusters: ==================== +The cluster 2 contains the snippets: [2, 3, 4, 5, 6, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 22, 23, 25, 26, 27, 28, 31, 32, 33, 34, 37, 38, 39, 40, 41, 43, 44, 46, 47, 48, 49, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63] +The cluster 4 contains the snippets: [1, 18, 21, 24, 29, 45, 50, 51, 52, 64] +The cluster 1 contains the snippets: [30, 42] +The cluster 3 contains the snippets: [36] +The cluster 5 contains the snippets: [35] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [30, 2, 36, 1, 35, 42, 3, 18, 4, 21, 5, 24, 6, 29, 8, 45, 9, 50, 10, 51, 11, 52, 12, 64, 13, 14, 15, 16, 17, 19, 20, 22, 23, 25, 26, 27, 28, 31, 32, 33, 34, 37, 38, 39, 40, 41, 43, 44, 46, 47, 48, 49, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 7] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "iron man" =============== +============ Value of Rand Index = 0.48214285714285715 ================================= +============ Partial average Rand Index = 0.5255672015182887 ====== +============ Value of Adjusted Rand Index = 0.07703318060944547 ================================= +============ Partial average of Adjusted Rand Index = 0.11662413426058339 ================================= +============ Value of Jaccard Index = 0.22494432071269488 ================================= +============ Partial average of Jaccard Index = 0.3576770811540318 ====== +============ Precision = 0.4603174603174603, Recall = 0.453125, F1 = 0.4566929133858268 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 5 ============ +============ average size of the created clusters: 12.6 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 93 : "independence day" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [3, 4, 5, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 30, 31, 33, 35, 37, 38, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 54, 56, 57, 58, 60, 61, 62, 63, 64] +The cluster 3 contains the snippets: [1, 2, 6, 9, 21, 24, 27, 32, 34, 36, 42, 47, 53, 55] +The cluster 2 contains the snippets: [59] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [3, 59, 1, 4, 2, 5, 6, 7, 9, 8, 21, 10, 24, 11, 27, 12, 32, 13, 34, 14, 36, 15, 42, 16, 47, 17, 53, 18, 55, 19, 20, 22, 23, 30, 31, 33, 35, 37, 38, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 54, 56, 57, 58, 60, 61, 62, 63, 64, 25, 26, 28, 29] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "independence day" =============== +============ Value of Rand Index = 0.6041666666666666 ================================= +============ Partial average Rand Index = 0.5264123570575185 ====== +============ Value of Adjusted Rand Index = 0.23400243592832393 ================================= +============ Partial average of Adjusted Rand Index = 0.11788626653658062 ================================= +============ Value of Jaccard Index = 0.3517465475223396 ================================= +============ Partial average of Jaccard Index = 0.3576133119751964 ====== +============ Precision = 0.6333333333333333, Recall = 0.59375, F1 = 0.6129032258064516 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 20.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 94 : "aurora borealis" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 34, 35, 36, 38, 39, 41, 42, 43, 45, 46, 47, 49, 52, 53, 54, 55, 56, 57, 58, 60, 61, 63] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 34, 35, 36, 38, 39, 41, 42, 43, 45, 46, 47, 49, 52, 53, 54, 55, 56, 57, 58, 60, 61, 63, 5, 12, 20, 25, 32, 33, 37, 40, 44, 48, 50, 51, 59, 62, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "aurora borealis" =============== +============ Value of Rand Index = 0.6200396825396826 ================================= +============ Partial average Rand Index = 0.5274083924349884 ====== +============ Value of Adjusted Rand Index = 0.2184504198108195 ================================= +============ Partial average of Adjusted Rand Index = 0.11895609795439167 ================================= +============ Value of Jaccard Index = 0.5148828372387587 ================================= +============ Partial average of Jaccard Index = 0.3592863920311917 ====== +============ Precision = 0.7959183673469388, Recall = 0.609375, F1 = 0.6902654867256638 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 49.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 95 : "trojan horse" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 2 contains the snippets: [1, 3, 4, 5, 8, 11, 12, 13, 18, 20, 22, 23, 27, 29, 32, 33, 35, 36, 37, 38, 39, 40, 43, 46, 47, 54, 63] +The cluster 1 contains the snippets: [2, 6, 7, 9, 10, 14, 15, 16, 19, 28, 34, 44, 45, 48, 49, 51, 52, 53, 55, 56, 61, 62] +The cluster 3 contains the snippets: [25, 26, 57, 58, 59, 60] +The cluster 4 contains the snippets: [21, 24, 31, 41, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 1, 25, 21, 6, 3, 26, 24, 7, 4, 57, 31, 9, 5, 58, 41, 10, 8, 59, 64, 14, 11, 60, 15, 12, 16, 13, 19, 18, 28, 20, 34, 22, 44, 23, 45, 27, 48, 29, 49, 32, 51, 33, 52, 35, 53, 36, 55, 37, 56, 38, 61, 39, 62, 40, 43, 46, 47, 54, 63, 17, 30, 42, 50] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "trojan horse" =============== +============ Value of Rand Index = 0.6056547619047619 ================================= +============ Partial average Rand Index = 0.528232038429407 ====== +============ Value of Adjusted Rand Index = 0.10796857363578276 ================================= +============ Partial average of Adjusted Rand Index = 0.11884043980366947 ================================= +============ Value of Jaccard Index = 0.24929178470254956 ================================= +============ Partial average of Jaccard Index = 0.3581285540593113 ====== +============ Precision = 0.5333333333333333, Recall = 0.5, F1 = 0.5161290322580646 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 15.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 96 : "hud" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 3 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 7, 8, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63] +The cluster 2 contains the snippets: [6, 9, 32] +The cluster 3 contains the snippets: [10, 11, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 6, 10, 2, 9, 11, 3, 32, 64, 4, 5, 7, 8, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 43, 44] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "hud" =============== +============ Value of Rand Index = 0.9146825396825397 ================================= +============ Partial average Rand Index = 0.5322575644841271 ====== +============ Value of Adjusted Rand Index = 0.751437603492398 ================================= +============ Partial average of Adjusted Rand Index = 0.12542999359209372 ================================= +============ Value of Jaccard Index = 0.8963230861965039 ================================= +============ Partial average of Jaccard Index = 0.36373474710240705 ====== +============ Precision = 0.9354838709677419, Recall = 0.90625, F1 = 0.9206349206349206 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 3 ============ +============ average size of the created clusters: 20.666666666666668 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 97 : "virgo" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "virgo" =============== +============ Value of Rand Index = 0.3005952380952381 ================================= +============ Partial average Rand Index = 0.529869293078056 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.12413690087464946 ================================= +============ Value of Jaccard Index = 0.3005952380952381 ================================= +============ Partial average of Jaccard Index = 0.3630838243291373 ====== +============ Precision = 0.4375, Recall = 0.4375, F1 = 0.4375 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 64.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 98 : "pods" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 4 snippet clusters: ==================== +The cluster 1 contains the snippets: [2, 3, 4, 5, 6, 7, 10, 12, 13, 14, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 52, 53, 54, 56, 57, 58, 59, 60, 61, 62, 63, 64] +The cluster 3 contains the snippets: [1, 21, 32, 55] +The cluster 4 contains the snippets: [8, 9, 15] +The cluster 2 contains the snippets: [11] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [2, 11, 1, 8, 3, 21, 9, 4, 32, 15, 5, 55, 6, 7, 10, 12, 13, 14, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 52, 53, 54, 56, 57, 58, 59, 60, 61, 62, 63, 64, 45, 46, 47, 48, 49, 50, 51] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "pods" =============== +============ Value of Rand Index = 0.5877976190476191 ================================= +============ Partial average Rand Index = 0.5304603984450924 ====== +============ Value of Adjusted Rand Index = 0.16303663603172605 ================================= +============ Partial average of Adjusted Rand Index = 0.12453383694768086 ================================= +============ Value of Jaccard Index = 0.4676489429852659 ================================= +============ Partial average of Jaccard Index = 0.3641508153358325 ====== +============ Precision = 0.7894736842105263, Recall = 0.703125, F1 = 0.743801652892562 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 4 ============ +============ average size of the created clusters: 14.25 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 99 : "arch of triumph" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 1 snippet clusters: ==================== +The cluster 1 contains the snippets: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "arch of triumph" =============== +============ Value of Rand Index = 0.12748015873015872 ================================= +============ Partial average Rand Index = 0.5263898909732243 ====== +============ Value of Adjusted Rand Index = 0.0 ================================= +============ Partial average of Adjusted Rand Index = 0.12327591940275479 ================================= +============ Value of Jaccard Index = 0.12748015873015872 ================================= +============ Partial average of Jaccard Index = 0.36176020264284586 ====== +============ Precision = 0.203125, Recall = 0.203125, F1 = 0.203125 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 1 ============ +============ average size of the created clusters: 64.0 ============ +=========================================================================== + +[ WARN ] WSIEvaluator - +============= Query 100 : "apartment" ============== + +[ INFO ] WSIEvaluator - +============== Cluster creation phase ================== + +[ WARN ] WSIEvaluator - ClusteredSnippets: + +================== 5 snippet clusters: ==================== +The cluster 2 contains the snippets: [2, 3, 4, 6, 8, 10, 13, 15, 16, 17, 18, 19, 21, 22, 24, 25, 26, 29, 30, 33, 37, 38, 39, 40, 43, 45, 46, 47, 49, 54, 55, 56] +The cluster 1 contains the snippets: [1, 11, 12, 20, 31, 32, 34, 35, 36, 41, 42, 44, 48, 50, 51, 58, 61] +The cluster 4 contains the snippets: [5, 7, 9, 23, 27, 28, 52, 53, 57, 59, 63, 64] +The cluster 3 contains the snippets: [60, 62] +The cluster 5 contains the snippets: [14] + +[ INFO ] WSIEvaluator - +================== Starting Evaluation ================== +Resulting list: [1, 2, 60, 5, 14, 11, 3, 62, 7, 12, 4, 9, 20, 6, 23, 31, 8, 27, 32, 10, 28, 34, 13, 52, 35, 15, 53, 36, 16, 57, 41, 17, 59, 42, 18, 63, 44, 19, 64, 48, 21, 50, 22, 51, 24, 58, 25, 61, 26, 29, 30, 33, 37, 38, 39, 40, 43, 45, 46, 47, 49, 54, 55, 56] +[ WARN ] WSIEvaluator - +================ Results of Rand Index for the topic "apartment" =============== +============ Value of Rand Index = 0.4399801587301587 ================================= +============ Partial average Rand Index = 0.5255257936507937 ====== +============ Value of Adjusted Rand Index = 0.025218548764255073 ================================= +============ Partial average of Adjusted Rand Index = 0.12229534569636978 ================================= +============ Value of Jaccard Index = 0.3211064341551413 ================================= +============ Partial average of Jaccard Index = 0.3613536649579688 ====== +============ Precision = 0.875, Recall = 0.875, F1 = 0.875 ============ + +[ WARN ] WSIEvaluator - +================ Statistics: ==================================== +============ number of created clusters: 5 ============ +============ average size of the created clusters: 12.8 ============ +=========================================================================== + +[ INFO ] WSIEvaluator - + +=========== Final average value of S-recall@K: ============= +1 0.1807 +2 0.2896 +3 0.3427 +4 0.3845 +5 0.4302 +6 0.4635 +7 0.4854 +8 0.5159 +9 0.5457 +10 0.5642 +11 0.5937 +12 0.6083 +13 0.6206 +14 0.6431 +15 0.6571 +16 0.6788 +17 0.6914 +18 0.7026 +19 0.7081 +20 0.7214 +21 0.7358 +22 0.7525 +23 0.7562 +24 0.7678 +25 0.7728 +26 0.7826 +27 0.7896 +28 0.7936 +29 0.7977 +30 0.8039 +31 0.8083 +32 0.8103 +33 0.8150 +34 0.8227 +35 0.8294 +36 0.8375 +37 0.8507 +38 0.8570 +39 0.8623 +40 0.8715 +41 0.8757 +42 0.8782 +43 0.8866 +44 0.8921 +45 0.8982 +46 0.9026 +47 0.9111 +48 0.9161 +49 0.9216 +50 0.9291 +51 0.9348 +52 0.9461 +53 0.9497 +54 0.9570 +55 0.9646 +56 0.9713 +57 0.9759 +58 0.9791 +59 0.9823 +60 0.9855 +61 0.9867 +62 0.9943 +63 0.9948 +64 1.0000 +65 0.0000 +66 0.0000 +67 0.0000 +68 0.0000 +69 0.0000 +70 0.0000 +71 0.0000 +72 0.0000 +73 0.0000 +74 0.0000 +75 0.0000 +76 0.0000 +77 0.0000 +78 0.0000 +79 0.0000 +80 0.0000 +81 0.0000 +82 0.0000 +83 0.0000 +84 0.0000 +85 0.0000 +86 0.0000 +87 0.0000 +88 0.0000 +89 0.0000 +90 0.0000 +91 0.0000 +92 0.0000 +93 0.0000 +94 0.0000 +95 0.0000 +96 0.0000 +97 0.0000 +98 0.0000 +99 0.0000 +100 0.0000 + +=========== Final average value of S-precision@r: ============= +0.4000 0.4380 +0.4500 0.4541 +0.5000 0.4312 +0.5500 0.4013 +0.6000 0.3257 +0.6500 0.3149 +0.7000 0.2804 +0.7500 0.2526 +0.8000 0.2452 +0.8500 0.2316 +0.9000 0.2096 +0.9500 0.2056 +1.0000 0.1493 + +=========== Final average value of F1: ===================== +average F1 = 0.5512548014934152 + +=========== Final average value of Rand Index: ============= +average Rand Index = 0.5255257936507937 + +=========== Final average value of Adjusted Rand Index: ==== +average Adj Rand Index = 0.12229534569636978 + +=========== Final average value of Jaccard Index: ========== +average Jaccard Index = 0.3613536649579688 + +================ Statistics: ==================================== +============ average number of created clusters: 2.94 +============ average cluster size: 29.503013392857145 + +[ WARN ] WSIEvaluator - Simulation started at: 11:45 and completed at 11:45 +Execution time: 1.502 sec -- GitLab