From bffb5a6c064c49a87f83435368a4f8f891b4e46e Mon Sep 17 00:00:00 2001 From: Yuren Hao Date: Tue, 24 Feb 2026 08:53:02 +0000 Subject: Add edge connectivity analysis, use official network_evaluation scripts - Switch accuracy computation to official network_evaluation scripts (clustering_accuracy with graph-tool NMI/AMI and sklearn ARI) - Add minimum edge cut / log10(n) and well-connectedness stats - Add edge connectivity boxplots and well-connected fraction bar chart - Add "What I Learned and Open Questions" section to discussion - Fix author name and minor LaTeX issues --- .../polblogs/ground_truth/cluster_details.json | 280 +++++++++++++++------ 1 file changed, 210 insertions(+), 70 deletions(-) (limited to 'results/stats/polblogs/ground_truth/cluster_details.json') diff --git a/results/stats/polblogs/ground_truth/cluster_details.json b/results/stats/polblogs/ground_truth/cluster_details.json index b2f1602..24634ad 100644 --- a/results/stats/polblogs/ground_truth/cluster_details.json +++ b/results/stats/polblogs/ground_truth/cluster_details.json @@ -6,7 +6,9 @@ "c_boundary": 2008, "edge_density": 0.44565217391304346, "degree_density": 5.125, - "conductance": 0.8908606921029282 + "conductance": 0.8908606921029282, + "mincut": 4, + "mincut_over_log10n": 2.8981071006490158 }, { "com_id": "1", @@ -15,7 +17,9 @@ "c_boundary": 976, "edge_density": 0.41025641025641024, "degree_density": 2.4615384615384617, - "conductance": 0.9384615384615385 + "conductance": 0.9384615384615385, + "mincut": 2, + "mincut_over_log10n": 1.7954234350052463 }, { "com_id": "10", @@ -24,7 +28,9 @@ "c_boundary": 2, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.5 + "conductance": 0.5, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "11", @@ -33,7 +39,9 @@ "c_boundary": 6, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.75 + "conductance": 0.75, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "12", @@ -42,7 +50,9 @@ "c_boundary": 6, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.75 + "conductance": 0.75, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "13", @@ -51,7 +61,9 @@ "c_boundary": 3, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.6 + "conductance": 0.6, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "14", @@ -60,7 +72,9 @@ "c_boundary": 7, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.7777777777777778 + "conductance": 0.7777777777777778, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "15", @@ -69,7 +83,9 @@ "c_boundary": 13, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.8666666666666667 + "conductance": 0.8666666666666667, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "16", @@ -78,7 +94,9 @@ "c_boundary": 13, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.8666666666666667 + "conductance": 0.8666666666666667, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "17", @@ -87,7 +105,9 @@ "c_boundary": 17, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.8947368421052632 + "conductance": 0.8947368421052632, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "18", @@ -96,7 +116,9 @@ "c_boundary": 13, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.8666666666666667 + "conductance": 0.8666666666666667, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "19", @@ -105,7 +127,9 @@ "c_boundary": 12, "edge_density": 0.6666666666666666, "degree_density": 0.6666666666666666, - "conductance": 0.75 + "conductance": 0.75, + "mincut": 1, + "mincut_over_log10n": 2.095903274289385 }, { "com_id": "2", @@ -114,7 +138,9 @@ "c_boundary": 8, "edge_density": 0.6666666666666666, "degree_density": 0.6666666666666666, - "conductance": 0.6666666666666666 + "conductance": 0.6666666666666666, + "mincut": 1, + "mincut_over_log10n": 2.095903274289385 }, { "com_id": "20", @@ -123,7 +149,9 @@ "c_boundary": 37, "edge_density": 0.6666666666666666, "degree_density": 0.6666666666666666, - "conductance": 0.9024390243902439 + "conductance": 0.9024390243902439, + "mincut": 1, + "mincut_over_log10n": 2.095903274289385 }, { "com_id": "21", @@ -132,7 +160,9 @@ "c_boundary": 1, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.3333333333333333 + "conductance": 0.3333333333333333, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "22", @@ -141,7 +171,9 @@ "c_boundary": 0, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.0 + "conductance": 0.0, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "23", @@ -150,7 +182,9 @@ "c_boundary": 3, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.6 + "conductance": 0.6, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "24", @@ -159,7 +193,9 @@ "c_boundary": 14, "edge_density": 0.4, "degree_density": 0.8, - "conductance": 0.6363636363636364 + "conductance": 0.6363636363636364, + "mincut": 1, + "mincut_over_log10n": 1.430676558073393 }, { "com_id": "25", @@ -168,7 +204,9 @@ "c_boundary": 3, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.6 + "conductance": 0.6, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "26", @@ -177,7 +215,9 @@ "c_boundary": 47, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.9591836734693877 + "conductance": 0.9591836734693877, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "27", @@ -186,7 +226,9 @@ "c_boundary": 17, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.8947368421052632 + "conductance": 0.8947368421052632, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "28", @@ -195,7 +237,9 @@ "c_boundary": 13, "edge_density": 0.5, "degree_density": 0.75, - "conductance": 0.6842105263157895 + "conductance": 0.6842105263157895, + "mincut": 1, + "mincut_over_log10n": 1.660964047443681 }, { "com_id": "29", @@ -204,7 +248,9 @@ "c_boundary": 7, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.7777777777777778 + "conductance": 0.7777777777777778, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "3", @@ -213,7 +259,9 @@ "c_boundary": 164, "edge_density": 0.6666666666666666, "degree_density": 0.6666666666666666, - "conductance": 0.9761904761904762 + "conductance": 0.9761904761904762, + "mincut": 1, + "mincut_over_log10n": 2.095903274289385 }, { "com_id": "30", @@ -222,7 +270,9 @@ "c_boundary": 29, "edge_density": 0.6666666666666666, "degree_density": 0.6666666666666666, - "conductance": 0.8787878787878788 + "conductance": 0.8787878787878788, + "mincut": 1, + "mincut_over_log10n": 2.095903274289385 }, { "com_id": "31", @@ -231,7 +281,9 @@ "c_boundary": 10, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.8333333333333334 + "conductance": 0.8333333333333334, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "32", @@ -240,7 +292,9 @@ "c_boundary": 1, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.3333333333333333 + "conductance": 0.3333333333333333, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "33", @@ -249,7 +303,9 @@ "c_boundary": 5, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.7142857142857143 + "conductance": 0.7142857142857143, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "34", @@ -258,7 +314,9 @@ "c_boundary": 2, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.5 + "conductance": 0.5, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "35", @@ -267,7 +325,9 @@ "c_boundary": 10, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.8333333333333334 + "conductance": 0.8333333333333334, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "36", @@ -276,7 +336,9 @@ "c_boundary": 11, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.8461538461538461 + "conductance": 0.8461538461538461, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "37", @@ -285,7 +347,9 @@ "c_boundary": 93, "edge_density": 0.5, "degree_density": 0.75, - "conductance": 0.9393939393939394 + "conductance": 0.9393939393939394, + "mincut": 1, + "mincut_over_log10n": 1.660964047443681 }, { "com_id": "38", @@ -294,7 +358,9 @@ "c_boundary": 3, "edge_density": 0.6666666666666666, "degree_density": 0.6666666666666666, - "conductance": 0.42857142857142855 + "conductance": 0.42857142857142855, + "mincut": 1, + "mincut_over_log10n": 2.095903274289385 }, { "com_id": "39", @@ -303,7 +369,9 @@ "c_boundary": 71, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.9726027397260274 + "conductance": 0.9726027397260274, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "4", @@ -312,7 +380,9 @@ "c_boundary": 384, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.9948186528497409 + "conductance": 0.9948186528497409, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "40", @@ -321,7 +391,9 @@ "c_boundary": 22, "edge_density": 0.5, "degree_density": 0.75, - "conductance": 0.7857142857142857 + "conductance": 0.7857142857142857, + "mincut": 1, + "mincut_over_log10n": 1.660964047443681 }, { "com_id": "41", @@ -330,7 +402,9 @@ "c_boundary": 31, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.9393939393939394 + "conductance": 0.9393939393939394, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "42", @@ -339,7 +413,9 @@ "c_boundary": 18, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.9 + "conductance": 0.9, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "43", @@ -348,7 +424,9 @@ "c_boundary": 11, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.8461538461538461 + "conductance": 0.8461538461538461, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "44", @@ -357,7 +435,9 @@ "c_boundary": 69, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.971830985915493 + "conductance": 0.971830985915493, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "45", @@ -366,7 +446,9 @@ "c_boundary": 48, "edge_density": 0.6666666666666666, "degree_density": 0.6666666666666666, - "conductance": 0.9230769230769231 + "conductance": 0.9230769230769231, + "mincut": 1, + "mincut_over_log10n": 2.095903274289385 }, { "com_id": "46", @@ -375,7 +457,9 @@ "c_boundary": 69, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.971830985915493 + "conductance": 0.971830985915493, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "47", @@ -384,7 +468,9 @@ "c_boundary": 11, "edge_density": 1.0, "degree_density": 1.0, - "conductance": 0.6470588235294118 + "conductance": 0.6470588235294118, + "mincut": 2, + "mincut_over_log10n": 4.19180654857877 }, { "com_id": "48", @@ -393,7 +479,9 @@ "c_boundary": 12, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.8571428571428571 + "conductance": 0.8571428571428571, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "49", @@ -402,7 +490,9 @@ "c_boundary": 4, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.6666666666666666 + "conductance": 0.6666666666666666, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "5", @@ -411,7 +501,9 @@ "c_boundary": 4, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.6666666666666666 + "conductance": 0.6666666666666666, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "50", @@ -420,7 +512,9 @@ "c_boundary": 124, "edge_density": 0.5, "degree_density": 0.75, - "conductance": 0.9538461538461539 + "conductance": 0.9538461538461539, + "mincut": 1, + "mincut_over_log10n": 1.660964047443681 }, { "com_id": "51", @@ -429,7 +523,9 @@ "c_boundary": 5, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.7142857142857143 + "conductance": 0.7142857142857143, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "52", @@ -438,7 +534,9 @@ "c_boundary": 2, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.5 + "conductance": 0.5, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "53", @@ -447,7 +545,9 @@ "c_boundary": 4, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.6666666666666666 + "conductance": 0.6666666666666666, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "54", @@ -456,7 +556,9 @@ "c_boundary": 10, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.8333333333333334 + "conductance": 0.8333333333333334, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "55", @@ -465,7 +567,9 @@ "c_boundary": 2673, "edge_density": 0.31216931216931215, "degree_density": 4.214285714285714, - "conductance": 0.9188724647645239 + "conductance": 0.9188724647645239, + "mincut": 2, + "mincut_over_log10n": 1.3820190723365764 }, { "com_id": "56", @@ -474,7 +578,9 @@ "c_boundary": 1075, "edge_density": 0.18758434547908232, "degree_density": 3.5641025641025643, - "conductance": 0.7945306725794531 + "conductance": 0.7945306725794531, + "mincut": 2, + "mincut_over_log10n": 1.2570199796837602 }, { "com_id": "57", @@ -483,7 +589,9 @@ "c_boundary": 2287, "edge_density": 0.3985200845665962, "degree_density": 8.568181818181818, - "conductance": 0.7520552449852023 + "conductance": 0.7520552449852023, + "mincut": 2, + "mincut_over_log10n": 1.2169501614589444 }, { "com_id": "58", @@ -492,7 +600,9 @@ "c_boundary": 1229, "edge_density": 0.36, "degree_density": 4.32, - "conductance": 0.8505190311418686 + "conductance": 0.8505190311418686, + "mincut": 3, + "mincut_over_log10n": 2.1460148371100893 }, { "com_id": "59", @@ -501,7 +611,9 @@ "c_boundary": 1485, "edge_density": 0.36, "degree_density": 4.32, - "conductance": 0.873015873015873 + "conductance": 0.873015873015873, + "mincut": 2, + "mincut_over_log10n": 1.430676558073393 }, { "com_id": "6", @@ -510,7 +622,9 @@ "c_boundary": 6, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.75 + "conductance": 0.75, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "60", @@ -519,7 +633,9 @@ "c_boundary": 1168, "edge_density": 0.17846153846153845, "degree_density": 2.230769230769231, - "conductance": 0.9096573208722741 + "conductance": 0.9096573208722741, + "mincut": 2, + "mincut_over_log10n": 1.4134541847506568 }, { "com_id": "61", @@ -528,7 +644,9 @@ "c_boundary": 1689, "edge_density": 0.6111111111111112, "degree_density": 2.4444444444444446, - "conductance": 0.9746105020196192 + "conductance": 0.9746105020196192, + "mincut": 3, + "mincut_over_log10n": 3.143854911434077 }, { "com_id": "62", @@ -537,7 +655,9 @@ "c_boundary": 1624, "edge_density": 0.22365591397849463, "degree_density": 3.3548387096774195, - "conductance": 0.8864628820960698 + "conductance": 0.8864628820960698, + "mincut": 2, + "mincut_over_log10n": 1.3410563032888585 }, { "com_id": "63", @@ -546,7 +666,9 @@ "c_boundary": 1081, "edge_density": 0.29411764705882354, "degree_density": 2.3529411764705883, - "conductance": 0.9310938845822567 + "conductance": 0.9310938845822567, + "mincut": 2, + "mincut_over_log10n": 1.625423018583918 }, { "com_id": "64", @@ -555,7 +677,9 @@ "c_boundary": 1589, "edge_density": 0.12372881355932204, "degree_density": 3.65, - "conductance": 0.7839171188949186 + "conductance": 0.7839171188949186, + "mincut": 2, + "mincut_over_log10n": 1.1247637115056954 }, { "com_id": "65", @@ -564,7 +688,9 @@ "c_boundary": 1638, "edge_density": 0.10853658536585366, "degree_density": 2.1707317073170733, - "conductance": 0.9019823788546255 + "conductance": 0.9019823788546255, + "mincut": 2, + "mincut_over_log10n": 1.2400917777462312 }, { "com_id": "66", @@ -573,7 +699,9 @@ "c_boundary": 347, "edge_density": 0.12298387096774194, "degree_density": 1.90625, - "conductance": 0.7398720682302772 + "conductance": 0.7398720682302772, + "mincut": 2, + "mincut_over_log10n": 1.3287712379549448 }, { "com_id": "67", @@ -582,7 +710,9 @@ "c_boundary": 609, "edge_density": 0.09634146341463415, "degree_density": 1.9268292682926829, - "conductance": 0.7940026075619296 + "conductance": 0.7940026075619296, + "mincut": 2, + "mincut_over_log10n": 1.2400917777462312 }, { "com_id": "68", @@ -591,7 +721,9 @@ "c_boundary": 125, "edge_density": 0.7, "degree_density": 1.4, - "conductance": 0.8992805755395683 + "conductance": 0.8992805755395683, + "mincut": 2, + "mincut_over_log10n": 2.861353116146786 }, { "com_id": "69", @@ -600,7 +732,9 @@ "c_boundary": 134, "edge_density": 1.0, "degree_density": 2.0, - "conductance": 0.8701298701298701 + "conductance": 0.8701298701298701, + "mincut": 4, + "mincut_over_log10n": 5.722706232293572 }, { "com_id": "7", @@ -609,7 +743,9 @@ "c_boundary": 25, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.9259259259259259 + "conductance": 0.9259259259259259, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "8", @@ -618,7 +754,9 @@ "c_boundary": 8, "edge_density": 1.0, "degree_density": 0.5, - "conductance": 0.8 + "conductance": 0.8, + "mincut": 1, + "mincut_over_log10n": 3.321928094887362 }, { "com_id": "9", @@ -627,6 +765,8 @@ "c_boundary": 22, "edge_density": 0.6666666666666666, "degree_density": 0.6666666666666666, - "conductance": 0.8461538461538461 + "conductance": 0.8461538461538461, + "mincut": 1, + "mincut_over_log10n": 2.095903274289385 } ] \ No newline at end of file -- cgit v1.2.3