-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathroute_triangles.sql
86 lines (71 loc) · 3.54 KB
/
route_triangles.sql
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
-- To count triangles, we first have to form them.
-- For this we first get the second neighbours (excluding the initial node itself).
-- Then we get the third neighbours, with the condition that they are the initial node, thus completing the triangles.
-- Finally we add a weight column (a row count per triangle) for easier summation.
-- DAYTIME--------------------------------------------------------------------------------------------------------------
-- Build route_triangles_daytime from the daytime link table.
--   two_hop      : every 2-step walk route_1 -> route_2 -> route_3 that does not
--                  end on the node it started from.
--   closing_link : a link leading from route_3 back to route_1, which closes the
--                  walk into route_1 -> route_2 -> route_3 -> route_1.
-- route_4 is the end of the closing link and therefore always equals route_1.
-- weight is the number of joined rows per (route_1, route_2, route_3, route_4).
WITH two_hop AS (
    SELECT
        first_link.route_1,
        first_link.route_2,
        second_link.route_2 AS route_3
    FROM route_w_links_daytime AS first_link
    INNER JOIN route_w_links_daytime AS second_link
        ON second_link.route_1 = first_link.route_2
    WHERE first_link.route_1 <> second_link.route_2
)
SELECT
    two_hop.route_1,
    two_hop.route_2,
    two_hop.route_3,
    closing_link.route_2 AS route_4,
    COUNT(*) AS weight
INTO route_triangles_daytime
FROM two_hop
INNER JOIN route_w_links_daytime AS closing_link
    ON closing_link.route_1 = two_hop.route_3
    AND closing_link.route_2 = two_hop.route_1
GROUP BY
    two_hop.route_1,
    two_hop.route_2,
    two_hop.route_3,
    closing_link.route_2
ORDER BY two_hop.route_1;
-- GLOBAL CLUSTERING (present triangles divided by possible triangles)
-- Global clustering coefficient of the daytime network:
--   SUM(weight) over route_triangles_daytime
--   divided by SUM(degree * (degree - 1)) over route_degree_daytime.
-- Each side is a single-row aggregate, so the two are combined with a CROSS JOIN
-- rather than being matched on a dummy row count. This always yields exactly one
-- row, even when one of the input tables is empty (the result is then NULL).
-- NULLIF maps a zero denominator to NULL so the query returns NULL instead of
-- failing with a division-by-zero error.
SELECT
    closed.weight_total / NULLIF(possible.pair_total, 0) AS global_clustering
FROM (
    SELECT SUM(weight) AS weight_total
    FROM route_triangles_daytime
) AS closed
CROSS JOIN (
    SELECT SUM(degree * (degree - 1)) AS pair_total
    FROM route_degree_daytime
) AS possible;
-- GLOBAL CLUSTERING = 0.466
-- We can also count how many triangles each node has, and divide by the possible number of triangles (0.5*k*(k-1), where k is the node's degree).
-- The count is divided by two because every triangle appears twice per node in the triangles table (a-b-c-a and a-c-b-a).
-- Per-route (local) clustering for the daytime network, stored in
-- route_clustering_daytime as (route_1, clustering).
--   tri      : triangles per starting route. SUM(weight) is halved because each
--              triangle is listed twice per starting route (a-b-c-a and a-c-b-a).
--              A single GROUP BY replaces the former DISTINCT + correlated
--              subquery, which re-scanned the triangle table once per row.
--   possible : maximum number of triangles for a route, degree * (degree - 1) * 0.5.
-- No ORDER BY is applied inside the derived table: ordering there does not define
-- the order of the joined result.
-- NOTE(review): the inner join keeps only routes that appear in
-- route_triangles_daytime, so routes without any triangle are absent from the
-- output table (and from the average below) -- confirm this is intended.
SELECT
    tri.route_1,
    tri.triangle_count / possible.count_max AS clustering
INTO route_clustering_daytime
FROM (
    SELECT
        route_1,
        SUM(weight) / 2 AS triangle_count
    FROM route_triangles_daytime
    GROUP BY route_1
) AS tri
INNER JOIN (
    SELECT
        route_1,
        degree * (degree - 1) * 0.5 AS count_max
    FROM route_degree_daytime
) AS possible
    ON possible.route_1 = tri.route_1;

-- Average of the per-route clustering values stored above.
SELECT AVG(clustering) FROM route_clustering_daytime;
-- AVG CLUSTERING = 0.57
-- NIGHTTIME------------------------------------------------------------------------------------------------------------
-- Build route_triangles_nighttime from the nighttime link table.
--   two_hop      : every 2-step walk route_1 -> route_2 -> route_3 that does not
--                  end on the node it started from.
--   closing_link : a link leading from route_3 back to route_1, which closes the
--                  walk into route_1 -> route_2 -> route_3 -> route_1.
-- route_4 is the end of the closing link and therefore always equals route_1.
-- weight is the number of joined rows per (route_1, route_2, route_3, route_4).
WITH two_hop AS (
    SELECT
        first_link.route_1,
        first_link.route_2,
        second_link.route_2 AS route_3
    FROM route_w_links_nighttime AS first_link
    INNER JOIN route_w_links_nighttime AS second_link
        ON second_link.route_1 = first_link.route_2
    WHERE first_link.route_1 <> second_link.route_2
)
SELECT
    two_hop.route_1,
    two_hop.route_2,
    two_hop.route_3,
    closing_link.route_2 AS route_4,
    COUNT(*) AS weight
INTO route_triangles_nighttime
FROM two_hop
INNER JOIN route_w_links_nighttime AS closing_link
    ON closing_link.route_1 = two_hop.route_3
    AND closing_link.route_2 = two_hop.route_1
GROUP BY
    two_hop.route_1,
    two_hop.route_2,
    two_hop.route_3,
    closing_link.route_2
ORDER BY two_hop.route_1;
-- Global clustering coefficient of the nighttime network:
--   SUM(weight) over route_triangles_nighttime
--   divided by SUM(degree * (degree - 1)) over route_degree_nighttime.
-- Each side is a single-row aggregate, so the two are combined with a CROSS JOIN
-- rather than being matched on a dummy row count. This always yields exactly one
-- row, even when one of the input tables is empty (the result is then NULL).
-- NULLIF maps a zero denominator to NULL so the query returns NULL instead of
-- failing with a division-by-zero error.
SELECT
    closed.weight_total / NULLIF(possible.pair_total, 0) AS global_clustering
FROM (
    SELECT SUM(weight) AS weight_total
    FROM route_triangles_nighttime
) AS closed
CROSS JOIN (
    SELECT SUM(degree * (degree - 1)) AS pair_total
    FROM route_degree_nighttime
) AS possible;
-- GLOBAL CLUSTERING = 0.652
-- Per-route (local) clustering for the nighttime network, stored in
-- route_clustering_nighttime as (route_1, clustering).
--   tri      : triangles per starting route. SUM(weight) is halved because each
--              triangle is listed twice per starting route (a-b-c-a and a-c-b-a).
--              A single GROUP BY replaces the former DISTINCT + correlated
--              subquery, which re-scanned the triangle table once per row.
--   possible : maximum number of triangles for a route, degree * (degree - 1) * 0.5.
-- No ORDER BY is applied inside the derived table: ordering there does not define
-- the order of the joined result.
-- NOTE(review): the inner join keeps only routes that appear in
-- route_triangles_nighttime, so routes without any triangle are absent from the
-- output table (and from the average below) -- confirm this is intended.
SELECT
    tri.route_1,
    tri.triangle_count / possible.count_max AS clustering
INTO route_clustering_nighttime
FROM (
    SELECT
        route_1,
        SUM(weight) / 2 AS triangle_count
    FROM route_triangles_nighttime
    GROUP BY route_1
) AS tri
INNER JOIN (
    SELECT
        route_1,
        degree * (degree - 1) * 0.5 AS count_max
    FROM route_degree_nighttime
) AS possible
    ON possible.route_1 = tri.route_1;

-- Average of the per-route clustering values stored above.
SELECT AVG(clustering) FROM route_clustering_nighttime;
-- AVG CLUSTERING = 0.715