-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmain.py
128 lines (95 loc) · 3.62 KB
/
main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
from itertools import groupby
from sklearn.cluster import KMeans
import matplotlib.pyplot as plt
import worldle
from scipy.spatial.distance import cdist
from scipy.optimize import linear_sum_assignment
import numpy as np
from urllib import parse
SHOW_COUNTRIES = False
TEAMMEMBERS = [
"Nihar",
"Sam",
"Anitha",
"Suresh",
"Sonam",
"Sandeep",
"Jacek",
"Blake",
"Johnnie",
]
N_CLUSTERS = len(TEAMMEMBERS)
def get_country_tuples(countries):
for country in countries:
yield country.longitude, country.latitude, country.name
def plot_countries(longitudes, latitudes, labels, colours=None, title=None):
plt.figure(figsize=(18, 8))
plt.scatter(longitudes, latitudes, c=colours)
if title:
plt.title(title)
for i, label in enumerate(labels):
plt.annotate(label, (longitudes[i], latitudes[i]))
def make_clusters_even(clusters, cordinates):
cluster_size = int(np.ceil(len(cordinates) / N_CLUSTERS))
centers = clusters.cluster_centers_
centers = (
centers.reshape(-1, 1, cordinates.shape[-1])
.repeat(cluster_size, 1)
.reshape(-1, cordinates.shape[-1])
)
distance_matrix = cdist(cordinates, centers)
clusters = linear_sum_assignment(distance_matrix)[1] // cluster_size
return clusters
def even_kmeans_countries(longitudes, latitudes):
cordinates = np.array(list(zip(longitudes, latitudes)))
clusters = KMeans(n_clusters=N_CLUSTERS, random_state=1)
clusters.fit(cordinates)
return make_clusters_even(clusters, cordinates)
def group_by_cluster(longitudes, latitudes, labels, clusters):
key_function = lambda x: x[-1]
yield from groupby(
sorted(zip(longitudes, latitudes, labels, clusters), key=key_function),
key=key_function,
)
def generate_markdown():
countries = worldle.get_countries()
country_tuples = get_country_tuples(countries)
longitudes, latitudes, labels = zip(*(country_tuples))
clusters = even_kmeans_countries(longitudes, latitudes)
plot_countries(
longitudes,
latitudes,
labels,
colours=clusters,
title=f"Even cluster distribution among {len(TEAMMEMBERS)} team members.",
)
plt.savefig(f"images/total.png")
if SHOW_COUNTRIES:
plt.show()
print(f"# Even cluster distribution among {len(TEAMMEMBERS)} team members.")
print(
f"![All countries](https://github.com/gastlich/worldle-distribution/blob/main/images/total.png?raw=true)"
)
grouped_countries = group_by_cluster(longitudes, latitudes, labels, clusters)
for member_index, countries in grouped_countries:
generate_markdown_for_member(member_index, countries)
def generate_markdown_for_member(member_index, countries):
countries = list(countries)
unzipped_countries = zip(*list(countries))
longitudes, latitudes, labels, cluster = unzipped_countries
member = TEAMMEMBERS[member_index]
plot_countries(longitudes, latitudes, labels, title=member)
plt.savefig(f"images/{member.lower()}.png")
if SHOW_COUNTRIES:
plt.show()
print(f"\n\n# {member} is going to learn the following {len(countries)} countries:")
print(
f"![{member}'s countries](https://github.com/gastlich/worldle-distribution/blob/main/images/{member.lower()}.png?raw=true)\n"
)
print(f"| Country | Longitude | Latitude | Google Maps |")
print(f"| ------- | --------- | -------- | ----------- |")
for country in countries:
print(
f"| {country[2]} | {country[0]} | {country[1]} | [Link](https://www.google.co.uk/maps/place/{parse.quote_plus(country[2])}/)"
)
generate_markdown()