-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathwordle
executable file
·224 lines (194 loc) · 7.62 KB
/
wordle
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
#!/usr/bin/env python3
"""
Python CLI assistant for Wordle players.
"""
import os, re, sys
import requests
import pathlib
WORD_LENGTH = 5
DICTIONARY_URL = 'https://raw.githubusercontent.com/DevangThakkar/wordle_archive/23cfba6a97cd61cc6b01ed8a399eb6df90dad88d/src/data/words.js'
def download_dictionary():
response = requests.get(DICTIONARY_URL)
if response.status_code != 200:
raise Exception('Got HTTP status {response.status_code} when trying to download the dictionary')
all_words = ''
for line in response.text.split('\n'):
if ':' in line:
all_words += line.split(':')[0].strip() + '\n'
return all_words
def cache_directory_path():
home_dir = os.environ.get('HOME', os.path.expanduser('~'))
cache_dir = os.path.join(home_dir, '.cache')
xdg_cache_dir = os.environ.get('XDG_CACHE_HOME', cache_dir)
our_name = os.path.basename(sys.argv[0])
our_cache_dir = os.path.join(xdg_cache_dir, our_name)
return our_cache_dir
def cache_dictionary_path():
return os.path.join(cache_directory_path(), 'dictionary')
def store_dictionary(data):
cache_path = pathlib.Path(cache_directory_path())
cache_path.mkdir(parents=True, exist_ok=True)
with open(cache_dictionary_path(), 'w') as dict_filedesc:
dict_filedesc.write(data)
def open_cached_dictionary():
if not os.path.isfile(cache_dictionary_path()):
store_dictionary(download_dictionary())
return open(cache_dictionary_path())
def dictionary():
with open_cached_dictionary() as words_filedesc:
word_count = 0
for word in words_filedesc.readlines():
word = word.rstrip()
# Focus on candidate words:
if len(word) != WORD_LENGTH:
continue
# Ignore words with non alphabetic characters:
if not re.match(r'^[a-zA-Z]+$', word):
continue
word = word.lower()
yield word
def words_with_all_letters(required_letters):
for word in dictionary():
if has_required_letters(word, required_letters):
yield word
def words_with_most_letters(letters):
if not letters:
return []
for i in range(WORD_LENGTH, 1, -1):
candidates = list(words_with_all_letters(letters[:i]))
if candidates:
return candidates
def set_string_char(string, index, char):
char_array = list(string)
char_array[index] = char
return ''.join(char_array)
def dotted_pattern(position=None, letter=None, length=WORD_LENGTH):
pattern = '.' * WORD_LENGTH
if position is not None and letter is not None:
pattern = set_string_char(pattern, position - 1, letter)
return pattern
def parse_misplaced_letter(misplaced_letter):
misplaced_letter = misplaced_letter.lower()
# Format #1: a1, 3b, 4d
parse_misplaced_letter_re1 = r'^(?P<letter>[a-z])(?P<position>[0-9])$'
parse_misplaced_letter_re2 = r'^(?P<position>[0-9])(?P<letter>[a-z])$'
if rem := re.match(parse_misplaced_letter_re1, misplaced_letter) or re.match(parse_misplaced_letter_re2, misplaced_letter):
position = int(rem.group('position'))
if 1 <= position <= WORD_LENGTH:
yield dotted_pattern(position, rem.group('letter'))
else:
raise Exception(f'Invalid position {position} in {misplaced_letter}')
# Format #2: ^u
elif rem := re.match('^\^(?P<letter>[a-z])$', misplaced_letter):
yield dotted_pattern(1, rem.group('letter'))
# Format #3: u$
elif rem := re.match('^(?P<letter>[a-z])\$$', misplaced_letter):
yield dotted_pattern(WORD_LENGTH, rem.group('letter'))
# Format #4: ..a.. .abc.
else:
if len(misplaced_letter) != WORD_LENGTH:
raise Exception(f'{misplaced_letter} is {len(misplaced_letter)}-char long instead of {WORD_LENGTH}')
for position, char in enumerate(misplaced_letter, 1):
if 'a' <= char <= 'z':
yield dotted_pattern(position, char)
def extract_letters(string):
return list(filter(lambda c: 'a' <= c <= 'z', string))
def has_required_letters(word, required_letters):
for required_letter in required_letters:
if required_letter not in word:
return False
return True
def analyse_letter_frequency(words):
results = {'data': {}, 'top': []}
for word in words:
for char in word:
results['data'][char] = results['data'].setdefault(char, 0) + 1
results['top'] = sorted(results['data'], key=lambda x: results['data'][x], reverse=True)
return results
# Real work starts here:
if '-h' in sys.argv or '--help' in sys.argv:
our_name = os.path.basename(sys.argv[0])
help = f"""Wordle Assistant.
Usage:
{our_name}: list all {WORD_LENGTH}-letter words
{our_name} wrongletters: same, but remove words that contain any of the wrong letters
Caution: this parameter cannot be empty.
Example: {our_name} tyrch
{our_name} wrongletters pattern: same, but keep only words that match the given (Python) regex pattern
Use a dash (-) character if you do not have a pattern yet
Examples:
{our_name} tyrch g.e.s
{our_name} tyrch ^g
{our_name} tyrch s$
{our_name} tyrch '^g[ue]'
{our_name} wrongletters pattern misplaced_letters ...: same but takes misplaced letters into account
There are multiple supported notations:
- positions range from 1 to {WORD_LENGTH}
- "3g" or "g3" means that a "g" at position 3 was considered misplaced
- "^u" means that a "u" at the start of the word was considered misplaced
- "e$" means that an "e" at the end of the word was considered misplaced
- ".s.u." means that an "s" at position 2 and a "u" at position 4 were considered misplaced
Examples:
{our_name} tyrch - 3g ^u e$ .s.u.
{our_name} tyrch '^g[ue]' 3g ^u e$ .s.u.
"""
print(help)
sys.exit(0)
wrong_letters_re = correct_letters_re = all_misplaced_letters_re = required_letters = None
all_required_letters = []
if len(sys.argv) >= 2:
wrong_letters = sys.argv[1].lower()
wrong_letters_re = f'[{wrong_letters}]'
if len(sys.argv) >= 3:
if sys.argv[2] == '-':
correct_letters = dotted_pattern()
else:
correct_letters = sys.argv[2].lower()
correct_letters_re = f'{correct_letters}'
# Assume all letters in the pattern are required, i.e. assume there are no negative character classes:
all_required_letters = extract_letters(correct_letters)
if len(sys.argv) >= 4:
all_misplaced_letters_re = []
for misplaced_letter_arg in sys.argv[3:]:
all_misplaced_letters_re.extend(list(parse_misplaced_letter(misplaced_letter_arg)))
all_misplaced_letters_re = '|'.join(all_misplaced_letters_re)
all_misplaced_letters_re = f'^(?:{all_misplaced_letters_re})$'
required_letters = extract_letters(all_misplaced_letters_re)
all_required_letters.extend(required_letters)
retained_words_set = set()
for word in dictionary():
if wrong_letters_re:
# Discard words that contain wrong letters:
if re.search(wrong_letters_re, word):
continue
if correct_letters_re:
# Discard words that do not match correct letters in correct spots:
if not re.search(correct_letters_re, word):
continue
if all_misplaced_letters_re:
# Discard words that feature misplaced letters:
if re.match(all_misplaced_letters_re, word):
continue
# Discard words that do not contain the required letters:
if not has_required_letters(word, required_letters):
continue
# Still here? Keep this word:
retained_words_set.add(word)
# Display all retained words:
retained_words = list(retained_words_set)
retained_words.sort()
for word in retained_words:
print(word)
# Provide some hints:
if len(retained_words) > 1:
analysis = analyse_letter_frequency(retained_words)
all_required_letters = list(set(all_required_letters))
print(f'({len(retained_words)}) Top letters: %s' % ' '.join(analysis['top']))
if all_required_letters:
top_new_letters = list(filter(lambda c: c not in all_required_letters, analysis['top']))
if top_new_letters:
print('Top new letters:', ' '.join(top_new_letters))
if len(retained_words) > 2:
discriminants = words_with_most_letters(top_new_letters)
print('Suggested discriminants:', ' '.join(discriminants[:50]))
sys.exit(0)