# board_solver.py
"""
A class to solve ruzzle boards and find words sorted by score.
Constants are defined in config.py, and some of these can be tweaked for
performance.
This class can also be used as a standalone program, and can write words to a
file if provided a board.txt file containing information about the board. The
first 4 lines of board.txt should contain the letters of the board, all caps
and separated by spaces. Line 5 is blank, and lines 6-9 contain information
about multipliers. 2, 3, D, T, and - are DW, TW, DL, TL, and nothing
respectively. If you don't want to input multipliers just set all 16 characters
to '-' (scores and word order won't be accurate).
Author: David Chen
"""
import config as cf
from collections import defaultdict
# Module-level holders for the dictionary and the prefixes at run time;
# both start out as None until the word data has been read.
DICTIONARY = PREFIXES = None
class BoardSolver:
    """Find and score every dictionary word that can be traced on a square letter board.

    Constructing an instance solves the board immediately: the adjacency graph and
    per-cell scores are built, every path is searched, and the results are stored.

    Attributes (see ``__slots__``):
        board: rows of single upper-case letters.
        word_mults: rows of multiplier codes, one per cell. Digit codes are word
            multipliers; 'D' / 'T' double / triple the letter's points; anything
            else means no multiplier.
        board_size: side length of the board.
        word_int_mults: word multiplier of each cell as an int (1 when none).
        points: letter points of each cell with 'D' / 'T' already applied.
        graph: adjacency list mapping (x, y) to the neighbouring (x, y) cells.
        possible_words: list of (word, score, path) tuples found by the search.
        words_info: dict mapping word -> (score, path), best score per word.
    """

    __slots__ = ["board", "word_mults", "board_size", "word_int_mults",
                 "points", "graph", "possible_words", "words_info"]

    # Base point value of each letter (no bonuses); built once instead of per lookup.
    _LETTER_POINTS = {'A': 1, 'B': 4, 'C': 4, 'D': 2, 'E': 1, 'F': 4, 'G': 3, 'H': 4, 'I': 1, 'J': 10, 'K': 5,
                      'L': 1,
                      'M': 3, 'N': 1, 'O': 1, 'P': 4, 'Q': 10, 'R': 1, 'S': 1, 'T': 1, 'U': 2, 'V': 4, 'W': 4,
                      'X': 8,
                      'Y': 4, 'Z': 8}

    def __init__(self, board, word_mults, board_size=cf.BOARD_SIZE):
        """Store the board, precompute scores and adjacency, then solve the board.

        Args:
            board: rows of upper-case letters.
            word_mults: rows of multiplier codes matching ``board`` cell for cell.
            board_size: side length of the board; ``None`` means ``len(board)``.
        """
        global DICTIONARY, PREFIXES
        if board_size is None:
            board_size = len(board)
        self.board = board
        self.word_mults = word_mults
        self.board_size = board_size
        self.word_int_mults = self.word_mults_to_int_array()
        self.points = self.get_points()
        self.graph = self.gen_graph()
        self.possible_words = []
        self.words_info = {}
        # Initialize DICTIONARY and PREFIXES if they're not yet read.
        if DICTIONARY is None:
            DICTIONARY = get_dict()
        if PREFIXES is None:
            PREFIXES = get_prefixes()
        self.all_combos()
        self.check_words()

    @classmethod
    def open(cls, file_path=cf.MAIN_DIR / "board.txt", board_size=4):
        """Read a board file and return a solved BoardSolver for it.

        The first ``board_size`` lines hold the letters, then one empty line, then
        ``board_size`` lines of whitespace-separated multiplier codes.

        Args:
            file_path: path of the board file.
            board_size: side length of the board. If ``None``, it is inferred from
                the number of letters on the first line of the file.
        """
        # Inside a method body the bare name `open` is the builtin, not this classmethod:
        # class-level names are not part of a method's name resolution.
        with open(file_path) as file:
            lines = file.read().splitlines()
        if board_size is None:
            # Infer the size from the first line; slicing/adding with None would fail below.
            board_size = sum(1 for ch in lines[0] if ch.isalpha()) if lines else 0
        board = [[ch.upper() for ch in row if ch.isalpha()] for row in lines[:board_size]]
        # Skip the separator line that sits between the letters and the multipliers.
        word_mults = [row.split() for row in lines[board_size + 1: 2 * board_size + 1]]
        return cls(board, word_mults, board_size)

    @classmethod
    def solve_file(cls, file_path=cf.MAIN_DIR / "board.txt", board_size=None):
        """Read the board at ``file_path`` and return its list of (word, score, path) tuples."""
        board = cls.open(file_path, board_size)
        return board.all_combos()

    @staticmethod
    def _word_score(letter_pts, word_mult, length):
        """Return the score of a word: letter points times word multiplier plus the length bonus."""
        bonus = 0 if length < 4 else 5 * (length - 4)  # length bonus
        return letter_pts * word_mult + bonus

    def dfs(self, visited, s, word, word_pts, word_mult, path):
        """Depth-first search from cell ``s``, recording every dictionary word found.

        Args:
            visited: dict mapping (x, y) -> bool for cells already used on this path.
            s: the (x, y) cell the search currently stands on.
            word: letters collected so far, ending with the letter at ``s``.
            word_pts: summed letter points of ``word``.
            word_mult: product of the word multipliers along the path.
            path: list of (x, y) cells spelling ``word``; mutated during the search
                and restored to its incoming contents before returning.
        """
        len_word = len(word)
        # store all >2 letter possible words in words_info if they are actual words
        if len_word >= cf.MIN_WORD_LEN and word in DICTIONARY:
            self.possible_words.append((word, self._word_score(word_pts, word_mult, len_word), path[:]))
        visited[s] = True  # begin DFS, make sure no overlaps
        path.append(None)  # placeholder slot, overwritten with each neighbour tried
        len_word += 1  # from here on: length of the word including the neighbour's letter
        for v in self.graph[s]:  # graph[s] contains the adjacent points
            if visited[v]:
                continue
            x, y = v
            path[-1] = v  # add position to path list
            temp_word = word + self.board[x][y]
            if len_word >= cf.MIN_WORD_LEN:
                # Prune branches whose letters are not the start of any word.
                if (cf.PREFIX_LOWER_BOUND <= len_word <= cf.PREFIX_UPPER_BOUND
                        and temp_word not in PREFIXES[len_word - cf.PREFIX_LOWER_BOUND]):
                    continue
                # There are no longer words (assumes cf.MAX_WORD_LEN is the longest
                # dictionary word), so record a match here and stop going deeper.
                if len_word == cf.MAX_WORD_LEN:
                    if temp_word in DICTIONARY:
                        # Score the full word, including this last letter's points and multiplier,
                        # and store a copy of the path because `path` keeps being mutated.
                        score = self._word_score(word_pts + self.points[x][y],
                                                 word_mult * self.word_int_mults[x][y], len_word)
                        self.possible_words.append((temp_word, score, path[:]))
                    continue
            visited[v] = True
            # search from this new point
            self.dfs(visited, v, temp_word, word_pts + self.points[x][y],
                     word_mult * self.word_int_mults[x][y], path)
            # reset everything to continue to search in other directions
            visited[v] = False
        del path[-1]

    def all_combos(self):
        """Return the list of (word, score, path) tuples, searching the board first if it is still empty."""
        if self.possible_words:
            return self.possible_words
        size = self.board_size  # honour the instance's size rather than the configured default
        for x in range(size):
            for y in range(size):
                visited = {(i, j): False for i in range(size) for j in range(size)}
                self.dfs(visited, (x, y), self.board[x][y], self.points[x][y],
                         self.word_int_mults[x][y], [(x, y)])
        return self.possible_words

    def check_words(self, remove_bases=False):
        """Build and return ``words_info``: a dict mapping each word to its best (score, path).

        Args:
            remove_bases: if True, drop every word that appears inside another,
                longer found word (removes 'sleep' if 'sleeping' is a word).
        """
        if not self.possible_words:
            self.all_combos()
        words_info = [entry for entry in self.possible_words if entry[0] in DICTIONARY]
        # Ascending by score: when a word occurs on several paths, the dict built
        # below keeps the last one seen, i.e. the highest-scoring one.
        words_info.sort(key=lambda entry: entry[1])
        # remove 'walk' if 'walks' is a word
        if remove_bases:
            all_words = {entry[0] for entry in words_info}
            # A word is always contained in itself, so only compare against *other* words.
            # Keep a list: order matters for the dict below and paths (lists) are unhashable.
            words_info = [entry for entry in words_info
                          if not any(entry[0] != other and entry[0] in other for other in all_words)]
        self.words_info = {word: (score, path) for word, score, path in words_info}
        return self.words_info

    def write_words_to_file(self, print_info=False):
        """Write every found word with its score to words.txt, solving the board first if needed.

        Words are written highest score first; ties are ordered by word length.

        Args:
            print_info: if True, also print the number of words and their total score.
        """
        if not self.words_info:
            self.all_combos()
            self.check_words()
        with open(cf.MAIN_DIR / 'words.txt', 'w') as words_file:
            # words_info.items() yields tuples: (word, (score, path))
            high_scores = sorted(self.words_info.items(), key=lambda x: (-x[1][0], len(x[0])))
            for word, info in high_scores:
                print(word, info[0], file=words_file)
        if print_info:
            print('Number of words:', len(high_scores))
            print('Total score:', sum(info[0] for word, info in high_scores))

    def get_points(self):
        """Return the grid of letter points, with 'D' (double) and 'T' (triple) letter multipliers applied."""
        points = []
        for i in range(self.board_size):  # row
            row_pts = []
            for j in range(self.board_size):  # column
                pts = self.get_letter_pts(self.board[i][j])
                mult = self.word_mults[i][j]
                if mult == 'D':
                    pts *= 2
                elif mult == 'T':
                    pts *= 3
                row_pts.append(pts)
            points.append(row_pts)
        return points

    @staticmethod
    def get_letter_pts(l):
        """Return the point value of upper-case letter ``l`` (no bonuses); raises KeyError for anything else."""
        return BoardSolver._LETTER_POINTS[l]

    def word_mults_to_int_array(self):
        """Return the grid of word multipliers as ints: digit codes become their value, all others 1."""
        size = self.board_size
        int_word_mults = []
        for i in range(size):
            row = []
            for j in range(size):
                code = self.word_mults[i][j]
                row.append(int(code) if code.isdigit() else 1)
            int_word_mults.append(row)
        return int_word_mults

    def gen_graph(self):
        """Return an adjacency list mapping each (x, y) cell to its in-bounds neighbours (8 directions)."""
        directions = [(1, 0), (-1, 0), (0, 1), (0, -1), (1, 1), (1, -1), (-1, 1), (-1, -1)]
        graph = defaultdict(list)
        # for each point (key), store the adjacent points (values) in graph
        for x in range(self.board_size):
            for y in range(self.board_size):
                for cx, cy in directions:
                    if 0 <= x + cx < self.board_size and 0 <= y + cy < self.board_size:
                        graph[(x, y)].append((x + cx, y + cy))
        return graph
def get_dict():
    """Return the set of words in the dictionary file.

    Reads 'TWL06Trimmed.txt' from ``cf.MAIN_DIR``, one word per line. A set is
    returned because checking whether a word is in a set is faster than in a list.
    """
    dict_file = cf.MAIN_DIR / 'TWL06Trimmed.txt'
    # Use a context manager so the file handle is closed as soon as it has been read.
    with open(dict_file) as file:
        return set(file.read().splitlines())
def get_prefixes():
    """Load the prefix files and return them as a list of sets.

    One set is produced per prefix length, from ``cf.PREFIX_LOWER_BOUND`` up to and
    including ``cf.PREFIX_UPPER_BOUND``, in that order; each set holds the lines of
    the matching 'prefixes<N>L.txt' file.
    """
    per_length = []
    n_letters = cf.PREFIX_LOWER_BOUND
    last_length = cf.PREFIX_UPPER_BOUND
    while n_letters <= last_length:
        prefix_path = cf.MAIN_DIR / cf.PREFIX_DIR / f'prefixes{n_letters}L.txt'
        with open(prefix_path) as handle:
            contents = handle.read()
        per_length.append(set(contents.splitlines()))
        n_letters += 1
    return per_length
if __name__ == '__main__':
    # Test entry point: reads the board from 'board.txt' and writes the words to file.
    # Load the word data up front so the solver finds it already in place.
    DICTIONARY, PREFIXES = get_dict(), get_prefixes()
    # Build the solver from the board file, then write out the words it found.
    boardSolver = BoardSolver.open(cf.MAIN_DIR / 'board.txt')
    boardSolver.write_words_to_file(print_info=True)