-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsetup.py
52 lines (47 loc) · 2.11 KB
/
setup.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
"""
This script, using a dictionary provided by github.com/dwyl/english-words,
sorts each word in the dictionary (let's call this the sorted_word of any given
word).
The script in create_anagram_dictionary(), creates a dictionary that uses
orted_words as keys with their values being an array of words that shares that
same sorted_word.
cache_anagram_dictionary() creates a .txt file (data/anagram_dictionary.txt)
where the dictionary created in create_anagram_dictionary() is stored in the
format:
<sorted_word>:<word>|<word2>,...
This script only needed to be run once, to create data/anagram_dictionary.txt.
After that, the program will use that file to (somewhat) quickly re-create the
dictionary on each run.
"""
def create_anagram_dictionary():
"""
Creates a dictionary of words based on the words in file "data/words_alpha.txt"
Returns:
dictionary: a dictionary that uses a string of characters (in alphabetical order) as the key and
has a list of words that contain those characters (and only those characters).
"""
anagram_dictionary = {}
with open("data/words_alpha.txt","r") as words_file:
for line in words_file:
word = line.strip()
sorted_word = ''.join(sorted(word))
if sorted_word in anagram_dictionary:
anagram_dictionary.get(sorted_word).append(word)
else:
anagram_dictionary[sorted_word] = []
anagram_dictionary[sorted_word].append(word)
return anagram_dictionary
def cache_anagram_dictionary():
"""
creates a text file that stores the dictionary created by create_anagram_dictionary()
in the format:
<string of sorted letters>: <anagram of those letters>, <anagram of those letters2>,...
"""
anagram_dictionary_file = open("data/anagram_dictionary.txt","w")
for sorted_word, words in create_anagram_dictionary().items():
anagram_dictionary_file.write(sorted_word + ":")
for word in words:
anagram_dictionary_file.write(word + "|")
anagram_dictionary_file.write("\n")
if __name__ == '__main__':
cache_anagram_dictionary()