1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
|
#!/usr/bin/env python
# Challenge 007
#
# Challenge #2
# Word Ladder
# A word ladder is a sequence of words [w0, w1, ..., wn] such that each word wi
# in the sequence is obtained by changing a single character in the word wi-1.
# All words in the ladder must be valid English words.
#
# Given two input words and a file that contains an ordered word list, implement
# a routine (e.g., find_shortest_ladder(word1, word2, wordlist)) that finds the
# shortest ladder between the two input words. For example, for the words cold
# and warm, the routine might return:
#
# ("cold", "cord", "core", "care", "card", "ward", "warm")
# However, there's a shorter ladder: ("cold", "cord", "card", "ward", "warm").
#
# Givens:
# All words in the list have the same length.
#
# All words contain only lowercase alphabetical characters.
#
# There are no duplicates in the word list.
#
# The input words aren't empty and aren't equal but they have the same length
# as any word in the word list.
#
# Requirements:
# The routine must return a list of the words in the ladder if it exists.
# Otherwise, it returns an empty list.
#
# If either input word is the wrong length (i.e., its length differs from that
# of the words in the word list) or isn't in the word list, return an empty list.
from __future__ import print_function
import sys
import re
import collections
from collections import deque
def eprint(*args, **kwargs):
    """Print the given values to standard error.

    Positional and keyword arguments are forwarded to ``print``.  The
    ``file`` keyword is supplied here, so callers must not pass it.
    """
    stream = sys.stderr
    print(*args, file=stream, **kwargs)
def get_args():
    """Validate the command line and return the two words to connect.

    Exactly two arguments are expected after the script name.  They must
    have the same length, must differ from each other, and must consist of
    lowercase letters ``a``-``z`` only.  On any violation a message is
    reported through ``eprint`` and the process exits with status 1.

    Returns:
        The pair ``(word1, word2)`` taken from ``sys.argv[1:]``.
    """
    arguments = sys.argv[1:]
    if len(arguments) != 2:
        eprint("Usage: ch-2.py word1 word2")
        sys.exit(1)

    word1, word2 = arguments

    if len(word1) != len(word2):
        eprint("words must have the same length")
        sys.exit(1)

    if word1 == word2:
        eprint("words must be different")
        sys.exit(1)

    lowercase_only = re.compile(r"^[a-z]+$")
    for candidate in (word1, word2):
        if lowercase_only.match(candidate) is None:
            eprint("words must have lower case letters only")
            sys.exit(1)

    return word1, word2
def read_words(filename, length):
    """Load the words of a given length from a word-list file.

    Each line is stripped of surrounding whitespace.  A word is kept only
    when it has exactly ``length`` characters and consists solely of the
    lowercase letters ``a``-``z``.

    Args:
        filename: Path of the text file to read, one word per line.
        length: Required length of the words to keep.

    Returns:
        A set containing the accepted words.
    """
    lowercase_only = re.compile(r"^[a-z]+$")
    with open(filename, 'r') as handle:
        stripped_lines = (raw_line.strip() for raw_line in handle)
        return {
            entry
            for entry in stripped_lines
            if len(entry) == length and lowercase_only.match(entry)
        }
def _ladder_keys(word):
    """Return one key per position: the index plus the word minus that letter."""
    return [(index, word[:index] + word[index + 1:])
            for index in range(len(word))]


def find_shortest_ladder(word1, word2, wordlist):
    """Find a shortest word ladder from ``word1`` to ``word2``.

    A ladder is a sequence of words in which consecutive words differ in
    exactly one character position.  The search is a breadth-first search
    over ``wordlist``; neighbours are visited in alphabetical order, so
    among several shortest ladders the alphabetically first expansion wins.

    Args:
        word1: Starting word.
        word2: Target word.
        wordlist: Iterable of valid words (typically a set).

    Returns:
        The ladder as a list of words starting with ``word1`` and ending
        with ``word2``, or an empty list when no ladder exists, when the
        two words are equal, or when either word is not in ``wordlist``.
    """
    words = set(wordlist)
    if word1 == word2 or word1 not in words or word2 not in words:
        return []

    # Two words differ in exactly one position iff they share a key of the
    # form (position, word-without-that-letter).  Indexing the list once
    # avoids comparing every word against every other word during search.
    buckets = collections.defaultdict(list)
    for word in words:
        for key in _ladder_keys(word):
            buckets[key].append(word)

    # ``parents`` doubles as the visited set.  Recording each word the first
    # time it is reached keeps the search linear in the number of words
    # instead of enumerating every simple path.
    parents = {word1: None}
    queue = deque([word1])
    while queue:
        current = queue.popleft()
        neighbours = set()
        for key in _ladder_keys(current):
            neighbours.update(buckets[key])
        for candidate in sorted(neighbours):
            if candidate in parents:
                continue
            parents[candidate] = current
            if candidate == word2:
                # Walk the parent links back to the start and reverse.
                ladder = [word2]
                while parents[ladder[-1]] is not None:
                    ladder.append(parents[ladder[-1]])
                ladder.reverse()
                return ladder
            queue.append(candidate)
    return []
def next_possible_words(word1, wordlist):
    """Collect the words that can follow ``word1`` in a ladder.

    Args:
        word1: The word to step away from.
        wordlist: Iterable of candidate words.

    Returns:
        The set of candidates that are not ``word1`` itself and for which
        ``word_diff`` against ``word1`` reports exactly one difference.
    """
    return {
        candidate
        for candidate in wordlist
        if candidate != word1 and word_diff(candidate, word1) == 1
    }
def word_diff(word1, word2):
    """Return the number of positions at which two words differ.

    Characters are compared position by position.  When the words have
    different lengths, every position present in only one of them counts
    as a difference, so the result is symmetric and no index error can
    occur.

    Args:
        word1: First word.
        word2: Second word.

    Returns:
        The count of differing positions as an integer; 0 means the words
        are identical.
    """
    mismatches = sum(1 for left, right in zip(word1, word2) if left != right)
    # Positions beyond the shorter word have no counterpart to match.
    return mismatches + abs(len(word1) - len(word2))
def print_list(list):
    """Print a ladder as a parenthesised, comma-separated list of quoted words.

    For example ``["cold", "cord"]`` is printed as ``("cold", "cord")``.
    An empty ladder is printed as ``()``.

    Args:
        list: Sequence of words to print.  The name shadows the builtin but
            is kept so that existing keyword callers keep working.
    """
    quoted = ['"' + word + '"' for word in list]
    # Joining avoids the trailing-separator trimming that corrupted the
    # output for an empty ladder.
    print("(" + ", ".join(quoted) + ")")
if __name__ == "__main__":
    # Run only when executed as a script, so importing this module does not
    # parse the command line, read the word list, or exit the process.
    word1, word2 = get_args()
    # Only words with the same length as the inputs are loaded.
    wordlist = read_words("words.txt", len(word1))
    print_list(find_shortest_ladder(word1, word2, wordlist))
|