hooray for subtle UTF8-is-not-ASCII bugs

This commit is contained in:
Mark Pilgrim
2010-01-04 21:28:57 -05:00
parent ea9e664e80
commit 6782826583
+1 -1
View File
@@ -5,7 +5,7 @@ import time
# get list of chapters
chapters = []
for line in open('index.html'):
for line in open('index.html', encoding="utf-8"):
if not line.count('<li') or not line.count('<a href'):
continue
chapters.append(line.split('<a href=', 1)[1].split('>', 1)[0])