# HG changeset patch
# User Igor Chubin
# Date 1295803099 -3600
# Node ID 4629e08b0d87c2b1a7e18dc83c8345f2446bf94c
# Parent c3a50c0d2400e1a8afe7f6e54d64fdfdf53874da
minifix: skip numbers as words

diff -r c3a50c0d2400 -r 4629e08b0d87 new-words.py
--- a/new-words.py Sun Jan 23 17:09:44 2011 +0100
+++ b/new-words.py Sun Jan 23 18:18:19 2011 +0100
@@ -165,6 +165,8 @@
     for line in lines:
         words = words_from_line(line)
         for word in words:
+            if re.match('[0-9]*$', word):
+                continue
             result.setdefault(word, 0)
             result[word] += 1
     return result