From 737634e7400c3d6f03144a6df08d6b42ce14432f Mon Sep 17 00:00:00 2001
From: OneNewDev
Date: Sat, 28 May 2022 15:33:29 +0200
Subject: [PATCH] ignore digits

---
 tagger.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/tagger.py b/tagger.py
index 63ddabb..299d084 100644
--- a/tagger.py
+++ b/tagger.py
@@ -44,6 +44,8 @@ class FileScanner(HTMLParser):
             score = 10
             if word in EXCLUDED_WORDS:
                 continue
+            if word.isdigit():
+                continue
             if word in title_words:
                 score *= 4
             word_length = len(word)