Added em dash (U+2014) as a word separator

2021-11-22 21:25:08 +01:00 · 2021-11-22 21:25:08 +01:00 · 357eceabad
parent 1c53c94b9c
commit 357eceabad
1 changed file with 3 additions and 1 deletion
--- a/novel_stats/novel_stats.py
+++ b/novel_stats/novel_stats.py
@@ -4,6 +4,7 @@
 import argparse
 import collections
 import tempfile
+import re
 CHAPTER_MARKER = '## '
 STATUS_MARKER = '[status]: # '
@@ -11,12 +12,13 @@ ACT_MARKER = '[act]: # '
 # Standard markdown comment marker, supported by Pandoc and Calibre's ebook-convert.
 COMMENT_MARKER = '[//]: # '
 TITLE_MARKER = '# '
+WORD_SEPS = [' ','—']
 def count_words(line):
    count = 0
-    for word in line.strip().split(' '):
+    for word in re.split('|'.join(WORD_SEPS), line.strip()):
        if not word.strip() or word == '*' or word.startswith('#'):
            continue