fix: unsuitable segmentation

3 years ago · b768f58c19
1 changed file with 1 addition and 1 deletion
--- a/src/ixsw.la/extract.py
+++ b/src/ixsw.la/extract.py
@@ -23,7 +23,7 @@ def splitHtml(rawHtml: str) -> dict:  # extract from raw html content
    div = '\n'.join(div.prettify().split('\n')[1: -2])
    return {
        'title': '%s %s' % (title[1], title[2].strip()),
-        'content': [x.strip() for x in div.split('<br/>\n <br/>\n')]
+        'content': [x.strip() for x in div.split('\n <br/>\n <br/>') if x.strip() != '']
    }