diff --git a/sources/browser.py b/sources/browser.py index 2cfe47a..a64e5d9 100644 --- a/sources/browser.py +++ b/sources/browser.py @@ -156,6 +156,7 @@ class Browser: element.decompose() + text = soup.get_text() lines = (line.strip() for line in text.splitlines()) chunks = (phrase.strip() for line in lines for phrase in line.split(" ")) text = "\n".join(chunk for chunk in chunks if chunk and self.is_sentence(chunk))