1234567890123456789012345
" " " "" ) doc = Document(sample) doc.summary() def test_correct_cleanup(self): sample = """Lot of text here.
More text is written here, and contains punctuation and dots.
The comment is also helpful, but it's still not the correct item to be extracted.
It's even longer than the article itself!"
foo" + long_space + "
" doc = Document(sample) s = doc.summary() assert "foo" in s def test_not_self_closing(self): sample = '