Improved remove_unlikely_candidates following advice from issue #102

pull/87/merge
Yuri Baburov 6 years ago
parent 97e86c4559
commit 537de2b8f6

@@ -395,7 +395,7 @@ class Document:
}
def remove_unlikely_candidates(self):
-for elem in self.html.iter():
+for elem in self.html.findall('.//*'):
s = "%s %s" % (elem.get('class', ''), elem.get('id', ''))
if len(s) < 2:
continue

Loading…
Cancel
Save